-
-
Save eduardo4jesus/d8c022d452fdc0e196a55104c6b50a6d to your computer and use it in GitHub Desktop.
Tracing: Confusion with duration of similar `flip` operations
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
{ | |
"schemaVersion": 1, | |
"deviceProperties": [ | |
{ | |
"id": 0, "name": "Tesla P100-PCIE-16GB", "totalGlobalMem": 17071734784, | |
"computeMajor": 6, "computeMinor": 0, | |
"maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, | |
"regsPerBlock": 65536, "regsPerMultiprocessor": 65536, "warpSize": 32, | |
"sharedMemPerBlock": 49152, "sharedMemPerMultiprocessor": 65536, | |
"numSms": 56, "sharedMemPerBlockOptin": 49152 | |
} | |
], | |
"traceEvents": [ | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363535483, "dur": 1560, | |
"args": { | |
"Device": 618, "External id": 31, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363537072, "dur": 5921, | |
"args": { | |
"Device": 618, "External id": 32, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363535467, "dur": 7533, | |
"args": { | |
"Device": 618, "External id": 30, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363543033, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 34, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363543046, "dur": 31, | |
"args": { | |
"Device": 618, "External id": 35, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363543029, "dur": 52, | |
"args": { | |
"Device": 618, "External id": 33, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363543147, "dur": 273, | |
"args": { | |
"Device": 618, "External id": 37, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::fill_", "pid": 618, "tid": "618", | |
"ts": 1624691363543428, "dur": 36, | |
"args": { | |
"Device": 618, "External id": 38, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], []], "Input type": ["float", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363543479, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 41, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363543474, "dur": 16, | |
"args": { | |
"Device": 618, "External id": 40, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::narrow", "pid": 618, "tid": "618", | |
"ts": 1624691363543469, "dur": 22, | |
"args": { | |
"Device": 618, "External id": 39, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363543494, "dur": 36, | |
"args": { | |
"Device": 618, "External id": 42, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [128, 64, 3, 32, 17], []], "Input type": ["float", "float", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::constant_pad_nd", "pid": 618, "tid": "618", | |
"ts": 1624691363543139, "dur": 395, | |
"args": { | |
"Device": 618, "External id": 36, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "GenericList", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363543590, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 44, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363543571, "dur": 28, | |
"args": { | |
"Device": 618, "External id": 43, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363543603, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 46, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363543602, "dur": 9, | |
"args": { | |
"Device": 618, "External id": 45, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363543617, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 48, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363543616, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 47, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363543669, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 50, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363543628, "dur": 48, | |
"args": { | |
"Device": 618, "External id": 49, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363543681, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 52, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363543679, "dur": 19, | |
"args": { | |
"Device": 618, "External id": 51, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363543808, "dur": 192, | |
"args": { | |
"Device": 618, "External id": 55, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363543803, "dur": 202, | |
"args": { | |
"Device": 618, "External id": 54, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363544073, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 57, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363544086, "dur": 5, | |
"args": { | |
"Device": 618, "External id": 58, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363544047, "dur": 44, | |
"args": { | |
"Device": 618, "External id": 56, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363544121, "dur": 187, | |
"args": { | |
"Device": 618, "External id": 60, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363544314, "dur": 209, | |
"args": { | |
"Device": 618, "External id": 61, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363544110, "dur": 423, | |
"args": { | |
"Device": 618, "External id": 59, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363544558, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 63, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363544570, "dur": 33, | |
"args": { | |
"Device": 618, "External id": 64, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363544538, "dur": 73, | |
"args": { | |
"Device": 618, "External id": 62, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363544616, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 66, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363544625, "dur": 23, | |
"args": { | |
"Device": 618, "External id": 67, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363544613, "dur": 37, | |
"args": { | |
"Device": 618, "External id": 65, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363544659, "dur": 13, | |
"args": { | |
"Device": 618, "External id": 69, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363544690, "dur": 28, | |
"args": { | |
"Device": 618, "External id": 70, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [1], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363544654, "dur": 66, | |
"args": { | |
"Device": 618, "External id": 68, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363543770, "dur": 985, | |
"args": { | |
"Device": 618, "External id": 53, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363544776, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 72, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363544772, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 71, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363544785, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 74, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363544784, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 73, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363544791, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 76, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363544790, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 75, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363544797, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 78, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363544795, "dur": 5, | |
"args": { | |
"Device": 618, "External id": 77, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363544803, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 80, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363544802, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 79, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363544807, "dur": 43, | |
"args": { | |
"Device": 618, "External id": 81, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [128, 64, 3, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363544879, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 83, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363544877, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 82, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363544886, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 85, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363544885, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 84, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363544891, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 87, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363544890, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 86, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363544914, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 89, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363544913, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 88, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363544919, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 91, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363544918, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 90, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363544939, "dur": 217, | |
"args": { | |
"Device": 618, "External id": 94, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363544936, "dur": 224, | |
"args": { | |
"Device": 618, "External id": 93, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363545170, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 96, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363545184, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 97, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363545167, "dur": 19, | |
"args": { | |
"Device": 618, "External id": 95, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363545193, "dur": 9, | |
"args": { | |
"Device": 618, "External id": 99, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363545204, "dur": 39, | |
"args": { | |
"Device": 618, "External id": 100, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363545190, "dur": 55, | |
"args": { | |
"Device": 618, "External id": 98, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363545251, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 102, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363545260, "dur": 19, | |
"args": { | |
"Device": 618, "External id": 103, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363545247, "dur": 33, | |
"args": { | |
"Device": 618, "External id": 101, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363545284, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 105, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363545292, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 106, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363545282, "dur": 28, | |
"args": { | |
"Device": 618, "External id": 104, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363545314, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 108, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363545322, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 109, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [2], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363545312, "dur": 28, | |
"args": { | |
"Device": 618, "External id": 107, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363544931, "dur": 434, | |
"args": { | |
"Device": 618, "External id": 92, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363545383, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 111, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363545379, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 110, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363545391, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 113, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363545390, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 112, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363545396, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 115, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363545395, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 114, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363545401, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 117, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363545400, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 116, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363545406, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 119, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363545405, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 118, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363545409, "dur": 26, | |
"args": { | |
"Device": 618, "External id": 120, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [128, 64, 3, 31, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363545471, "dur": 314, | |
"args": { | |
"Device": 618, "External id": 122, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363545807, "dur": 50, | |
"args": { | |
"Device": 618, "External id": 123, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363545468, "dur": 392, | |
"args": { | |
"Device": 618, "External id": 121, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363545883, "dur": 23, | |
"args": { | |
"Device": 618, "External id": 125, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363545908, "dur": 23, | |
"args": { | |
"Device": 618, "External id": 126, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363545880, "dur": 53, | |
"args": { | |
"Device": 618, "External id": 124, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363545979, "dur": 225, | |
"args": { | |
"Device": 618, "External id": 128, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::fill_", "pid": 618, "tid": "618", | |
"ts": 1624691363546209, "dur": 49, | |
"args": { | |
"Device": 618, "External id": 129, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], []], "Input type": ["float", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363546266, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 132, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363546263, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 131, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::narrow", "pid": 618, "tid": "618", | |
"ts": 1624691363546261, "dur": 11, | |
"args": { | |
"Device": 618, "External id": 130, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363546273, "dur": 23, | |
"args": { | |
"Device": 618, "External id": 133, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [128, 64, 3, 32, 17], []], "Input type": ["float", "float", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::constant_pad_nd", "pid": 618, "tid": "618", | |
"ts": 1624691363545974, "dur": 325, | |
"args": { | |
"Device": 618, "External id": 127, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "GenericList", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363546330, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 135, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363546313, "dur": 22, | |
"args": { | |
"Device": 618, "External id": 134, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363546338, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 137, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363546336, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 136, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363546343, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 139, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363546342, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 138, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363546350, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 141, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363546348, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 140, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363546358, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 143, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363546356, "dur": 5, | |
"args": { | |
"Device": 618, "External id": 142, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363546377, "dur": 31, | |
"args": { | |
"Device": 618, "External id": 146, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363546374, "dur": 36, | |
"args": { | |
"Device": 618, "External id": 145, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363546417, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 148, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363546422, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 149, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363546415, "dur": 9, | |
"args": { | |
"Device": 618, "External id": 147, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363546431, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 151, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363546441, "dur": 2900, | |
"args": { | |
"Device": 618, "External id": 152, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363546428, "dur": 2917, | |
"args": { | |
"Device": 618, "External id": 150, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549354, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 154, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363549366, "dur": 26, | |
"args": { | |
"Device": 618, "External id": 155, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363549350, "dur": 44, | |
"args": { | |
"Device": 618, "External id": 153, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549418, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 157, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363549427, "dur": 18, | |
"args": { | |
"Device": 618, "External id": 158, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363549397, "dur": 49, | |
"args": { | |
"Device": 618, "External id": 156, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549451, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 160, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363549485, "dur": 19, | |
"args": { | |
"Device": 618, "External id": 161, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [1], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363549448, "dur": 58, | |
"args": { | |
"Device": 618, "External id": 159, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363546369, "dur": 3163, | |
"args": { | |
"Device": 618, "External id": 144, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549551, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 163, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363549546, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 162, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549559, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 165, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363549557, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 164, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549563, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 167, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363549562, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 166, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549570, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 169, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363549567, "dur": 5, | |
"args": { | |
"Device": 618, "External id": 168, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549575, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 171, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363549574, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 170, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363549579, "dur": 26, | |
"args": { | |
"Device": 618, "External id": 172, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [128, 64, 3, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549619, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 174, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363549617, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 173, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549626, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 176, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363549625, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 175, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549631, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 178, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363549630, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 177, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549635, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 180, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363549634, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 179, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549640, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 182, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363549639, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 181, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363549674, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 185, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363549672, "dur": 16, | |
"args": { | |
"Device": 618, "External id": 184, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363549695, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 187, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363549714, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 188, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363549693, "dur": 22, | |
"args": { | |
"Device": 618, "External id": 186, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549722, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 190, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363549732, "dur": 25, | |
"args": { | |
"Device": 618, "External id": 191, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363549719, "dur": 39, | |
"args": { | |
"Device": 618, "External id": 189, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549763, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 193, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363549775, "dur": 18, | |
"args": { | |
"Device": 618, "External id": 194, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363549761, "dur": 34, | |
"args": { | |
"Device": 618, "External id": 192, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549799, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 196, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363549807, "dur": 31, | |
"args": { | |
"Device": 618, "External id": 197, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363549796, "dur": 43, | |
"args": { | |
"Device": 618, "External id": 195, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549844, "dur": 5, | |
"args": { | |
"Device": 618, "External id": 199, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363549851, "dur": 22, | |
"args": { | |
"Device": 618, "External id": 200, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [2], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363549841, "dur": 34, | |
"args": { | |
"Device": 618, "External id": 198, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363549667, "dur": 230, | |
"args": { | |
"Device": 618, "External id": 183, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549912, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 202, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363549909, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 201, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549919, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 204, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363549918, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 203, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549924, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 206, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363549923, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 205, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549927, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 208, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363549927, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 207, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363549931, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 210, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363549930, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 209, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363549934, "dur": 25, | |
"args": { | |
"Device": 618, "External id": 211, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [128, 64, 3, 31, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363549980, "dur": 22, | |
"args": { | |
"Device": 618, "External id": 213, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363550005, "dur": 28, | |
"args": { | |
"Device": 618, "External id": 214, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363549977, "dur": 58, | |
"args": { | |
"Device": 618, "External id": 212, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363550051, "dur": 5, | |
"args": { | |
"Device": 618, "External id": 216, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363550058, "dur": 21, | |
"args": { | |
"Device": 618, "External id": 217, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363550049, "dur": 31, | |
"args": { | |
"Device": 618, "External id": 215, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363550110, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 219, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::fill_", "pid": 618, "tid": "618", | |
"ts": 1624691363550119, "dur": 20, | |
"args": { | |
"Device": 618, "External id": 220, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], []], "Input type": ["float", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363550145, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 223, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363550143, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 222, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::narrow", "pid": 618, "tid": "618", | |
"ts": 1624691363550141, "dur": 9, | |
"args": { | |
"Device": 618, "External id": 221, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363550151, "dur": 18, | |
"args": { | |
"Device": 618, "External id": 224, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [128, 64, 3, 32, 17], []], "Input type": ["float", "float", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::constant_pad_nd", "pid": 618, "tid": "618", | |
"ts": 1624691363550105, "dur": 67, | |
"args": { | |
"Device": 618, "External id": 218, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "GenericList", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363550184, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 226, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363550182, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 225, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363550190, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 228, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363550189, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 227, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363550196, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 230, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363550195, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 229, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363550202, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 232, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363550200, "dur": 5, | |
"args": { | |
"Device": 618, "External id": 231, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363550207, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 234, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363550206, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 233, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363550228, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 237, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363550226, "dur": 21, | |
"args": { | |
"Device": 618, "External id": 236, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363550253, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 239, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363550257, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 240, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363550252, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 238, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363550280, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 242, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363550288, "dur": 3614, | |
"args": { | |
"Device": 618, "External id": 243, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363550262, "dur": 3644, | |
"args": { | |
"Device": 618, "External id": 241, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363553914, "dur": 9, | |
"args": { | |
"Device": 618, "External id": 245, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363553925, "dur": 24, | |
"args": { | |
"Device": 618, "External id": 246, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363553910, "dur": 56, | |
"args": { | |
"Device": 618, "External id": 244, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363553972, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 248, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363553980, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 249, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363553969, "dur": 30, | |
"args": { | |
"Device": 618, "External id": 247, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554003, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 251, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363554011, "dur": 16, | |
"args": { | |
"Device": 618, "External id": 252, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [1], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363554001, "dur": 27, | |
"args": { | |
"Device": 618, "External id": 250, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363550222, "dur": 3830, | |
"args": { | |
"Device": 618, "External id": 235, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554068, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 254, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554064, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 253, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554084, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 256, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554082, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 255, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554089, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 258, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554088, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 257, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554095, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 260, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363554093, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 259, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554100, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 262, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554099, "dur": 9, | |
"args": { | |
"Device": 618, "External id": 261, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363554109, "dur": 26, | |
"args": { | |
"Device": 618, "External id": 263, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [128, 64, 3, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554149, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 265, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554146, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 264, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554155, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 267, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554154, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 266, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554159, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 269, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554158, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 268, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554163, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 271, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554162, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 270, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554168, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 273, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554167, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 272, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363554184, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 276, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363554182, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 275, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363554197, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 278, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363554201, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 279, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363554196, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 277, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554209, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 281, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363554217, "dur": 28, | |
"args": { | |
"Device": 618, "External id": 282, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363554206, "dur": 41, | |
"args": { | |
"Device": 618, "External id": 280, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554252, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 284, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363554261, "dur": 32, | |
"args": { | |
"Device": 618, "External id": 285, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363554249, "dur": 46, | |
"args": { | |
"Device": 618, "External id": 283, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554299, "dur": 22, | |
"args": { | |
"Device": 618, "External id": 287, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363554323, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 288, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363554297, "dur": 79, | |
"args": { | |
"Device": 618, "External id": 286, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554382, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 290, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363554391, "dur": 18, | |
"args": { | |
"Device": 618, "External id": 291, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [2], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363554378, "dur": 32, | |
"args": { | |
"Device": 618, "External id": 289, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363554177, "dur": 254, | |
"args": { | |
"Device": 618, "External id": 274, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554446, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 293, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554442, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 292, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554452, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 295, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554451, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 294, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554457, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 297, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554456, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 296, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554462, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 299, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554461, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 298, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554466, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 301, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554465, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 300, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363554470, "dur": 24, | |
"args": { | |
"Device": 618, "External id": 302, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [128, 64, 3, 31, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363554515, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 304, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363554524, "dur": 26, | |
"args": { | |
"Device": 618, "External id": 305, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363554512, "dur": 40, | |
"args": { | |
"Device": 618, "External id": 303, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363554566, "dur": 13, | |
"args": { | |
"Device": 618, "External id": 307, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363554581, "dur": 36, | |
"args": { | |
"Device": 618, "External id": 308, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363554564, "dur": 55, | |
"args": { | |
"Device": 618, "External id": 306, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363554668, "dur": 11, | |
"args": { | |
"Device": 618, "External id": 310, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::fill_", "pid": 618, "tid": "618", | |
"ts": 1624691363554683, "dur": 39, | |
"args": { | |
"Device": 618, "External id": 311, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], []], "Input type": ["float", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554731, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 314, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554728, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 313, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::narrow", "pid": 618, "tid": "618", | |
"ts": 1624691363554726, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 312, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363554737, "dur": 20, | |
"args": { | |
"Device": 618, "External id": 315, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [128, 64, 3, 32, 17], []], "Input type": ["float", "float", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::constant_pad_nd", "pid": 618, "tid": "618", | |
"ts": 1624691363554663, "dur": 97, | |
"args": { | |
"Device": 618, "External id": 309, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "GenericList", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554775, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 317, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554772, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 316, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554781, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 319, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554780, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 318, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554786, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 321, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554785, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 320, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554792, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 323, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363554790, "dur": 5, | |
"args": { | |
"Device": 618, "External id": 322, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554797, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 325, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363554796, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 324, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363554814, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 328, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363554812, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 327, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363554828, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 330, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363554832, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 331, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363554826, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 329, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363554840, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 333, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363554850, "dur": 3610, | |
"args": { | |
"Device": 618, "External id": 334, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363554837, "dur": 3626, | |
"args": { | |
"Device": 618, "External id": 332, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558469, "dur": 9, | |
"args": { | |
"Device": 618, "External id": 336, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363558480, "dur": 21, | |
"args": { | |
"Device": 618, "External id": 337, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363558466, "dur": 36, | |
"args": { | |
"Device": 618, "External id": 335, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558507, "dur": 23, | |
"args": { | |
"Device": 618, "External id": 339, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363558532, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 340, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363558504, "dur": 61, | |
"args": { | |
"Device": 618, "External id": 338, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558570, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 342, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363558578, "dur": 31, | |
"args": { | |
"Device": 618, "External id": 343, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [1], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363558567, "dur": 43, | |
"args": { | |
"Device": 618, "External id": 341, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363554807, "dur": 3825, | |
"args": { | |
"Device": 618, "External id": 326, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558647, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 345, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363558644, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 344, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558654, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 347, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363558653, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 346, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558659, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 349, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363558658, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 348, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558665, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 351, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363558663, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 350, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558670, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 353, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363558669, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 352, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363558674, "dur": 38, | |
"args": { | |
"Device": 618, "External id": 354, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [128, 64, 3, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558725, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 356, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363558722, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 355, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558731, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 358, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363558730, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 357, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558735, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 360, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363558734, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 359, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558739, "dur": 52, | |
"args": { | |
"Device": 618, "External id": 362, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363558738, "dur": 55, | |
"args": { | |
"Device": 618, "External id": 361, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558797, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 364, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363558795, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 363, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363558830, "dur": 22, | |
"args": { | |
"Device": 618, "External id": 367, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363558828, "dur": 26, | |
"args": { | |
"Device": 618, "External id": 366, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363558859, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 369, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363558863, "dur": 9, | |
"args": { | |
"Device": 618, "External id": 370, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363558858, "dur": 15, | |
"args": { | |
"Device": 618, "External id": 368, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558880, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 372, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363558889, "dur": 38, | |
"args": { | |
"Device": 618, "External id": 373, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363558877, "dur": 52, | |
"args": { | |
"Device": 618, "External id": 371, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558934, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 375, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363558942, "dur": 18, | |
"args": { | |
"Device": 618, "External id": 376, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363558931, "dur": 30, | |
"args": { | |
"Device": 618, "External id": 374, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558966, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 378, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363558973, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 379, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363558963, "dur": 28, | |
"args": { | |
"Device": 618, "External id": 377, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363558996, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 381, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363559003, "dur": 15, | |
"args": { | |
"Device": 618, "External id": 382, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [2], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363558993, "dur": 27, | |
"args": { | |
"Device": 618, "External id": 380, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363558824, "dur": 216, | |
"args": { | |
"Device": 618, "External id": 365, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363559054, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 384, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363559050, "dur": 23, | |
"args": { | |
"Device": 618, "External id": 383, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363559076, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 386, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363559075, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 385, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363559080, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 388, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363559079, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 387, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363559084, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 390, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363559083, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 389, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363559089, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 392, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363559088, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 391, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363559092, "dur": 37, | |
"args": { | |
"Device": 618, "External id": 393, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [128, 64, 3, 31, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363559165, "dur": 21, | |
"args": { | |
"Device": 618, "External id": 395, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363559189, "dur": 24, | |
"args": { | |
"Device": 618, "External id": 396, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363559162, "dur": 52, | |
"args": { | |
"Device": 618, "External id": 394, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363559228, "dur": 14, | |
"args": { | |
"Device": 618, "External id": 398, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363559244, "dur": 22, | |
"args": { | |
"Device": 618, "External id": 399, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363559227, "dur": 41, | |
"args": { | |
"Device": 618, "External id": 397, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363559312, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 401, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::fill_", "pid": 618, "tid": "618", | |
"ts": 1624691363559321, "dur": 19, | |
"args": { | |
"Device": 618, "External id": 402, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], []], "Input type": ["float", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363559347, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 405, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363559345, "dur": 5, | |
"args": { | |
"Device": 618, "External id": 404, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::narrow", "pid": 618, "tid": "618", | |
"ts": 1624691363559343, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 403, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363559353, "dur": 19, | |
"args": { | |
"Device": 618, "External id": 406, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [128, 64, 3, 32, 17], []], "Input type": ["float", "float", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::constant_pad_nd", "pid": 618, "tid": "618", | |
"ts": 1624691363559308, "dur": 66, | |
"args": { | |
"Device": 618, "External id": 400, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "GenericList", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363559387, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 408, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363559385, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 407, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363559409, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 410, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363559407, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 409, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363559414, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 412, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363559413, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 411, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363559420, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 414, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363559418, "dur": 13, | |
"args": { | |
"Device": 618, "External id": 413, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363559434, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 416, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363559432, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 415, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363559464, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 419, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363559462, "dur": 11, | |
"args": { | |
"Device": 618, "External id": 418, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363559478, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 421, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363559483, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 422, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363559477, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 420, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363559491, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 424, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363559500, "dur": 3551, | |
"args": { | |
"Device": 618, "External id": 425, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363559488, "dur": 3565, | |
"args": { | |
"Device": 618, "External id": 423, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563059, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 427, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363563069, "dur": 20, | |
"args": { | |
"Device": 618, "External id": 428, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363563056, "dur": 34, | |
"args": { | |
"Device": 618, "External id": 426, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563095, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 430, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363563103, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 431, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363563092, "dur": 29, | |
"args": { | |
"Device": 618, "External id": 429, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563126, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 433, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363563149, "dur": 28, | |
"args": { | |
"Device": 618, "External id": 434, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [1], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363563124, "dur": 54, | |
"args": { | |
"Device": 618, "External id": 432, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363559458, "dur": 3758, | |
"args": { | |
"Device": 618, "External id": 417, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563252, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 436, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563248, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 435, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563260, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 438, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563259, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 437, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563265, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 440, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563264, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 439, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563271, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 442, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363563269, "dur": 5, | |
"args": { | |
"Device": 618, "External id": 441, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563276, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 444, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563275, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 443, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363563287, "dur": 27, | |
"args": { | |
"Device": 618, "External id": 445, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [128, 64, 3, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563328, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 447, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563325, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 446, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563334, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 449, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563333, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 448, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563338, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 451, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563337, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 450, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563342, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 453, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563341, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 452, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563345, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 455, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563344, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 454, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363563361, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 458, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363563359, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 457, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363563374, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 460, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363563378, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 461, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363563372, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 459, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563385, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 463, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363563394, "dur": 23, | |
"args": { | |
"Device": 618, "External id": 464, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363563382, "dur": 37, | |
"args": { | |
"Device": 618, "External id": 462, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563424, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 466, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363563432, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 467, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363563421, "dur": 29, | |
"args": { | |
"Device": 618, "External id": 465, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563454, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 469, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363563462, "dur": 40, | |
"args": { | |
"Device": 618, "External id": 470, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363563452, "dur": 52, | |
"args": { | |
"Device": 618, "External id": 468, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563509, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 472, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363563517, "dur": 16, | |
"args": { | |
"Device": 618, "External id": 473, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [2], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363563506, "dur": 29, | |
"args": { | |
"Device": 618, "External id": 471, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363563355, "dur": 199, | |
"args": { | |
"Device": 618, "External id": 456, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563567, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 475, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563564, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 474, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563574, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 477, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563573, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 476, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563578, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 479, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563577, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 478, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563582, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 481, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563581, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 480, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563586, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 483, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563585, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 482, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363563589, "dur": 38, | |
"args": { | |
"Device": 618, "External id": 484, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [128, 64, 3, 31, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363563647, "dur": 25, | |
"args": { | |
"Device": 618, "External id": 486, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363563674, "dur": 54, | |
"args": { | |
"Device": 618, "External id": 487, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363563644, "dur": 86, | |
"args": { | |
"Device": 618, "External id": 485, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363563766, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 489, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363563775, "dur": 22, | |
"args": { | |
"Device": 618, "External id": 490, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363563763, "dur": 35, | |
"args": { | |
"Device": 618, "External id": 488, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363563827, "dur": 22, | |
"args": { | |
"Device": 618, "External id": 492, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::fill_", "pid": 618, "tid": "618", | |
"ts": 1624691363563852, "dur": 20, | |
"args": { | |
"Device": 618, "External id": 493, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], []], "Input type": ["float", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563878, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 496, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563876, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 495, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::narrow", "pid": 618, "tid": "618", | |
"ts": 1624691363563874, "dur": 9, | |
"args": { | |
"Device": 618, "External id": 494, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363563885, "dur": 19, | |
"args": { | |
"Device": 618, "External id": 497, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [128, 64, 3, 32, 17], []], "Input type": ["float", "float", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::constant_pad_nd", "pid": 618, "tid": "618", | |
"ts": 1624691363563823, "dur": 84, | |
"args": { | |
"Device": 618, "External id": 491, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "GenericList", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563920, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 499, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563917, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 498, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563927, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 501, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563926, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 500, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563935, "dur": 15, | |
"args": { | |
"Device": 618, "External id": 503, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563933, "dur": 19, | |
"args": { | |
"Device": 618, "External id": 502, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563956, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 505, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363563954, "dur": 5, | |
"args": { | |
"Device": 618, "External id": 504, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363563961, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 507, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363563961, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 506, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363563977, "dur": 22, | |
"args": { | |
"Device": 618, "External id": 510, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363563975, "dur": 25, | |
"args": { | |
"Device": 618, "External id": 509, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363564006, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 512, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363564010, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 513, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363564004, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 511, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363564018, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 515, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363564027, "dur": 3585, | |
"args": { | |
"Device": 618, "External id": 516, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363564015, "dur": 3599, | |
"args": { | |
"Device": 618, "External id": 514, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363567621, "dur": 31, | |
"args": { | |
"Device": 618, "External id": 518, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363567654, "dur": 21, | |
"args": { | |
"Device": 618, "External id": 519, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363567618, "dur": 58, | |
"args": { | |
"Device": 618, "External id": 517, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363567682, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 521, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363567690, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 522, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363567678, "dur": 30, | |
"args": { | |
"Device": 618, "External id": 520, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363567713, "dur": 16, | |
"args": { | |
"Device": 618, "External id": 524, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363567747, "dur": 20, | |
"args": { | |
"Device": 618, "External id": 525, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [1], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363567710, "dur": 59, | |
"args": { | |
"Device": 618, "External id": 523, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363563971, "dur": 3820, | |
"args": { | |
"Device": 618, "External id": 508, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363567807, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 527, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363567803, "dur": 9, | |
"args": { | |
"Device": 618, "External id": 526, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363567814, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 529, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363567813, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 528, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363567819, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 531, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363567818, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 530, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363567824, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 533, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363567822, "dur": 5, | |
"args": { | |
"Device": 618, "External id": 532, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363567829, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 535, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363567828, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 534, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363567833, "dur": 22, | |
"args": { | |
"Device": 618, "External id": 536, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [128, 64, 3, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363567868, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 538, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363567866, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 537, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363567874, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 540, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363567873, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 539, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363567878, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 542, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363567877, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 541, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363567984, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 544, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363567971, "dur": 16, | |
"args": { | |
"Device": 618, "External id": 543, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363567989, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 546, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363567988, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 545, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363568007, "dur": 18, | |
"args": { | |
"Device": 618, "External id": 549, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363568005, "dur": 21, | |
"args": { | |
"Device": 618, "External id": 548, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363568032, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 551, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363568036, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 552, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363568031, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 550, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568044, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 554, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363568053, "dur": 24, | |
"args": { | |
"Device": 618, "External id": 555, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363568041, "dur": 37, | |
"args": { | |
"Device": 618, "External id": 553, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568084, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 557, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363568091, "dur": 18, | |
"args": { | |
"Device": 618, "External id": 558, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363568081, "dur": 29, | |
"args": { | |
"Device": 618, "External id": 556, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568115, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 560, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363568123, "dur": 16, | |
"args": { | |
"Device": 618, "External id": 561, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363568112, "dur": 29, | |
"args": { | |
"Device": 618, "External id": 559, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568145, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 563, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363568152, "dur": 16, | |
"args": { | |
"Device": 618, "External id": 564, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [2], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363568143, "dur": 26, | |
"args": { | |
"Device": 618, "External id": 562, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363568001, "dur": 188, | |
"args": { | |
"Device": 618, "External id": 547, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568203, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 566, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363568200, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 565, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568210, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 568, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363568209, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 567, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568215, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 570, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363568214, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 569, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568219, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 572, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363568218, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 571, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568223, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 574, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363568222, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 573, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363568226, "dur": 47, | |
"args": { | |
"Device": 618, "External id": 575, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [128, 64, 3, 31, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363568318, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 577, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363568328, "dur": 25, | |
"args": { | |
"Device": 618, "External id": 578, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363568315, "dur": 39, | |
"args": { | |
"Device": 618, "External id": 576, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363568369, "dur": 5, | |
"args": { | |
"Device": 618, "External id": 580, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363568376, "dur": 20, | |
"args": { | |
"Device": 618, "External id": 581, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363568367, "dur": 30, | |
"args": { | |
"Device": 618, "External id": 579, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363568437, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 583, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::fill_", "pid": 618, "tid": "618", | |
"ts": 1624691363568446, "dur": 19, | |
"args": { | |
"Device": 618, "External id": 584, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], []], "Input type": ["float", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568471, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 587, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363568469, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 586, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::narrow", "pid": 618, "tid": "618", | |
"ts": 1624691363568467, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 585, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363568477, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 588, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [128, 64, 3, 32, 17], []], "Input type": ["float", "float", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::constant_pad_nd", "pid": 618, "tid": "618", | |
"ts": 1624691363568434, "dur": 63, | |
"args": { | |
"Device": 618, "External id": 582, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "GenericList", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568509, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 590, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363568507, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 589, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568516, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 592, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363568515, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 591, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568528, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 594, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363568520, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 593, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568535, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 596, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363568533, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 595, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568539, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 598, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363568538, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 597, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363568554, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 601, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363568552, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 600, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363568576, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 603, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363568580, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 604, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363568566, "dur": 16, | |
"args": { | |
"Device": 618, "External id": 602, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363568589, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 606, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363568598, "dur": 3643, | |
"args": { | |
"Device": 618, "External id": 607, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363568586, "dur": 3657, | |
"args": { | |
"Device": 618, "External id": 605, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572251, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 609, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363572261, "dur": 23, | |
"args": { | |
"Device": 618, "External id": 610, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363572247, "dur": 38, | |
"args": { | |
"Device": 618, "External id": 608, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572290, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 612, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363572298, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 613, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363572287, "dur": 29, | |
"args": { | |
"Device": 618, "External id": 611, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572320, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 615, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363572328, "dur": 16, | |
"args": { | |
"Device": 618, "External id": 616, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [1], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363572318, "dur": 27, | |
"args": { | |
"Device": 618, "External id": 614, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363568548, "dur": 3819, | |
"args": { | |
"Device": 618, "External id": 599, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572383, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 618, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572380, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 617, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572391, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 620, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572389, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 619, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572395, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 622, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572394, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 621, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572401, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 624, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363572399, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 623, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572406, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 626, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572405, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 625, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363572409, "dur": 38, | |
"args": { | |
"Device": 618, "External id": 627, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [128, 64, 3, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572460, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 629, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572458, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 628, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572466, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 631, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572465, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 630, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572478, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 633, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572477, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 632, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572482, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 635, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572481, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 634, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572486, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 637, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572485, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 636, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363572502, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 640, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363572500, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 639, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363572515, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 642, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363572519, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 643, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363572514, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 641, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572526, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 645, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363572534, "dur": 23, | |
"args": { | |
"Device": 618, "External id": 646, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363572524, "dur": 35, | |
"args": { | |
"Device": 618, "External id": 644, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572564, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 648, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363572572, "dur": 16, | |
"args": { | |
"Device": 618, "External id": 649, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363572561, "dur": 28, | |
"args": { | |
"Device": 618, "External id": 647, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572593, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 651, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363572601, "dur": 16, | |
"args": { | |
"Device": 618, "External id": 652, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363572591, "dur": 27, | |
"args": { | |
"Device": 618, "External id": 650, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572622, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 654, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363572629, "dur": 29, | |
"args": { | |
"Device": 618, "External id": 655, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [2], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363572620, "dur": 40, | |
"args": { | |
"Device": 618, "External id": 653, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363572496, "dur": 185, | |
"args": { | |
"Device": 618, "External id": 638, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572695, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 657, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572692, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 656, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572702, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 659, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572701, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 658, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572707, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 661, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572706, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 660, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572711, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 663, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572710, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 662, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572715, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 665, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572714, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 664, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363572718, "dur": 23, | |
"args": { | |
"Device": 618, "External id": 666, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [128, 64, 3, 31, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363572777, "dur": 14, | |
"args": { | |
"Device": 618, "External id": 668, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363572794, "dur": 25, | |
"args": { | |
"Device": 618, "External id": 669, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363572774, "dur": 47, | |
"args": { | |
"Device": 618, "External id": 667, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363572836, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 671, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::random_", "pid": 618, "tid": "618", | |
"ts": 1624691363572843, "dur": 20, | |
"args": { | |
"Device": 618, "External id": 672, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "Int", "Int", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::randint", "pid": 618, "tid": "618", | |
"ts": 1624691363572834, "dur": 30, | |
"args": { | |
"Device": 618, "External id": 670, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], [], []], "Input type": ["Int", "GenericList", "", "Int", "Int", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363572891, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 674, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::fill_", "pid": 618, "tid": "618", | |
"ts": 1624691363572900, "dur": 19, | |
"args": { | |
"Device": 618, "External id": 675, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], []], "Input type": ["float", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572925, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 678, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572923, "dur": 5, | |
"args": { | |
"Device": 618, "External id": 677, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::narrow", "pid": 618, "tid": "618", | |
"ts": 1624691363572921, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 676, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "Int", "Int", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363572930, "dur": 19, | |
"args": { | |
"Device": 618, "External id": 679, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [128, 64, 3, 32, 17], []], "Input type": ["float", "float", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::constant_pad_nd", "pid": 618, "tid": "618", | |
"ts": 1624691363572887, "dur": 64, | |
"args": { | |
"Device": 618, "External id": 673, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "GenericList", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572963, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 681, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572961, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 680, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572969, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 683, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572968, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 682, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572982, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 685, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572981, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 684, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572988, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 687, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363572986, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 686, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363572993, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 689, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363572992, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 688, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363573008, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 692, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363573006, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 691, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363573022, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 694, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363573026, "dur": 15, | |
"args": { | |
"Device": 618, "External id": 695, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363573021, "dur": 21, | |
"args": { | |
"Device": 618, "External id": 693, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363573049, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 697, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363573057, "dur": 3599, | |
"args": { | |
"Device": 618, "External id": 698, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363573046, "dur": 3613, | |
"args": { | |
"Device": 618, "External id": 696, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363576667, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 700, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363576677, "dur": 22, | |
"args": { | |
"Device": 618, "External id": 701, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363576662, "dur": 38, | |
"args": { | |
"Device": 618, "External id": 699, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363576705, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 703, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363576713, "dur": 17, | |
"args": { | |
"Device": 618, "External id": 704, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [4], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363576702, "dur": 29, | |
"args": { | |
"Device": 618, "External id": 702, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[4], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363576764, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 706, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363576772, "dur": 42, | |
"args": { | |
"Device": 618, "External id": 707, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [1], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363576761, "dur": 56, | |
"args": { | |
"Device": 618, "External id": 705, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[1], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363573002, "dur": 3838, | |
"args": { | |
"Device": 618, "External id": 690, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363576856, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 709, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363576853, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 708, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363576864, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 711, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363576863, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 710, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363576869, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 713, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363576868, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 712, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363576875, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 715, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::select", "pid": 618, "tid": "618", | |
"ts": 1624691363576873, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 714, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], []], "Input type": ["float", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363576880, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 717, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363576879, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 716, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363576883, "dur": 25, | |
"args": { | |
"Device": 618, "External id": 718, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 15], [128, 64, 3, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363576922, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 720, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363576919, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 719, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363576928, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 722, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363576927, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 721, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363576932, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 724, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363576931, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 723, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363576937, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 726, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363576936, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 725, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363576941, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 728, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363576940, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 727, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 17], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363576956, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 731, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "Int", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_like", "pid": 618, "tid": "618", | |
"ts": 1624691363576954, "dur": 10, | |
"args": { | |
"Device": 618, "External id": 730, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [], [], [], [], []], "Input type": ["float", "", "", "", "", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty", "pid": 618, "tid": "618", | |
"ts": 1624691363576969, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 733, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "Int", "", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zero_", "pid": 618, "tid": "618", | |
"ts": 1624691363576973, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 734, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5]], "Input type": ["long int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::zeros", "pid": 618, "tid": "618", | |
"ts": 1624691363576968, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 732, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], []], "Input type": ["GenericList", "Int", "", "", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363576981, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 736, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363576989, "dur": 24, | |
"args": { | |
"Device": 618, "External id": 737, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363576978, "dur": 37, | |
"args": { | |
"Device": 618, "External id": 735, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363577020, "dur": 19, | |
"args": { | |
"Device": 618, "External id": 739, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363577040, "dur": 19, | |
"args": { | |
"Device": 618, "External id": 740, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363577017, "dur": 44, | |
"args": { | |
"Device": 618, "External id": 738, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363577065, "dur": 7, | |
"args": { | |
"Device": 618, "External id": 742, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363577073, "dur": 32, | |
"args": { | |
"Device": 618, "External id": 743, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [5], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363577063, "dur": 43, | |
"args": { | |
"Device": 618, "External id": 741, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[5], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::empty_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363577110, "dur": 6, | |
"args": { | |
"Device": 618, "External id": 745, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[], [], [], [], [], []], "Input type": ["GenericList", "GenericList", "Int", "Int", "", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363577117, "dur": 16, | |
"args": { | |
"Device": 618, "External id": 746, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [2], []], "Input type": ["long int", "long int", "Bool"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::to", "pid": 618, "tid": "618", | |
"ts": 1624691363577108, "dur": 26, | |
"args": { | |
"Device": 618, "External id": 744, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[2], [], [], [], [], [], [], []], "Input type": ["long int", "Int", "Int", "", "", "Bool", "Bool", ""] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::flip", "pid": 618, "tid": "618", | |
"ts": 1624691363576950, "dur": 204, | |
"args": { | |
"Device": 618, "External id": 729, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], []], "Input type": ["float", "GenericList"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363577168, "dur": 2, | |
"args": { | |
"Device": 618, "External id": 748, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363577164, "dur": 8, | |
"args": { | |
"Device": 618, "External id": 747, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363577175, "dur": 0, | |
"args": { | |
"Device": 618, "External id": 750, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363577173, "dur": 4, | |
"args": { | |
"Device": 618, "External id": 749, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363577179, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 752, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363577178, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 751, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363577183, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 754, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363577182, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 753, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 32, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::as_strided", "pid": 618, "tid": "618", | |
"ts": 1624691363577187, "dur": 1, | |
"args": { | |
"Device": 618, "External id": 756, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], []], "Input type": ["float", "GenericList", "GenericList", "Int"] | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::slice", "pid": 618, "tid": "618", | |
"ts": 1624691363577186, "dur": 3, | |
"args": { | |
"Device": 618, "External id": 755, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 32], [], [], [], []], "Input type": ["float", "Int", "Int", "Int", "Int"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Operator", | |
"name": "aten::copy_", "pid": 618, "tid": "618", | |
"ts": 1624691363577190, "dur": 23, | |
"args": { | |
"Device": 618, "External id": 757, | |
"Trace name": "PyTorch Profiler", "Trace iteration": 0 , | |
"Input Dims": [[128, 64, 3, 31, 15], [128, 64, 3, 31, 15], []], "Input type": ["float", "float", "Bool"], "Fwd thread id": 0, "Sequence number": 0 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMalloc", "pid": 618, "tid": "618", | |
"ts": 1624691363536484, "dur": 536, | |
"args": { | |
"cbid": 20, "correlation": 118, | |
"external id": 31, "external ts": 1624691363535483 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363542981, "dur": 335, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 125, "external id": 32, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 125, "pid": 0, "tid": "stream 7", "ts": 1624691363542981, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363537125, "dur": 5859, | |
"args": { | |
"cbid": 211, "correlation": 125, | |
"external id": 32, "external ts": 1624691363537072 | |
} | |
}, | |
{ | |
"ph": "s", "id": 125, "pid": 618, "tid": 618, "ts": 1624691363537125, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363543317, "dur": 334, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 136, "external id": 35, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 136, "pid": 0, "tid": "stream 7", "ts": 1624691363543317, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363543059, "dur": 16, | |
"args": { | |
"cbid": 211, "correlation": 136, | |
"external id": 35, "external ts": 1624691363543046 | |
} | |
}, | |
{ | |
"ph": "s", "id": 136, "pid": 618, "tid": 618, "ts": 1624691363543059, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMalloc", "pid": 618, "tid": "618", | |
"ts": 1624691363543154, "dur": 257, | |
"args": { | |
"cbid": 20, "correlation": 142, | |
"external id": 37, "external ts": 1624691363543147 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::vectorized_elementwise_kernel<4, at::native::FillFunctor<float>, at::detail::Array<char*, 1> >(int, at::native::FillFunctor<float>, at::detail::Array<char*, 1>)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363543652, "dur": 184, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 146, "external id": 38, | |
"registers per thread": 8, | |
"shared memory": 0, | |
"blocks per SM": 1755.4286, | |
"warps per SM": 3510.8572, | |
"grid": [98304, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 146, "pid": 0, "tid": "stream 7", "ts": 1624691363543652, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363543440, "dur": 21, | |
"args": { | |
"cbid": 211, "correlation": 146, | |
"external id": 38, "external ts": 1624691363543428 | |
} | |
}, | |
{ | |
"ph": "s", "id": 146, "pid": 618, "tid": 618, "ts": 1624691363543440, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363543838, "dur": 405, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 151, "external id": 42, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 932.5714, | |
"warps per SM": 1865.1428, | |
"grid": [52224, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 151, "pid": 0, "tid": "stream 7", "ts": 1624691363543838, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363543511, "dur": 15, | |
"args": { | |
"cbid": 211, "correlation": 151, | |
"external id": 42, "external ts": 1624691363543494 | |
} | |
}, | |
{ | |
"ph": "s", "id": 151, "pid": 618, "tid": 618, "ts": 1624691363543511, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMalloc", "pid": 618, "tid": "618", | |
"ts": 1624691363543815, "dur": 176, | |
"args": { | |
"cbid": 20, "correlation": 161, | |
"external id": 55, "external ts": 1624691363543808 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMalloc", "pid": 618, "tid": "618", | |
"ts": 1624691363544136, "dur": 162, | |
"args": { | |
"cbid": 20, "correlation": 171, | |
"external id": 60, "external ts": 1624691363544121 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363544516, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 176, "external id": 61, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.019230769230769232 | |
} | |
}, | |
{ | |
"ph": "f", "id": 176, "pid": 0, "tid": "stream 7", "ts": 1624691363544516, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363544324, "dur": 189, | |
"args": { | |
"cbid": 41, "correlation": 176, | |
"external id": 61, "external ts": 1624691363544314 | |
} | |
}, | |
{ | |
"ph": "s", "id": 176, "pid": 618, "tid": 618, "ts": 1624691363544324, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363544514, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 177, | |
"external id": 61, "external ts": 1624691363544314 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363544587, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 189, "external id": 64, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02702702702702703 | |
} | |
}, | |
{ | |
"ph": "f", "id": 189, "pid": 0, "tid": "stream 7", "ts": 1624691363544587, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363544575, "dur": 8, | |
"args": { | |
"cbid": 41, "correlation": 189, | |
"external id": 64, "external ts": 1624691363544570 | |
} | |
}, | |
{ | |
"ph": "s", "id": 189, "pid": 618, "tid": 618, "ts": 1624691363544575, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363544599, "dur": 3, | |
"args": { | |
"cbid": 131, "correlation": 190, | |
"external id": 64, "external ts": 1624691363544570 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363544640, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 202, "external id": 67, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02702702702702703 | |
} | |
}, | |
{ | |
"ph": "f", "id": 202, "pid": 0, "tid": "stream 7", "ts": 1624691363544640, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363544629, "dur": 8, | |
"args": { | |
"cbid": 41, "correlation": 202, | |
"external id": 67, "external ts": 1624691363544625 | |
} | |
}, | |
{ | |
"ph": "s", "id": 202, "pid": 618, "tid": 618, "ts": 1624691363544629, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363544638, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 203, | |
"external id": 67, "external ts": 1624691363544625 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363544711, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 215, "external id": 70, | |
"bytes": 8, "memory bandwidth (GB/s)": 0.005555555555555556 | |
} | |
}, | |
{ | |
"ph": "f", "id": 215, "pid": 0, "tid": "stream 7", "ts": 1624691363544711, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363544698, "dur": 9, | |
"args": { | |
"cbid": 41, "correlation": 215, | |
"external id": 70, "external ts": 1624691363544690 | |
} | |
}, | |
{ | |
"ph": "s", "id": 215, "pid": 618, "tid": 618, "ts": 1624691363544698, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363544708, "dur": 8, | |
"args": { | |
"cbid": 131, "correlation": 216, | |
"external id": 70, "external ts": 1624691363544690 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363544747, "dur": 59, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 218, "external id": 53, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 12.857142, | |
"warps per SM": 205.71428, | |
"grid": [720, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 218, "pid": 0, "tid": "stream 7", "ts": 1624691363544747, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363544724, "dur": 21, | |
"args": { | |
"cbid": 211, "correlation": 218, | |
"external id": 53, "external ts": 1624691363543770 | |
} | |
}, | |
{ | |
"ph": "s", "id": 218, "pid": 618, "tid": 618, "ts": 1624691363544724, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363544842, "dur": 17, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 224, "external id": 81, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 25.714285, | |
"warps per SM": 51.42857, | |
"grid": [1440, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 80 | |
} | |
}, | |
{ | |
"ph": "f", "id": 224, "pid": 0, "tid": "stream 7", "ts": 1624691363544842, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363544826, "dur": 14, | |
"args": { | |
"cbid": 211, "correlation": 224, | |
"external id": 81, "external ts": 1624691363544807 | |
} | |
}, | |
{ | |
"ph": "s", "id": 224, "pid": 618, "tid": 618, "ts": 1624691363544826, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMalloc", "pid": 618, "tid": "618", | |
"ts": 1624691363544947, "dur": 185, | |
"args": { | |
"cbid": 20, "correlation": 235, | |
"external id": 94, "external ts": 1624691363544939 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363545226, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 248, "external id": 100, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.03205128205128205 | |
} | |
}, | |
{ | |
"ph": "f", "id": 248, "pid": 0, "tid": "stream 7", "ts": 1624691363545226, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363545211, "dur": 12, | |
"args": { | |
"cbid": 41, "correlation": 248, | |
"external id": 100, "external ts": 1624691363545204 | |
} | |
}, | |
{ | |
"ph": "s", "id": 248, "pid": 618, "tid": 618, "ts": 1624691363545211, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363545223, "dur": 8, | |
"args": { | |
"cbid": 131, "correlation": 249, | |
"external id": 100, "external ts": 1624691363545204 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363545274, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 261, "external id": 103, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.033783783783783786 | |
} | |
}, | |
{ | |
"ph": "f", "id": 261, "pid": 0, "tid": "stream 7", "ts": 1624691363545274, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363545264, "dur": 6, | |
"args": { | |
"cbid": 41, "correlation": 261, | |
"external id": 103, "external ts": 1624691363545260 | |
} | |
}, | |
{ | |
"ph": "s", "id": 261, "pid": 618, "tid": 618, "ts": 1624691363545264, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363545271, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 262, | |
"external id": 103, "external ts": 1624691363545260 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363545304, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 274, "external id": 106, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.033783783783783786 | |
} | |
}, | |
{ | |
"ph": "f", "id": 274, "pid": 0, "tid": "stream 7", "ts": 1624691363545304, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363545296, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 274, | |
"external id": 106, "external ts": 1624691363545292 | |
} | |
}, | |
{ | |
"ph": "s", "id": 274, "pid": 618, "tid": 618, "ts": 1624691363545296, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363545301, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 275, | |
"external id": 106, "external ts": 1624691363545292 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363545333, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 287, "external id": 109, | |
"bytes": 16, "memory bandwidth (GB/s)": 0.013513513513513514 | |
} | |
}, | |
{ | |
"ph": "f", "id": 287, "pid": 0, "tid": "stream 7", "ts": 1624691363545333, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363545325, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 287, | |
"external id": 109, "external ts": 1624691363545322 | |
} | |
}, | |
{ | |
"ph": "s", "id": 287, "pid": 618, "tid": 618, "ts": 1624691363545325, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363545330, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 288, | |
"external id": 109, "external ts": 1624691363545322 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363545358, "dur": 2284, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 290, "external id": 92, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 398.57144, | |
"warps per SM": 6377.143, | |
"grid": [22320, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 290, "pid": 0, "tid": "stream 7", "ts": 1624691363545358, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363545343, "dur": 14, | |
"args": { | |
"cbid": 211, "correlation": 290, | |
"external id": 92, "external ts": 1624691363544931 | |
} | |
}, | |
{ | |
"ph": "s", "id": 290, "pid": 618, "tid": 618, "ts": 1624691363545343, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363547644, "dur": 417, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 296, "external id": 120, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 797.1429, | |
"warps per SM": 1594.2858, | |
"grid": [44640, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 296, "pid": 0, "tid": "stream 7", "ts": 1624691363547644, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363545419, "dur": 12, | |
"args": { | |
"cbid": 211, "correlation": 296, | |
"external id": 120, "external ts": 1624691363545409 | |
} | |
}, | |
{ | |
"ph": "s", "id": 296, "pid": 618, "tid": 618, "ts": 1624691363545419, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMalloc", "pid": 618, "tid": "618", | |
"ts": 1624691363545478, "dur": 297, | |
"args": { | |
"cbid": 20, "correlation": 304, | |
"external id": 122, "external ts": 1624691363545471 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363548062, "dur": 336, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 311, "external id": 123, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 311, "pid": 0, "tid": "stream 7", "ts": 1624691363548062, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363545820, "dur": 33, | |
"args": { | |
"cbid": 211, "correlation": 311, | |
"external id": 123, "external ts": 1624691363545807 | |
} | |
}, | |
{ | |
"ph": "s", "id": 311, "pid": 618, "tid": 618, "ts": 1624691363545820, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363548399, "dur": 336, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 322, "external id": 126, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 322, "pid": 0, "tid": "stream 7", "ts": 1624691363548399, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363545916, "dur": 12, | |
"args": { | |
"cbid": 211, "correlation": 322, | |
"external id": 126, "external ts": 1624691363545908 | |
} | |
}, | |
{ | |
"ph": "s", "id": 322, "pid": 618, "tid": 618, "ts": 1624691363545916, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMalloc", "pid": 618, "tid": "618", | |
"ts": 1624691363545986, "dur": 210, | |
"args": { | |
"cbid": 20, "correlation": 328, | |
"external id": 128, "external ts": 1624691363545979 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::vectorized_elementwise_kernel<4, at::native::FillFunctor<float>, at::detail::Array<char*, 1> >(int, at::native::FillFunctor<float>, at::detail::Array<char*, 1>)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363548737, "dur": 184, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 332, "external id": 129, | |
"registers per thread": 8, | |
"shared memory": 0, | |
"blocks per SM": 1755.4286, | |
"warps per SM": 3510.8572, | |
"grid": [98304, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 332, "pid": 0, "tid": "stream 7", "ts": 1624691363548737, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363546218, "dur": 36, | |
"args": { | |
"cbid": 211, "correlation": 332, | |
"external id": 129, "external ts": 1624691363546209 | |
} | |
}, | |
{ | |
"ph": "s", "id": 332, "pid": 618, "tid": 618, "ts": 1624691363546218, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363548922, "dur": 405, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 337, "external id": 133, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 932.5714, | |
"warps per SM": 1865.1428, | |
"grid": [52224, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 337, "pid": 0, "tid": "stream 7", "ts": 1624691363548922, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363546283, "dur": 10, | |
"args": { | |
"cbid": 211, "correlation": 337, | |
"external id": 133, "external ts": 1624691363546273 | |
} | |
}, | |
{ | |
"ph": "s", "id": 337, "pid": 618, "tid": 618, "ts": 1624691363546283, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363549329, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 358, "external id": 152, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.019230769230769232 | |
} | |
}, | |
{ | |
"ph": "f", "id": 358, "pid": 0, "tid": "stream 7", "ts": 1624691363549329, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363546447, "dur": 13, | |
"args": { | |
"cbid": 41, "correlation": 358, | |
"external id": 152, "external ts": 1624691363546441 | |
} | |
}, | |
{ | |
"ph": "s", "id": 358, "pid": 618, "tid": 618, "ts": 1624691363546447, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363546461, "dur": 2875, | |
"args": { | |
"cbid": 131, "correlation": 359, | |
"external id": 152, "external ts": 1624691363546441 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363549388, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 371, "external id": 155, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02564102564102564 | |
} | |
}, | |
{ | |
"ph": "f", "id": 371, "pid": 0, "tid": "stream 7", "ts": 1624691363549388, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363549372, "dur": 12, | |
"args": { | |
"cbid": 41, "correlation": 371, | |
"external id": 155, "external ts": 1624691363549366 | |
} | |
}, | |
{ | |
"ph": "s", "id": 371, "pid": 618, "tid": 618, "ts": 1624691363549372, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363549385, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 372, | |
"external id": 155, "external ts": 1624691363549366 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363549440, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 384, "external id": 158, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02702702702702703 | |
} | |
}, | |
{ | |
"ph": "f", "id": 384, "pid": 0, "tid": "stream 7", "ts": 1624691363549440, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363549431, "dur": 5, | |
"args": { | |
"cbid": 41, "correlation": 384, | |
"external id": 158, "external ts": 1624691363549427 | |
} | |
}, | |
{ | |
"ph": "s", "id": 384, "pid": 618, "tid": 618, "ts": 1624691363549431, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363549436, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 385, | |
"external id": 158, "external ts": 1624691363549427 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363549500, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 397, "external id": 161, | |
"bytes": 8, "memory bandwidth (GB/s)": 0.006578947368421052 | |
} | |
}, | |
{ | |
"ph": "f", "id": 397, "pid": 0, "tid": "stream 7", "ts": 1624691363549500, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363549489, "dur": 6, | |
"args": { | |
"cbid": 41, "correlation": 397, | |
"external id": 161, "external ts": 1624691363549485 | |
} | |
}, | |
{ | |
"ph": "s", "id": 397, "pid": 618, "tid": 618, "ts": 1624691363549489, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363549496, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 398, | |
"external id": 161, "external ts": 1624691363549485 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363549525, "dur": 59, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 400, "external id": 144, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 12.857142, | |
"warps per SM": 205.71428, | |
"grid": [720, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 400, "pid": 0, "tid": "stream 7", "ts": 1624691363549525, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363549508, "dur": 15, | |
"args": { | |
"cbid": 211, "correlation": 400, | |
"external id": 144, "external ts": 1624691363546369 | |
} | |
}, | |
{ | |
"ph": "s", "id": 400, "pid": 618, "tid": 618, "ts": 1624691363549508, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363549604, "dur": 17, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 406, "external id": 172, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 25.714285, | |
"warps per SM": 51.42857, | |
"grid": [1440, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 80 | |
} | |
}, | |
{ | |
"ph": "f", "id": 406, "pid": 0, "tid": "stream 7", "ts": 1624691363549604, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363549588, "dur": 13, | |
"args": { | |
"cbid": 211, "correlation": 406, | |
"external id": 172, "external ts": 1624691363549579 | |
} | |
}, | |
{ | |
"ph": "s", "id": 406, "pid": 618, "tid": 618, "ts": 1624691363549588, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363549752, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 428, "external id": 191, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.033783783783783786 | |
} | |
}, | |
{ | |
"ph": "f", "id": 428, "pid": 0, "tid": "stream 7", "ts": 1624691363549752, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363549738, "dur": 10, | |
"args": { | |
"cbid": 41, "correlation": 428, | |
"external id": 191, "external ts": 1624691363549732 | |
} | |
}, | |
{ | |
"ph": "s", "id": 428, "pid": 618, "tid": 618, "ts": 1624691363549738, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363549749, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 429, | |
"external id": 191, "external ts": 1624691363549732 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363549788, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 441, "external id": 194, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.03289473684210526 | |
} | |
}, | |
{ | |
"ph": "f", "id": 441, "pid": 0, "tid": "stream 7", "ts": 1624691363549788, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363549779, "dur": 5, | |
"args": { | |
"cbid": 41, "correlation": 441, | |
"external id": 194, "external ts": 1624691363549775 | |
} | |
}, | |
{ | |
"ph": "s", "id": 441, "pid": 618, "tid": 618, "ts": 1624691363549779, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363549785, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 442, | |
"external id": 194, "external ts": 1624691363549775 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363549834, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 454, "external id": 197, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.033783783783783786 | |
} | |
}, | |
{ | |
"ph": "f", "id": 454, "pid": 0, "tid": "stream 7", "ts": 1624691363549834, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363549825, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 454, | |
"external id": 197, "external ts": 1624691363549807 | |
} | |
}, | |
{ | |
"ph": "s", "id": 454, "pid": 618, "tid": 618, "ts": 1624691363549825, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363549830, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 455, | |
"external id": 197, "external ts": 1624691363549807 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363549862, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 467, "external id": 200, | |
"bytes": 16, "memory bandwidth (GB/s)": 0.013513513513513514 | |
} | |
}, | |
{ | |
"ph": "f", "id": 467, "pid": 0, "tid": "stream 7", "ts": 1624691363549862, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363549854, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 467, | |
"external id": 200, "external ts": 1624691363549851 | |
} | |
}, | |
{ | |
"ph": "s", "id": 467, "pid": 618, "tid": 618, "ts": 1624691363549854, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363549858, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 468, | |
"external id": 200, "external ts": 1624691363549851 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363549892, "dur": 2285, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 470, "external id": 183, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 398.57144, | |
"warps per SM": 6377.143, | |
"grid": [22320, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 470, "pid": 0, "tid": "stream 7", "ts": 1624691363549892, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363549877, "dur": 12, | |
"args": { | |
"cbid": 211, "correlation": 470, | |
"external id": 183, "external ts": 1624691363549667 | |
} | |
}, | |
{ | |
"ph": "s", "id": 470, "pid": 618, "tid": 618, "ts": 1624691363549877, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363552178, "dur": 417, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 476, "external id": 211, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 797.1429, | |
"warps per SM": 1594.2858, | |
"grid": [44640, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 476, "pid": 0, "tid": "stream 7", "ts": 1624691363552178, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363549943, "dur": 12, | |
"args": { | |
"cbid": 211, "correlation": 476, | |
"external id": 211, "external ts": 1624691363549934 | |
} | |
}, | |
{ | |
"ph": "s", "id": 476, "pid": 618, "tid": 618, "ts": 1624691363549943, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363552597, "dur": 366, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 489, "external id": 214, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 489, "pid": 0, "tid": "stream 7", "ts": 1624691363552597, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363550015, "dur": 16, | |
"args": { | |
"cbid": 211, "correlation": 489, | |
"external id": 214, "external ts": 1624691363550005 | |
} | |
}, | |
{ | |
"ph": "s", "id": 489, "pid": 618, "tid": 618, "ts": 1624691363550015, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363552964, "dur": 334, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 500, "external id": 217, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 500, "pid": 0, "tid": "stream 7", "ts": 1624691363552964, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363550066, "dur": 10, | |
"args": { | |
"cbid": 211, "correlation": 500, | |
"external id": 217, "external ts": 1624691363550058 | |
} | |
}, | |
{ | |
"ph": "s", "id": 500, "pid": 618, "tid": 618, "ts": 1624691363550066, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::vectorized_elementwise_kernel<4, at::native::FillFunctor<float>, at::detail::Array<char*, 1> >(int, at::native::FillFunctor<float>, at::detail::Array<char*, 1>)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363553299, "dur": 184, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 508, "external id": 220, | |
"registers per thread": 8, | |
"shared memory": 0, | |
"blocks per SM": 1755.4286, | |
"warps per SM": 3510.8572, | |
"grid": [98304, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 508, "pid": 0, "tid": "stream 7", "ts": 1624691363553299, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363550125, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 508, | |
"external id": 220, "external ts": 1624691363550119 | |
} | |
}, | |
{ | |
"ph": "s", "id": 508, "pid": 618, "tid": 618, "ts": 1624691363550125, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363553484, "dur": 405, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 513, "external id": 224, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 932.5714, | |
"warps per SM": 1865.1428, | |
"grid": [52224, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 513, "pid": 0, "tid": "stream 7", "ts": 1624691363553484, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363550158, "dur": 8, | |
"args": { | |
"cbid": 211, "correlation": 513, | |
"external id": 224, "external ts": 1624691363550151 | |
} | |
}, | |
{ | |
"ph": "s", "id": 513, "pid": 618, "tid": 618, "ts": 1624691363550158, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363553891, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 534, "external id": 243, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02702702702702703 | |
} | |
}, | |
{ | |
"ph": "f", "id": 534, "pid": 0, "tid": "stream 7", "ts": 1624691363553891, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363550294, "dur": 11, | |
"args": { | |
"cbid": 41, "correlation": 534, | |
"external id": 243, "external ts": 1624691363550288 | |
} | |
}, | |
{ | |
"ph": "s", "id": 534, "pid": 618, "tid": 618, "ts": 1624691363550294, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363550306, "dur": 3592, | |
"args": { | |
"cbid": 131, "correlation": 535, | |
"external id": 243, "external ts": 1624691363550288 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363553944, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 547, "external id": 246, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02631578947368421 | |
} | |
}, | |
{ | |
"ph": "f", "id": 547, "pid": 0, "tid": "stream 7", "ts": 1624691363553944, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363553931, "dur": 9, | |
"args": { | |
"cbid": 41, "correlation": 547, | |
"external id": 246, "external ts": 1624691363553925 | |
} | |
}, | |
{ | |
"ph": "s", "id": 547, "pid": 618, "tid": 618, "ts": 1624691363553931, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363553941, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 548, | |
"external id": 246, "external ts": 1624691363553925 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363553993, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 560, "external id": 249, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02631578947368421 | |
} | |
}, | |
{ | |
"ph": "f", "id": 560, "pid": 0, "tid": "stream 7", "ts": 1624691363553993, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363553984, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 560, | |
"external id": 249, "external ts": 1624691363553980 | |
} | |
}, | |
{ | |
"ph": "s", "id": 560, "pid": 618, "tid": 618, "ts": 1624691363553984, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363553989, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 561, | |
"external id": 249, "external ts": 1624691363553980 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363554022, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 573, "external id": 252, | |
"bytes": 8, "memory bandwidth (GB/s)": 0.006756756756756757 | |
} | |
}, | |
{ | |
"ph": "f", "id": 573, "pid": 0, "tid": "stream 7", "ts": 1624691363554022, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363554014, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 573, | |
"external id": 252, "external ts": 1624691363554011 | |
} | |
}, | |
{ | |
"ph": "s", "id": 573, "pid": 618, "tid": 618, "ts": 1624691363554014, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363554018, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 574, | |
"external id": 252, "external ts": 1624691363554011 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363554046, "dur": 58, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 576, "external id": 235, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 12.857142, | |
"warps per SM": 205.71428, | |
"grid": [720, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 576, "pid": 0, "tid": "stream 7", "ts": 1624691363554046, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363554031, "dur": 13, | |
"args": { | |
"cbid": 211, "correlation": 576, | |
"external id": 235, "external ts": 1624691363550222 | |
} | |
}, | |
{ | |
"ph": "s", "id": 576, "pid": 618, "tid": 618, "ts": 1624691363554031, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363554134, "dur": 17, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 582, "external id": 263, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 25.714285, | |
"warps per SM": 51.42857, | |
"grid": [1440, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 80 | |
} | |
}, | |
{ | |
"ph": "f", "id": 582, "pid": 0, "tid": "stream 7", "ts": 1624691363554134, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363554119, "dur": 12, | |
"args": { | |
"cbid": 211, "correlation": 582, | |
"external id": 263, "external ts": 1624691363554109 | |
} | |
}, | |
{ | |
"ph": "s", "id": 582, "pid": 618, "tid": 618, "ts": 1624691363554119, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363554235, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 604, "external id": 282, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.03289473684210526 | |
} | |
}, | |
{ | |
"ph": "f", "id": 604, "pid": 0, "tid": "stream 7", "ts": 1624691363554235, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363554222, "dur": 9, | |
"args": { | |
"cbid": 41, "correlation": 604, | |
"external id": 282, "external ts": 1624691363554217 | |
} | |
}, | |
{ | |
"ph": "s", "id": 604, "pid": 618, "tid": 618, "ts": 1624691363554222, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363554232, "dur": 12, | |
"args": { | |
"cbid": 131, "correlation": 605, | |
"external id": 282, "external ts": 1624691363554217 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363554274, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 617, "external id": 285, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.033783783783783786 | |
} | |
}, | |
{ | |
"ph": "f", "id": 617, "pid": 0, "tid": "stream 7", "ts": 1624691363554274, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363554265, "dur": 5, | |
"args": { | |
"cbid": 41, "correlation": 617, | |
"external id": 285, "external ts": 1624691363554261 | |
} | |
}, | |
{ | |
"ph": "s", "id": 617, "pid": 618, "tid": 618, "ts": 1624691363554265, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363554271, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 618, | |
"external id": 285, "external ts": 1624691363554261 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363554336, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 630, "external id": 288, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.033783783783783786 | |
} | |
}, | |
{ | |
"ph": "f", "id": 630, "pid": 0, "tid": "stream 7", "ts": 1624691363554336, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363554327, "dur": 5, | |
"args": { | |
"cbid": 41, "correlation": 630, | |
"external id": 288, "external ts": 1624691363554323 | |
} | |
}, | |
{ | |
"ph": "s", "id": 630, "pid": 618, "tid": 618, "ts": 1624691363554327, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363554332, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 631, | |
"external id": 288, "external ts": 1624691363554323 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363554404, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 643, "external id": 291, | |
"bytes": 16, "memory bandwidth (GB/s)": 0.013513513513513514 | |
} | |
}, | |
{ | |
"ph": "f", "id": 643, "pid": 0, "tid": "stream 7", "ts": 1624691363554404, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363554395, "dur": 5, | |
"args": { | |
"cbid": 41, "correlation": 643, | |
"external id": 291, "external ts": 1624691363554391 | |
} | |
}, | |
{ | |
"ph": "s", "id": 643, "pid": 618, "tid": 618, "ts": 1624691363554395, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363554401, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 644, | |
"external id": 291, "external ts": 1624691363554391 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363554427, "dur": 2286, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 646, "external id": 274, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 398.57144, | |
"warps per SM": 6377.143, | |
"grid": [22320, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 646, "pid": 0, "tid": "stream 7", "ts": 1624691363554427, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363554413, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 646, | |
"external id": 274, "external ts": 1624691363554177 | |
} | |
}, | |
{ | |
"ph": "s", "id": 646, "pid": 618, "tid": 618, "ts": 1624691363554413, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363556713, "dur": 417, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 652, "external id": 302, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 797.1429, | |
"warps per SM": 1594.2858, | |
"grid": [44640, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 652, "pid": 0, "tid": "stream 7", "ts": 1624691363556713, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363554479, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 652, | |
"external id": 302, "external ts": 1624691363554470 | |
} | |
}, | |
{ | |
"ph": "s", "id": 652, "pid": 618, "tid": 618, "ts": 1624691363554479, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363557131, "dur": 334, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 665, "external id": 305, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 665, "pid": 0, "tid": "stream 7", "ts": 1624691363557131, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363554535, "dur": 12, | |
"args": { | |
"cbid": 211, "correlation": 665, | |
"external id": 305, "external ts": 1624691363554524 | |
} | |
}, | |
{ | |
"ph": "s", "id": 665, "pid": 618, "tid": 618, "ts": 1624691363554535, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363557467, "dur": 376, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 676, "external id": 308, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 676, "pid": 0, "tid": "stream 7", "ts": 1624691363557467, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363554589, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 676, | |
"external id": 308, "external ts": 1624691363554581 | |
} | |
}, | |
{ | |
"ph": "s", "id": 676, "pid": 618, "tid": 618, "ts": 1624691363554589, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::vectorized_elementwise_kernel<4, at::native::FillFunctor<float>, at::detail::Array<char*, 1> >(int, at::native::FillFunctor<float>, at::detail::Array<char*, 1>)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363557844, "dur": 184, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 684, "external id": 311, | |
"registers per thread": 8, | |
"shared memory": 0, | |
"blocks per SM": 1755.4286, | |
"warps per SM": 3510.8572, | |
"grid": [98304, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 684, "pid": 0, "tid": "stream 7", "ts": 1624691363557844, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363554705, "dur": 14, | |
"args": { | |
"cbid": 211, "correlation": 684, | |
"external id": 311, "external ts": 1624691363554683 | |
} | |
}, | |
{ | |
"ph": "s", "id": 684, "pid": 618, "tid": 618, "ts": 1624691363554705, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363558029, "dur": 405, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 689, "external id": 315, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 932.5714, | |
"warps per SM": 1865.1428, | |
"grid": [52224, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 689, "pid": 0, "tid": "stream 7", "ts": 1624691363558029, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363554745, "dur": 9, | |
"args": { | |
"cbid": 211, "correlation": 689, | |
"external id": 315, "external ts": 1624691363554737 | |
} | |
}, | |
{ | |
"ph": "s", "id": 689, "pid": 618, "tid": 618, "ts": 1624691363554745, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363558436, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 710, "external id": 334, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02631578947368421 | |
} | |
}, | |
{ | |
"ph": "f", "id": 710, "pid": 0, "tid": "stream 7", "ts": 1624691363558436, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363554855, "dur": 11, | |
"args": { | |
"cbid": 41, "correlation": 710, | |
"external id": 334, "external ts": 1624691363554850 | |
} | |
}, | |
{ | |
"ph": "s", "id": 710, "pid": 618, "tid": 618, "ts": 1624691363554855, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363554867, "dur": 3590, | |
"args": { | |
"cbid": 131, "correlation": 711, | |
"external id": 334, "external ts": 1624691363554850 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363558495, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 723, "external id": 337, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02702702702702703 | |
} | |
}, | |
{ | |
"ph": "f", "id": 723, "pid": 0, "tid": "stream 7", "ts": 1624691363558495, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363558484, "dur": 7, | |
"args": { | |
"cbid": 41, "correlation": 723, | |
"external id": 337, "external ts": 1624691363558480 | |
} | |
}, | |
{ | |
"ph": "s", "id": 723, "pid": 618, "tid": 618, "ts": 1624691363558484, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363558492, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 724, | |
"external id": 337, "external ts": 1624691363558480 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363558544, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 736, "external id": 340, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02702702702702703 | |
} | |
}, | |
{ | |
"ph": "f", "id": 736, "pid": 0, "tid": "stream 7", "ts": 1624691363558544, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363558536, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 736, | |
"external id": 340, "external ts": 1624691363558532 | |
} | |
}, | |
{ | |
"ph": "s", "id": 736, "pid": 618, "tid": 618, "ts": 1624691363558536, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363558541, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 737, | |
"external id": 340, "external ts": 1624691363558532 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363558604, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 749, "external id": 343, | |
"bytes": 8, "memory bandwidth (GB/s)": 0.006756756756756757 | |
} | |
}, | |
{ | |
"ph": "f", "id": 749, "pid": 0, "tid": "stream 7", "ts": 1624691363558604, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363558581, "dur": 19, | |
"args": { | |
"cbid": 41, "correlation": 749, | |
"external id": 343, "external ts": 1624691363558578 | |
} | |
}, | |
{ | |
"ph": "s", "id": 749, "pid": 618, "tid": 618, "ts": 1624691363558581, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363558601, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 750, | |
"external id": 343, "external ts": 1624691363558578 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363558627, "dur": 58, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 752, "external id": 326, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 12.857142, | |
"warps per SM": 205.71428, | |
"grid": [720, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 752, "pid": 0, "tid": "stream 7", "ts": 1624691363558627, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363558613, "dur": 12, | |
"args": { | |
"cbid": 211, "correlation": 752, | |
"external id": 326, "external ts": 1624691363554807 | |
} | |
}, | |
{ | |
"ph": "s", "id": 752, "pid": 618, "tid": 618, "ts": 1624691363558613, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363558711, "dur": 17, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 758, "external id": 354, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 25.714285, | |
"warps per SM": 51.42857, | |
"grid": [1440, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 80 | |
} | |
}, | |
{ | |
"ph": "f", "id": 758, "pid": 0, "tid": "stream 7", "ts": 1624691363558711, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363558683, "dur": 26, | |
"args": { | |
"cbid": 211, "correlation": 758, | |
"external id": 354, "external ts": 1624691363558674 | |
} | |
}, | |
{ | |
"ph": "s", "id": 758, "pid": 618, "tid": 618, "ts": 1624691363558683, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363558922, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 780, "external id": 373, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.03289473684210526 | |
} | |
}, | |
{ | |
"ph": "f", "id": 780, "pid": 0, "tid": "stream 7", "ts": 1624691363558922, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363558894, "dur": 24, | |
"args": { | |
"cbid": 41, "correlation": 780, | |
"external id": 373, "external ts": 1624691363558889 | |
} | |
}, | |
{ | |
"ph": "s", "id": 780, "pid": 618, "tid": 618, "ts": 1624691363558894, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363558919, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 781, | |
"external id": 373, "external ts": 1624691363558889 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363558955, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 793, "external id": 376, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.033783783783783786 | |
} | |
}, | |
{ | |
"ph": "f", "id": 793, "pid": 0, "tid": "stream 7", "ts": 1624691363558955, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363558946, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 793, | |
"external id": 376, "external ts": 1624691363558942 | |
} | |
}, | |
{ | |
"ph": "s", "id": 793, "pid": 618, "tid": 618, "ts": 1624691363558946, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363558951, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 794, | |
"external id": 376, "external ts": 1624691363558942 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363558985, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 806, "external id": 379, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.03205128205128205 | |
} | |
}, | |
{ | |
"ph": "f", "id": 806, "pid": 0, "tid": "stream 7", "ts": 1624691363558985, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363558977, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 806, | |
"external id": 379, "external ts": 1624691363558973 | |
} | |
}, | |
{ | |
"ph": "s", "id": 806, "pid": 618, "tid": 618, "ts": 1624691363558977, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363558981, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 807, | |
"external id": 379, "external ts": 1624691363558973 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363559014, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 819, "external id": 382, | |
"bytes": 16, "memory bandwidth (GB/s)": 0.013157894736842105 | |
} | |
}, | |
{ | |
"ph": "f", "id": 819, "pid": 0, "tid": "stream 7", "ts": 1624691363559014, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363559006, "dur": 3, | |
"args": { | |
"cbid": 41, "correlation": 819, | |
"external id": 382, "external ts": 1624691363559003 | |
} | |
}, | |
{ | |
"ph": "s", "id": 819, "pid": 618, "tid": 618, "ts": 1624691363559006, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363559010, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 820, | |
"external id": 382, "external ts": 1624691363559003 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363559035, "dur": 2285, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 822, "external id": 365, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 398.57144, | |
"warps per SM": 6377.143, | |
"grid": [22320, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 822, "pid": 0, "tid": "stream 7", "ts": 1624691363559035, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363559022, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 822, | |
"external id": 365, "external ts": 1624691363558824 | |
} | |
}, | |
{ | |
"ph": "s", "id": 822, "pid": 618, "tid": 618, "ts": 1624691363559022, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363561322, "dur": 416, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 828, "external id": 393, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 797.1429, | |
"warps per SM": 1594.2858, | |
"grid": [44640, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 828, "pid": 0, "tid": "stream 7", "ts": 1624691363561322, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363559101, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 828, | |
"external id": 393, "external ts": 1624691363559092 | |
} | |
}, | |
{ | |
"ph": "s", "id": 828, "pid": 618, "tid": 618, "ts": 1624691363559101, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363561740, "dur": 333, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 841, "external id": 396, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 841, "pid": 0, "tid": "stream 7", "ts": 1624691363561740, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363559198, "dur": 12, | |
"args": { | |
"cbid": 211, "correlation": 841, | |
"external id": 396, "external ts": 1624691363559189 | |
} | |
}, | |
{ | |
"ph": "s", "id": 841, "pid": 618, "tid": 618, "ts": 1624691363559198, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363562074, "dur": 376, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 852, "external id": 399, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 852, "pid": 0, "tid": "stream 7", "ts": 1624691363562074, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363559252, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 852, | |
"external id": 399, "external ts": 1624691363559244 | |
} | |
}, | |
{ | |
"ph": "s", "id": 852, "pid": 618, "tid": 618, "ts": 1624691363559252, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::vectorized_elementwise_kernel<4, at::native::FillFunctor<float>, at::detail::Array<char*, 1> >(int, at::native::FillFunctor<float>, at::detail::Array<char*, 1>)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363562451, "dur": 184, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 860, "external id": 402, | |
"registers per thread": 8, | |
"shared memory": 0, | |
"blocks per SM": 1755.4286, | |
"warps per SM": 3510.8572, | |
"grid": [98304, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 860, "pid": 0, "tid": "stream 7", "ts": 1624691363562451, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363559327, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 860, | |
"external id": 402, "external ts": 1624691363559321 | |
} | |
}, | |
{ | |
"ph": "s", "id": 860, "pid": 618, "tid": 618, "ts": 1624691363559327, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363562636, "dur": 405, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 865, "external id": 406, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 932.5714, | |
"warps per SM": 1865.1428, | |
"grid": [52224, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 865, "pid": 0, "tid": "stream 7", "ts": 1624691363562636, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363559360, "dur": 8, | |
"args": { | |
"cbid": 211, "correlation": 865, | |
"external id": 406, "external ts": 1624691363559353 | |
} | |
}, | |
{ | |
"ph": "s", "id": 865, "pid": 618, "tid": 618, "ts": 1624691363559360, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363563043, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 886, "external id": 425, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02702702702702703 | |
} | |
}, | |
{ | |
"ph": "f", "id": 886, "pid": 0, "tid": "stream 7", "ts": 1624691363563043, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363559506, "dur": 11, | |
"args": { | |
"cbid": 41, "correlation": 886, | |
"external id": 425, "external ts": 1624691363559500 | |
} | |
}, | |
{ | |
"ph": "s", "id": 886, "pid": 618, "tid": 618, "ts": 1624691363559506, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363559517, "dur": 3530, | |
"args": { | |
"cbid": 131, "correlation": 887, | |
"external id": 425, "external ts": 1624691363559500 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363563084, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 899, "external id": 428, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02702702702702703 | |
} | |
}, | |
{ | |
"ph": "f", "id": 899, "pid": 0, "tid": "stream 7", "ts": 1624691363563084, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363563073, "dur": 7, | |
"args": { | |
"cbid": 41, "correlation": 899, | |
"external id": 428, "external ts": 1624691363563069 | |
} | |
}, | |
{ | |
"ph": "s", "id": 899, "pid": 618, "tid": 618, "ts": 1624691363563073, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363563081, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 900, | |
"external id": 428, "external ts": 1624691363563069 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363563115, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 912, "external id": 431, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02702702702702703 | |
} | |
}, | |
{ | |
"ph": "f", "id": 912, "pid": 0, "tid": "stream 7", "ts": 1624691363563115, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363563107, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 912, | |
"external id": 431, "external ts": 1624691363563103 | |
} | |
}, | |
{ | |
"ph": "s", "id": 912, "pid": 618, "tid": 618, "ts": 1624691363563107, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363563112, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 913, | |
"external id": 431, "external ts": 1624691363563103 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363563161, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 925, "external id": 434, | |
"bytes": 8, "memory bandwidth (GB/s)": 0.006756756756756757 | |
} | |
}, | |
{ | |
"ph": "f", "id": 925, "pid": 0, "tid": "stream 7", "ts": 1624691363563161, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363563153, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 925, | |
"external id": 434, "external ts": 1624691363563149 | |
} | |
}, | |
{ | |
"ph": "s", "id": 925, "pid": 618, "tid": 618, "ts": 1624691363563153, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363563173, "dur": 2, | |
"args": { | |
"cbid": 131, "correlation": 926, | |
"external id": 434, "external ts": 1624691363563149 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363563195, "dur": 61, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 928, "external id": 417, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 12.857142, | |
"warps per SM": 205.71428, | |
"grid": [720, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 928, "pid": 0, "tid": "stream 7", "ts": 1624691363563195, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363563180, "dur": 27, | |
"args": { | |
"cbid": 211, "correlation": 928, | |
"external id": 417, "external ts": 1624691363559458 | |
} | |
}, | |
{ | |
"ph": "s", "id": 928, "pid": 618, "tid": 618, "ts": 1624691363563180, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363563313, "dur": 17, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 934, "external id": 445, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 25.714285, | |
"warps per SM": 51.42857, | |
"grid": [1440, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 80 | |
} | |
}, | |
{ | |
"ph": "f", "id": 934, "pid": 0, "tid": "stream 7", "ts": 1624691363563313, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363563298, "dur": 13, | |
"args": { | |
"cbid": 211, "correlation": 934, | |
"external id": 445, "external ts": 1624691363563287 | |
} | |
}, | |
{ | |
"ph": "s", "id": 934, "pid": 618, "tid": 618, "ts": 1624691363563298, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363563412, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 956, "external id": 464, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.03289473684210526 | |
} | |
}, | |
{ | |
"ph": "f", "id": 956, "pid": 0, "tid": "stream 7", "ts": 1624691363563412, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363563399, "dur": 9, | |
"args": { | |
"cbid": 41, "correlation": 956, | |
"external id": 464, "external ts": 1624691363563394 | |
} | |
}, | |
{ | |
"ph": "s", "id": 956, "pid": 618, "tid": 618, "ts": 1624691363563399, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363563409, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 957, | |
"external id": 464, "external ts": 1624691363563394 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363563444, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 969, "external id": 467, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.03289473684210526 | |
} | |
}, | |
{ | |
"ph": "f", "id": 969, "pid": 0, "tid": "stream 7", "ts": 1624691363563444, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363563436, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 969, | |
"external id": 467, "external ts": 1624691363563432 | |
} | |
}, | |
{ | |
"ph": "s", "id": 969, "pid": 618, "tid": 618, "ts": 1624691363563436, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363563441, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 970, | |
"external id": 467, "external ts": 1624691363563432 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363563498, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 982, "external id": 470, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.03289473684210526 | |
} | |
}, | |
{ | |
"ph": "f", "id": 982, "pid": 0, "tid": "stream 7", "ts": 1624691363563498, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363563488, "dur": 5, | |
"args": { | |
"cbid": 41, "correlation": 982, | |
"external id": 470, "external ts": 1624691363563462 | |
} | |
}, | |
{ | |
"ph": "s", "id": 982, "pid": 618, "tid": 618, "ts": 1624691363563488, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363563494, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 983, | |
"external id": 470, "external ts": 1624691363563462 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363563528, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 995, "external id": 473, | |
"bytes": 16, "memory bandwidth (GB/s)": 0.011111111111111112 | |
} | |
}, | |
{ | |
"ph": "f", "id": 995, "pid": 0, "tid": "stream 7", "ts": 1624691363563528, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363563520, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 995, | |
"external id": 473, "external ts": 1624691363563517 | |
} | |
}, | |
{ | |
"ph": "s", "id": 995, "pid": 618, "tid": 618, "ts": 1624691363563520, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363563525, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 996, | |
"external id": 473, "external ts": 1624691363563517 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363563549, "dur": 2286, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 998, "external id": 456, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 398.57144, | |
"warps per SM": 6377.143, | |
"grid": [22320, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 998, "pid": 0, "tid": "stream 7", "ts": 1624691363563549, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363563537, "dur": 10, | |
"args": { | |
"cbid": 211, "correlation": 998, | |
"external id": 456, "external ts": 1624691363563355 | |
} | |
}, | |
{ | |
"ph": "s", "id": 998, "pid": 618, "tid": 618, "ts": 1624691363563537, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363565836, "dur": 417, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1004, "external id": 484, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 797.1429, | |
"warps per SM": 1594.2858, | |
"grid": [44640, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1004, "pid": 0, "tid": "stream 7", "ts": 1624691363565836, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363563612, "dur": 12, | |
"args": { | |
"cbid": 211, "correlation": 1004, | |
"external id": 484, "external ts": 1624691363563589 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1004, "pid": 618, "tid": 618, "ts": 1624691363563612, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363566255, "dur": 372, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1017, "external id": 487, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1017, "pid": 0, "tid": "stream 7", "ts": 1624691363566255, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363563696, "dur": 28, | |
"args": { | |
"cbid": 211, "correlation": 1017, | |
"external id": 487, "external ts": 1624691363563674 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1017, "pid": 618, "tid": 618, "ts": 1624691363563696, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363566628, "dur": 368, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1028, "external id": 490, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1028, "pid": 0, "tid": "stream 7", "ts": 1624691363566628, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363563783, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 1028, | |
"external id": 490, "external ts": 1624691363563775 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1028, "pid": 618, "tid": 618, "ts": 1624691363563783, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::vectorized_elementwise_kernel<4, at::native::FillFunctor<float>, at::detail::Array<char*, 1> >(int, at::native::FillFunctor<float>, at::detail::Array<char*, 1>)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363566998, "dur": 184, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1036, "external id": 493, | |
"registers per thread": 8, | |
"shared memory": 0, | |
"blocks per SM": 1755.4286, | |
"warps per SM": 3510.8572, | |
"grid": [98304, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1036, "pid": 0, "tid": "stream 7", "ts": 1624691363566998, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363563858, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 1036, | |
"external id": 493, "external ts": 1624691363563852 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1036, "pid": 618, "tid": 618, "ts": 1624691363563858, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363567183, "dur": 405, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1041, "external id": 497, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 932.5714, | |
"warps per SM": 1865.1428, | |
"grid": [52224, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1041, "pid": 0, "tid": "stream 7", "ts": 1624691363567183, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363563892, "dur": 9, | |
"args": { | |
"cbid": 211, "correlation": 1041, | |
"external id": 497, "external ts": 1624691363563885 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1041, "pid": 618, "tid": 618, "ts": 1624691363563892, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363567590, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1062, "external id": 516, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02702702702702703 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1062, "pid": 0, "tid": "stream 7", "ts": 1624691363567590, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363564047, "dur": 11, | |
"args": { | |
"cbid": 41, "correlation": 1062, | |
"external id": 516, "external ts": 1624691363564027 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1062, "pid": 618, "tid": 618, "ts": 1624691363564047, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363564058, "dur": 3551, | |
"args": { | |
"cbid": 131, "correlation": 1063, | |
"external id": 516, "external ts": 1624691363564027 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363567670, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1075, "external id": 519, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02702702702702703 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1075, "pid": 0, "tid": "stream 7", "ts": 1624691363567670, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363567659, "dur": 7, | |
"args": { | |
"cbid": 41, "correlation": 1075, | |
"external id": 519, "external ts": 1624691363567654 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1075, "pid": 618, "tid": 618, "ts": 1624691363567659, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363567667, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 1076, | |
"external id": 519, "external ts": 1624691363567654 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363567702, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1088, "external id": 522, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02631578947368421 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1088, "pid": 0, "tid": "stream 7", "ts": 1624691363567702, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363567693, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 1088, | |
"external id": 522, "external ts": 1624691363567690 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1088, "pid": 618, "tid": 618, "ts": 1624691363567693, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363567699, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 1089, | |
"external id": 522, "external ts": 1624691363567690 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363567762, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1101, "external id": 525, | |
"bytes": 8, "memory bandwidth (GB/s)": 0.006756756756756757 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1101, "pid": 0, "tid": "stream 7", "ts": 1624691363567762, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363567752, "dur": 6, | |
"args": { | |
"cbid": 41, "correlation": 1101, | |
"external id": 525, "external ts": 1624691363567747 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1101, "pid": 618, "tid": 618, "ts": 1624691363567752, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363567759, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 1102, | |
"external id": 525, "external ts": 1624691363567747 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363567786, "dur": 59, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1104, "external id": 508, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 12.857142, | |
"warps per SM": 205.71428, | |
"grid": [720, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1104, "pid": 0, "tid": "stream 7", "ts": 1624691363567786, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363567771, "dur": 12, | |
"args": { | |
"cbid": 211, "correlation": 1104, | |
"external id": 508, "external ts": 1624691363563971 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1104, "pid": 618, "tid": 618, "ts": 1624691363567771, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363567854, "dur": 18, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1110, "external id": 536, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 25.714285, | |
"warps per SM": 51.42857, | |
"grid": [1440, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 80 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1110, "pid": 0, "tid": "stream 7", "ts": 1624691363567854, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363567841, "dur": 10, | |
"args": { | |
"cbid": 211, "correlation": 1110, | |
"external id": 536, "external ts": 1624691363567833 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1110, "pid": 618, "tid": 618, "ts": 1624691363567841, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363568072, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1132, "external id": 555, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.033783783783783786 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1132, "pid": 0, "tid": "stream 7", "ts": 1624691363568072, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363568058, "dur": 10, | |
"args": { | |
"cbid": 41, "correlation": 1132, | |
"external id": 555, "external ts": 1624691363568053 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1132, "pid": 618, "tid": 618, "ts": 1624691363568058, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363568068, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 1133, | |
"external id": 555, "external ts": 1624691363568053 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363568104, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1145, "external id": 558, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.033783783783783786 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1145, "pid": 0, "tid": "stream 7", "ts": 1624691363568104, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363568095, "dur": 5, | |
"args": { | |
"cbid": 41, "correlation": 1145, | |
"external id": 558, "external ts": 1624691363568091 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1145, "pid": 618, "tid": 618, "ts": 1624691363568095, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363568101, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 1146, | |
"external id": 558, "external ts": 1624691363568091 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363568135, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1158, "external id": 561, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.03289473684210526 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1158, "pid": 0, "tid": "stream 7", "ts": 1624691363568135, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363568126, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 1158, | |
"external id": 561, "external ts": 1624691363568123 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1158, "pid": 618, "tid": 618, "ts": 1624691363568126, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363568131, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 1159, | |
"external id": 561, "external ts": 1624691363568123 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363568163, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1171, "external id": 564, | |
"bytes": 16, "memory bandwidth (GB/s)": 0.013513513513513514 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1171, "pid": 0, "tid": "stream 7", "ts": 1624691363568163, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363568155, "dur": 3, | |
"args": { | |
"cbid": 41, "correlation": 1171, | |
"external id": 564, "external ts": 1624691363568152 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1171, "pid": 618, "tid": 618, "ts": 1624691363568155, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363568160, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 1172, | |
"external id": 564, "external ts": 1624691363568152 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363568185, "dur": 2285, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1174, "external id": 547, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 398.57144, | |
"warps per SM": 6377.143, | |
"grid": [22320, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1174, "pid": 0, "tid": "stream 7", "ts": 1624691363568185, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363568171, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 1174, | |
"external id": 547, "external ts": 1624691363568001 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1174, "pid": 618, "tid": 618, "ts": 1624691363568171, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363570472, "dur": 417, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1180, "external id": 575, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 797.1429, | |
"warps per SM": 1594.2858, | |
"grid": [44640, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1180, "pid": 0, "tid": "stream 7", "ts": 1624691363570472, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363568243, "dur": 26, | |
"args": { | |
"cbid": 211, "correlation": 1180, | |
"external id": 575, "external ts": 1624691363568226 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1180, "pid": 618, "tid": 618, "ts": 1624691363568243, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363570890, "dur": 372, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1193, "external id": 578, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1193, "pid": 0, "tid": "stream 7", "ts": 1624691363570890, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363568338, "dur": 12, | |
"args": { | |
"cbid": 211, "correlation": 1193, | |
"external id": 578, "external ts": 1624691363568328 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1193, "pid": 618, "tid": 618, "ts": 1624691363568338, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363571263, "dur": 368, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1204, "external id": 581, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1204, "pid": 0, "tid": "stream 7", "ts": 1624691363571263, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363568384, "dur": 10, | |
"args": { | |
"cbid": 211, "correlation": 1204, | |
"external id": 581, "external ts": 1624691363568376 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1204, "pid": 618, "tid": 618, "ts": 1624691363568384, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::vectorized_elementwise_kernel<4, at::native::FillFunctor<float>, at::detail::Array<char*, 1> >(int, at::native::FillFunctor<float>, at::detail::Array<char*, 1>)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363571632, "dur": 184, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1212, "external id": 584, | |
"registers per thread": 8, | |
"shared memory": 0, | |
"blocks per SM": 1755.4286, | |
"warps per SM": 3510.8572, | |
"grid": [98304, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1212, "pid": 0, "tid": "stream 7", "ts": 1624691363571632, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363568452, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 1212, | |
"external id": 584, "external ts": 1624691363568446 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1212, "pid": 618, "tid": 618, "ts": 1624691363568452, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363571818, "dur": 405, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1217, "external id": 588, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 932.5714, | |
"warps per SM": 1865.1428, | |
"grid": [52224, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1217, "pid": 0, "tid": "stream 7", "ts": 1624691363571818, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363568484, "dur": 8, | |
"args": { | |
"cbid": 211, "correlation": 1217, | |
"external id": 588, "external ts": 1624691363568477 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1217, "pid": 618, "tid": 618, "ts": 1624691363568484, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363572224, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1238, "external id": 607, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02702702702702703 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1238, "pid": 0, "tid": "stream 7", "ts": 1624691363572224, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363568603, "dur": 27, | |
"args": { | |
"cbid": 41, "correlation": 1238, | |
"external id": 607, "external ts": 1624691363568598 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1238, "pid": 618, "tid": 618, "ts": 1624691363568603, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363568631, "dur": 3598, | |
"args": { | |
"cbid": 131, "correlation": 1239, | |
"external id": 607, "external ts": 1624691363568598 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363572279, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1251, "external id": 610, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02631578947368421 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1251, "pid": 0, "tid": "stream 7", "ts": 1624691363572279, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363572267, "dur": 8, | |
"args": { | |
"cbid": 41, "correlation": 1251, | |
"external id": 610, "external ts": 1624691363572261 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1251, "pid": 618, "tid": 618, "ts": 1624691363572267, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363572276, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 1252, | |
"external id": 610, "external ts": 1624691363572261 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363572310, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1264, "external id": 613, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02631578947368421 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1264, "pid": 0, "tid": "stream 7", "ts": 1624691363572310, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363572301, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 1264, | |
"external id": 613, "external ts": 1624691363572298 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1264, "pid": 618, "tid": 618, "ts": 1624691363572301, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363572306, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 1265, | |
"external id": 613, "external ts": 1624691363572298 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363572339, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1277, "external id": 616, | |
"bytes": 8, "memory bandwidth (GB/s)": 0.006578947368421052 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1277, "pid": 0, "tid": "stream 7", "ts": 1624691363572339, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363572331, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 1277, | |
"external id": 616, "external ts": 1624691363572328 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1277, "pid": 618, "tid": 618, "ts": 1624691363572331, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363572336, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 1278, | |
"external id": 616, "external ts": 1624691363572328 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363572362, "dur": 59, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1280, "external id": 599, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 12.857142, | |
"warps per SM": 205.71428, | |
"grid": [720, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1280, "pid": 0, "tid": "stream 7", "ts": 1624691363572362, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363572347, "dur": 12, | |
"args": { | |
"cbid": 211, "correlation": 1280, | |
"external id": 599, "external ts": 1624691363568548 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1280, "pid": 618, "tid": 618, "ts": 1624691363572347, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363572447, "dur": 17, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1286, "external id": 627, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 25.714285, | |
"warps per SM": 51.42857, | |
"grid": [1440, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 80 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1286, "pid": 0, "tid": "stream 7", "ts": 1624691363572447, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363572418, "dur": 26, | |
"args": { | |
"cbid": 211, "correlation": 1286, | |
"external id": 627, "external ts": 1624691363572409 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1286, "pid": 618, "tid": 618, "ts": 1624691363572418, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363572552, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1308, "external id": 646, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.033783783783783786 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1308, "pid": 0, "tid": "stream 7", "ts": 1624691363572552, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363572540, "dur": 9, | |
"args": { | |
"cbid": 41, "correlation": 1308, | |
"external id": 646, "external ts": 1624691363572534 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1308, "pid": 618, "tid": 618, "ts": 1624691363572540, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363572549, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 1309, | |
"external id": 646, "external ts": 1624691363572534 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363572584, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1321, "external id": 649, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.033783783783783786 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1321, "pid": 0, "tid": "stream 7", "ts": 1624691363572584, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363572575, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 1321, | |
"external id": 649, "external ts": 1624691363572572 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1321, "pid": 618, "tid": 618, "ts": 1624691363572575, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363572580, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 1322, | |
"external id": 649, "external ts": 1624691363572572 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363572612, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1334, "external id": 652, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.03289473684210526 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1334, "pid": 0, "tid": "stream 7", "ts": 1624691363572612, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363572604, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 1334, | |
"external id": 652, "external ts": 1624691363572601 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1334, "pid": 618, "tid": 618, "ts": 1624691363572604, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363572608, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 1335, | |
"external id": 652, "external ts": 1624691363572601 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363572640, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1347, "external id": 655, | |
"bytes": 16, "memory bandwidth (GB/s)": 0.013513513513513514 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1347, "pid": 0, "tid": "stream 7", "ts": 1624691363572640, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363572632, "dur": 3, | |
"args": { | |
"cbid": 41, "correlation": 1347, | |
"external id": 655, "external ts": 1624691363572629 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1347, "pid": 618, "tid": 618, "ts": 1624691363572632, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363572636, "dur": 19, | |
"args": { | |
"cbid": 131, "correlation": 1348, | |
"external id": 655, "external ts": 1624691363572629 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363572676, "dur": 2285, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1350, "external id": 638, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 398.57144, | |
"warps per SM": 6377.143, | |
"grid": [22320, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1350, "pid": 0, "tid": "stream 7", "ts": 1624691363572676, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363572662, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 1350, | |
"external id": 638, "external ts": 1624691363572496 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1350, "pid": 618, "tid": 618, "ts": 1624691363572662, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363574962, "dur": 416, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1356, "external id": 666, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 797.1429, | |
"warps per SM": 1594.2858, | |
"grid": [44640, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1356, "pid": 0, "tid": "stream 7", "ts": 1624691363574962, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363572727, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 1356, | |
"external id": 666, "external ts": 1624691363572718 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1356, "pid": 618, "tid": 618, "ts": 1624691363572727, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363575380, "dur": 336, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1369, "external id": 669, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1369, "pid": 0, "tid": "stream 7", "ts": 1624691363575380, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363572804, "dur": 13, | |
"args": { | |
"cbid": 211, "correlation": 1369, | |
"external id": 669, "external ts": 1624691363572794 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1369, "pid": 618, "tid": 618, "ts": 1624691363572804, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::(anonymous namespace)::distribution_elementwise_grid_stride_kernel<unsigned int, 4, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::(anonymous namespace)::distribution_nullary_kernel<float, unsigned int, 4, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1}>(at::TensorIteratorBase&, at::CUDAGeneratorImpl*, curandStatePhilox4_32_10 const&, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#1}::operator()() const::{lambda(unsigned int)#1})::{lambda(int, unsigned int)#1}>(int, at::PhiloxCudaState, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2}, at::native::templates::cuda::random_from_to_kernel<at::CUDAGeneratorImpl*>(at::TensorIteratorBase&, unsigned long, long, at::CUDAGeneratorImpl*)::{lambda()#1}::operator()() const::{lambda()#8}::operator()() const::{lambda(curandStatePhilox4_32_10*)#2})", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363575717, "dur": 337, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1380, "external id": 672, | |
"registers per thread": 54, | |
"shared memory": 0, | |
"blocks per SM": 8.0, | |
"warps per SM": 64.0, | |
"grid": [448, 1, 1], | |
"block": [256, 1, 1], | |
"est. achieved occupancy %": 50 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1380, "pid": 0, "tid": "stream 7", "ts": 1624691363575717, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363572851, "dur": 10, | |
"args": { | |
"cbid": 211, "correlation": 1380, | |
"external id": 672, "external ts": 1624691363572843 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1380, "pid": 618, "tid": 618, "ts": 1624691363572851, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::vectorized_elementwise_kernel<4, at::native::FillFunctor<float>, at::detail::Array<char*, 1> >(int, at::native::FillFunctor<float>, at::detail::Array<char*, 1>)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363576055, "dur": 184, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1388, "external id": 675, | |
"registers per thread": 8, | |
"shared memory": 0, | |
"blocks per SM": 1755.4286, | |
"warps per SM": 3510.8572, | |
"grid": [98304, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1388, "pid": 0, "tid": "stream 7", "ts": 1624691363576055, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363572906, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 1388, | |
"external id": 675, "external ts": 1624691363572900 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1388, "pid": 618, "tid": 618, "ts": 1624691363572906, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363576240, "dur": 405, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1393, "external id": 679, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 932.5714, | |
"warps per SM": 1865.1428, | |
"grid": [52224, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1393, "pid": 0, "tid": "stream 7", "ts": 1624691363576240, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363572937, "dur": 8, | |
"args": { | |
"cbid": 211, "correlation": 1393, | |
"external id": 679, "external ts": 1624691363572930 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1393, "pid": 618, "tid": 618, "ts": 1624691363572937, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363576647, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1414, "external id": 698, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02702702702702703 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1414, "pid": 0, "tid": "stream 7", "ts": 1624691363576647, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363573063, "dur": 10, | |
"args": { | |
"cbid": 41, "correlation": 1414, | |
"external id": 698, "external ts": 1624691363573057 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1414, "pid": 618, "tid": 618, "ts": 1624691363573063, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363573074, "dur": 3579, | |
"args": { | |
"cbid": 131, "correlation": 1415, | |
"external id": 698, "external ts": 1624691363573057 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363576694, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1427, "external id": 701, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02702702702702703 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1427, "pid": 0, "tid": "stream 7", "ts": 1624691363576694, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363576682, "dur": 8, | |
"args": { | |
"cbid": 41, "correlation": 1427, | |
"external id": 701, "external ts": 1624691363576677 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1427, "pid": 618, "tid": 618, "ts": 1624691363576682, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363576691, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 1428, | |
"external id": 701, "external ts": 1624691363576677 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363576725, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1440, "external id": 704, | |
"bytes": 32, "memory bandwidth (GB/s)": 0.02631578947368421 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1440, "pid": 0, "tid": "stream 7", "ts": 1624691363576725, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363576716, "dur": 5, | |
"args": { | |
"cbid": 41, "correlation": 1440, | |
"external id": 704, "external ts": 1624691363576713 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1440, "pid": 618, "tid": 618, "ts": 1624691363576716, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363576722, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 1441, | |
"external id": 704, "external ts": 1624691363576713 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363576809, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1453, "external id": 707, | |
"bytes": 8, "memory bandwidth (GB/s)": 0.006756756756756757 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1453, "pid": 0, "tid": "stream 7", "ts": 1624691363576809, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363576776, "dur": 29, | |
"args": { | |
"cbid": 41, "correlation": 1453, | |
"external id": 707, "external ts": 1624691363576772 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1453, "pid": 618, "tid": 618, "ts": 1624691363576776, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363576805, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 1454, | |
"external id": 707, "external ts": 1624691363576772 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363576834, "dur": 58, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1456, "external id": 690, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 12.857142, | |
"warps per SM": 205.71428, | |
"grid": [720, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1456, "pid": 0, "tid": "stream 7", "ts": 1624691363576834, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363576819, "dur": 13, | |
"args": { | |
"cbid": 211, "correlation": 1456, | |
"external id": 690, "external ts": 1624691363573002 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1456, "pid": 618, "tid": 618, "ts": 1624691363576819, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363576907, "dur": 17, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1462, "external id": 718, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 25.714285, | |
"warps per SM": 51.42857, | |
"grid": [1440, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 80 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1462, "pid": 0, "tid": "stream 7", "ts": 1624691363576907, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363576892, "dur": 12, | |
"args": { | |
"cbid": 211, "correlation": 1462, | |
"external id": 718, "external ts": 1624691363576883 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1462, "pid": 618, "tid": 618, "ts": 1624691363576892, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363577008, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1484, "external id": 737, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.033783783783783786 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1484, "pid": 0, "tid": "stream 7", "ts": 1624691363577008, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363576995, "dur": 9, | |
"args": { | |
"cbid": 41, "correlation": 1484, | |
"external id": 737, "external ts": 1624691363576989 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1484, "pid": 618, "tid": 618, "ts": 1624691363576995, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363577005, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 1485, | |
"external id": 737, "external ts": 1624691363576989 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363577054, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1497, "external id": 740, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.033783783783783786 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1497, "pid": 0, "tid": "stream 7", "ts": 1624691363577054, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363577045, "dur": 5, | |
"args": { | |
"cbid": 41, "correlation": 1497, | |
"external id": 740, "external ts": 1624691363577040 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1497, "pid": 618, "tid": 618, "ts": 1624691363577045, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363577051, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 1498, | |
"external id": 740, "external ts": 1624691363577040 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363577100, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1510, "external id": 743, | |
"bytes": 40, "memory bandwidth (GB/s)": 0.03289473684210526 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1510, "pid": 0, "tid": "stream 7", "ts": 1624691363577100, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363577077, "dur": 19, | |
"args": { | |
"cbid": 41, "correlation": 1510, | |
"external id": 743, "external ts": 1624691363577073 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1510, "pid": 618, "tid": 618, "ts": 1624691363577077, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363577096, "dur": 6, | |
"args": { | |
"cbid": 131, "correlation": 1511, | |
"external id": 743, "external ts": 1624691363577073 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Memcpy", | |
"name": "Memcpy HtoD (Pageable -> Device)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363577128, "dur": 1, | |
"args": { | |
"device": 0, "context": 1, | |
"stream": 7, "correlation": 1523, "external id": 746, | |
"bytes": 16, "memory bandwidth (GB/s)": 0.013513513513513514 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1523, "pid": 0, "tid": "stream 7", "ts": 1624691363577128, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaMemcpyAsync", "pid": 618, "tid": "618", | |
"ts": 1624691363577120, "dur": 4, | |
"args": { | |
"cbid": 41, "correlation": 1523, | |
"external id": 746, "external ts": 1624691363577117 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1523, "pid": 618, "tid": 618, "ts": 1624691363577120, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaStreamSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363577125, "dur": 7, | |
"args": { | |
"cbid": 131, "correlation": 1524, | |
"external id": 746, "external ts": 1624691363577117 | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::flip_cuda_kernel<float>(float*, float*, long, long*, long, long*, long*, long*, long)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363577150, "dur": 2285, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1526, "external id": 729, | |
"registers per thread": 32, | |
"shared memory": 0, | |
"blocks per SM": 398.57144, | |
"warps per SM": 6377.143, | |
"grid": [22320, 1, 1], | |
"block": [512, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1526, "pid": 0, "tid": "stream 7", "ts": 1624691363577150, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363577136, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 1526, | |
"external id": 729, "external ts": 1624691363576950 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1526, "pid": 618, "tid": 618, "ts": 1624691363577136, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Kernel", | |
"name": "void at::native::unrolled_elementwise_kernel<at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast>(int, at::native::copy_device_to_device(at::TensorIterator&, bool)::{lambda()#2}::operator()() const::{lambda()#8}::operator()() const::{lambda(float)#1}, at::detail::Array<char*, 2>, OffsetCalculator<1, unsigned int>, char*, at::native::memory::LoadWithoutCast, at::detail::Array<char*, 2>::StoreWithoutCast)", "pid": 0, "tid": "stream 7", | |
"ts": 1624691363579436, "dur": 417, | |
"args": { | |
"queued": 0, "device": 0, "context": 1, | |
"stream": 7, "correlation": 1532, "external id": 757, | |
"registers per thread": 16, | |
"shared memory": 0, | |
"blocks per SM": 797.1429, | |
"warps per SM": 1594.2858, | |
"grid": [44640, 1, 1], | |
"block": [64, 1, 1], | |
"est. achieved occupancy %": 100 | |
} | |
}, | |
{ | |
"ph": "f", "id": 1532, "pid": 0, "tid": "stream 7", "ts": 1624691363579436, | |
"cat": "async", "name": "launch", "bp": "e" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaLaunchKernel", "pid": 618, "tid": "618", | |
"ts": 1624691363577199, "dur": 11, | |
"args": { | |
"cbid": 211, "correlation": 1532, | |
"external id": 757, "external ts": 1624691363577190 | |
} | |
}, | |
{ | |
"ph": "s", "id": 1532, "pid": 618, "tid": 618, "ts": 1624691363577199, | |
"cat": "async", "name": "launch" | |
}, | |
{ | |
"ph": "X", "cat": "Runtime", | |
"name": "cudaDeviceSynchronize", "pid": 618, "tid": "618", | |
"ts": 1624691363577276, "dur": 2582, | |
"args": { | |
"cbid": 165, "correlation": 1539, | |
"external id": 0, "external ts": 0 | |
} | |
}, | |
{ | |
"name": "process_name", "ph": "M", "ts": 1624691363535292, "pid": 618, "tid": 0, | |
"args": { | |
"name": "python3" | |
} | |
}, | |
{ | |
"name": "process_labels", "ph": "M", "ts": 1624691363535292, "pid": 618, "tid": 0, | |
"args": { | |
"labels": "CPU" | |
} | |
}, | |
{ | |
"name": "process_name", "ph": "M", "ts": 1624691363535292, "pid": 0, "tid": 0, | |
"args": { | |
"name": "python3" | |
} | |
}, | |
{ | |
"name": "process_labels", "ph": "M", "ts": 1624691363535292, "pid": 0, "tid": 0, | |
"args": { | |
"labels": "GPU 0" | |
} | |
}, | |
{ | |
"name": "process_name", "ph": "M", "ts": 1624691363535292, "pid": 1, "tid": 0, | |
"args": { | |
"name": "python3" | |
} | |
}, | |
{ | |
"name": "process_labels", "ph": "M", "ts": 1624691363535292, "pid": 1, "tid": 0, | |
"args": { | |
"labels": "GPU 1" | |
} | |
}, | |
{ | |
"name": "process_name", "ph": "M", "ts": 1624691363535292, "pid": 2, "tid": 0, | |
"args": { | |
"name": "python3" | |
} | |
}, | |
{ | |
"name": "process_labels", "ph": "M", "ts": 1624691363535292, "pid": 2, "tid": 0, | |
"args": { | |
"labels": "GPU 2" | |
} | |
}, | |
{ | |
"name": "process_name", "ph": "M", "ts": 1624691363535292, "pid": 3, "tid": 0, | |
"args": { | |
"name": "python3" | |
} | |
}, | |
{ | |
"name": "process_labels", "ph": "M", "ts": 1624691363535292, "pid": 3, "tid": 0, | |
"args": { | |
"labels": "GPU 3" | |
} | |
}, | |
{ | |
"name": "process_name", "ph": "M", "ts": 1624691363535292, "pid": 4, "tid": 0, | |
"args": { | |
"name": "python3" | |
} | |
}, | |
{ | |
"name": "process_labels", "ph": "M", "ts": 1624691363535292, "pid": 4, "tid": 0, | |
"args": { | |
"labels": "GPU 4" | |
} | |
}, | |
{ | |
"name": "process_name", "ph": "M", "ts": 1624691363535292, "pid": 5, "tid": 0, | |
"args": { | |
"name": "python3" | |
} | |
}, | |
{ | |
"name": "process_labels", "ph": "M", "ts": 1624691363535292, "pid": 5, "tid": 0, | |
"args": { | |
"labels": "GPU 5" | |
} | |
}, | |
{ | |
"name": "process_name", "ph": "M", "ts": 1624691363535292, "pid": 6, "tid": 0, | |
"args": { | |
"name": "python3" | |
} | |
}, | |
{ | |
"name": "process_labels", "ph": "M", "ts": 1624691363535292, "pid": 6, "tid": 0, | |
"args": { | |
"labels": "GPU 6" | |
} | |
}, | |
{ | |
"name": "process_name", "ph": "M", "ts": 1624691363535292, "pid": 7, "tid": 0, | |
"args": { | |
"name": "python3" | |
} | |
}, | |
{ | |
"name": "process_labels", "ph": "M", "ts": 1624691363535292, "pid": 7, "tid": 0, | |
"args": { | |
"labels": "GPU 7" | |
} | |
}, | |
{ | |
"name": "thread_name", "ph": "M", "ts": 1624691363535292, "pid": 618, "tid": "618", | |
"args": { | |
"name": "thread 618 (python3)" | |
} | |
}, | |
{ | |
"ph": "X", "cat": "Trace", "ts": 1624691363535292, "dur": 44579, | |
"pid": "Traces", "tid": "PyTorch Profiler", | |
"name": "PyTorch Profiler (0)", | |
"args": { | |
"Op count": 0 | |
} | |
}, | |
{ | |
"name": "Iteration Start: PyTorch Profiler", "ph": "i", "s": "g", | |
"pid": "Traces", "tid": "Trace PyTorch Profiler", "ts": 1624691363535292 | |
}, | |
{ | |
"name": "Record Window End", "ph": "i", "s": "g", | |
"pid": "", "tid": "", "ts": 1624691363581974 | |
} | |
]} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment