Skip to content

Instantly share code, notes, and snippets.

@Delaunay
Created June 5, 2019 18:39
Show Gist options
  • Save Delaunay/7144dc9e1d1d4a14ee9958b1799c8b64 to your computer and use it in GitHub Desktop.
Save Delaunay/7144dc9e1d1d4a14ee9958b1799c8b64 to your computer and use it in GitHub Desktop.
rcprof_error.output
strace ../rcp/bin/rcprof -o result.atp -p -w . ./regression/polynome/pytorch/run.sh --repeat 10 --number 2 --batch-size 4096
execve("../rcp/bin/rcprof", ["../rcp/bin/rcprof", "-o", "result.atp", "-p", "-w", ".", "./regression/polynome/pytorch/ru"..., "--repeat", "10", "--number", "2", "--batch-size", "4096"], 0x7ffe56d40e50 /* 37 vars */) = 0
brk(NULL) = 0x12e9000
access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory)
access("/etc/ld.so.preload", R_OK) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/etc/ld.so.cache", O_RDONLY|O_CLOEXEC) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=163126, ...}) = 0
mmap(NULL, 163126, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7fd17ab27000
close(3) = 0
access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/lib/x86_64-linux-gnu/librt.so.1", O_RDONLY|O_CLOEXEC) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\0\"\0\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0644, st_size=31680, ...}) = 0
mmap(NULL, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7fd17ab25000
mmap(NULL, 2128864, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7fd17a720000
mprotect(0x7fd17a727000, 2093056, PROT_NONE) = 0
mmap(0x7fd17a926000, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x6000) = 0x7fd17a926000
close(3) = 0
access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/lib/x86_64-linux-gnu/libdl.so.2", O_RDONLY|O_CLOEXEC) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0P\16\0\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0644, st_size=14560, ...}) = 0
mmap(NULL, 2109712, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7fd17a51c000
mprotect(0x7fd17a51f000, 2093056, PROT_NONE) = 0
mmap(0x7fd17a71e000, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x2000) = 0x7fd17a71e000
close(3) = 0
access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/lib/x86_64-linux-gnu/libpthread.so.0", O_RDONLY|O_CLOEXEC) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0000b\0\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=144976, ...}) = 0
mmap(NULL, 2221184, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7fd17a2fd000
mprotect(0x7fd17a317000, 2093056, PROT_NONE) = 0
mmap(0x7fd17a516000, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x19000) = 0x7fd17a516000
mmap(0x7fd17a518000, 13440, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x7fd17a518000
close(3) = 0
access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/usr/lib/x86_64-linux-gnu/libstdc++.so.6", O_RDONLY|O_CLOEXEC) = 3
read(3, "\177ELF\2\1\1\3\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\220\304\10\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0644, st_size=1594864, ...}) = 0
mmap(NULL, 3702848, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7fd179f74000
mprotect(0x7fd17a0ed000, 2097152, PROT_NONE) = 0
mmap(0x7fd17a2ed000, 49152, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x179000) = 0x7fd17a2ed000
mmap(0x7fd17a2f9000, 12352, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x7fd17a2f9000
close(3) = 0
access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/lib/x86_64-linux-gnu/libm.so.6", O_RDONLY|O_CLOEXEC) = 3
read(3, "\177ELF\2\1\1\3\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\200\272\0\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0644, st_size=1700792, ...}) = 0
mmap(NULL, 3789144, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7fd179bd6000
mprotect(0x7fd179d73000, 2093056, PROT_NONE) = 0
mmap(0x7fd179f72000, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x19c000) = 0x7fd179f72000
close(3) = 0
access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/lib/x86_64-linux-gnu/libgcc_s.so.1", O_RDONLY|O_CLOEXEC) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\300*\0\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0644, st_size=96616, ...}) = 0
mmap(NULL, 2192432, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7fd1799be000
mprotect(0x7fd1799d5000, 2093056, PROT_NONE) = 0
mmap(0x7fd179bd4000, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x16000) = 0x7fd179bd4000
close(3) = 0
access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/lib/x86_64-linux-gnu/libc.so.6", O_RDONLY|O_CLOEXEC) = 3
read(3, "\177ELF\2\1\1\3\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\260\34\2\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=2030544, ...}) = 0
mmap(NULL, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7fd17ab23000
mmap(NULL, 4131552, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7fd1795cd000
mprotect(0x7fd1797b4000, 2097152, PROT_NONE) = 0
mmap(0x7fd1799b4000, 24576, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x1e7000) = 0x7fd1799b4000
mmap(0x7fd1799ba000, 15072, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x7fd1799ba000
close(3) = 0
mmap(NULL, 12288, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7fd17ab20000
arch_prctl(ARCH_SET_FS, 0x7fd17ab20740) = 0
mprotect(0x7fd1799b4000, 16384, PROT_READ) = 0
mprotect(0x7fd179bd4000, 4096, PROT_READ) = 0
mprotect(0x7fd179f72000, 4096, PROT_READ) = 0
mprotect(0x7fd17a2ed000, 40960, PROT_READ) = 0
mprotect(0x7fd17a516000, 4096, PROT_READ) = 0
mprotect(0x7fd17a71e000, 4096, PROT_READ) = 0
mprotect(0x7fd17a926000, 4096, PROT_READ) = 0
mprotect(0x81c000, 28672, PROT_READ) = 0
mprotect(0x7fd17ab4f000, 4096, PROT_READ) = 0
munmap(0x7fd17ab27000, 163126) = 0
set_tid_address(0x7fd17ab20a10) = 4776
set_robust_list(0x7fd17ab20a20, 24) = 0
rt_sigaction(SIGRTMIN, {sa_handler=0x7fd17a302cb0, sa_mask=[], sa_flags=SA_RESTORER|SA_SIGINFO, sa_restorer=0x7fd17a30f890}, NULL, 8) = 0
rt_sigaction(SIGRT_1, {sa_handler=0x7fd17a302d50, sa_mask=[], sa_flags=SA_RESTORER|SA_RESTART|SA_SIGINFO, sa_restorer=0x7fd17a30f890}, NULL, 8) = 0
rt_sigprocmask(SIG_UNBLOCK, [RTMIN RT_1], NULL, 8) = 0
prlimit64(0, RLIMIT_STACK, NULL, {rlim_cur=8192*1024, rlim_max=RLIM64_INFINITY}) = 0
brk(NULL) = 0x12e9000
brk(0x130a000) = 0x130a000
futex(0x7fd17a2fa09c, FUTEX_WAKE_PRIVATE, 2147483647) = 0
futex(0x7fd17a2fa0a8, FUTEX_WAKE_PRIVATE, 2147483647) = 0
brk(0x132b000) = 0x132b000
brk(0x134c000) = 0x134c000
futex(0x7fd17a71f0c8, FUTEX_WAKE_PRIVATE, 2147483647) = 0
mmap(NULL, 10489856, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7fd178bcc000
getcwd("/home/mila/source/training", 128) = 27
openat(AT_FDCWD, "/usr/lib/locale/locale-archive", O_RDONLY|O_CLOEXEC) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=10281936, ...}) = 0
mmap(NULL, 10281936, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7fd1781fd000
close(3) = 0
openat(AT_FDCWD, "/usr/lib/x86_64-linux-gnu/gconv/gconv-modules.cache", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=26376, ...}) = 0
mmap(NULL, 26376, PROT_READ, MAP_SHARED, 3, 0) = 0x7fd17ab48000
close(3) = 0
futex(0x7fd1799b9a08, FUTEX_WAKE_PRIVATE, 2147483647) = 0
getcwd("/home/mila/source/training", 4096) = 27
readlink("/proc/self/exe", "/home/mila/source/rcp/bin/rcprof", 4095) = 32
openat(AT_FDCWD, "/home/mila/source/rcp/bin/rcprof", O_RDONLY) = 3
lseek(3, 0, SEEK_END) = 6633648
lseek(3, 0, SEEK_CUR) = 6633648
lseek(3, 0, SEEK_SET) = 0
read(3, "\177ELF\2\1\1\3\0\0\0\0\0\0\0\0\2\0>\0\1\0\0\0\375BE\0\0\0\0\0"..., 8191) = 8191
close(3) = 0
stat("/home/mila/source/training", {st_mode=S_IFDIR|0777, st_size=4096, ...}) = 0
openat(AT_FDCWD, "/home/mila/", O_RDONLY|O_NONBLOCK|O_CLOEXEC|O_DIRECTORY) = 3
fstat(3, {st_mode=S_IFDIR|0777, st_size=4096, ...}) = 0
getdents(3, /* 37 entries */, 32768) = 1176
getdents(3, /* 0 entries */, 32768) = 0
close(3) = 0
readlink("/proc/self/exe", "/home/mila/source/rcp/bin/rcprof", 4095) = 32
getpid() = 4776
stat("/home/mila/source/training/./regression/polynome/pytorch/run.sh", {st_mode=S_IFREG|0777, st_size=123, ...}) = 0
openat(AT_FDCWD, "/home/mila/source/rcp/bin/libRCPCLProfileAgent.so", O_RDONLY) = 3
close(3) = 0
openat(AT_FDCWD, "/home/mila/.rcpdata", O_WRONLY|O_CREAT|O_TRUNC, 0666) = 3
write(3, "VersionMajor=5\n", 15) = 15
write(3, "VersionMinor=6\n", 15) = 15
write(3, "CmdArgs=--repeat 10 --number 2 -"..., 49) = 49
write(3, "OutputFile=/home/mila/source/tra"..., 49) = 49
write(3, "WorkingDir=.\n", 13) = 13
write(3, "SessionName=\n", 13) = 13
write(3, "DLLPath=/home/mila/source/rcp/bi"..., 35) = 35
write(3, "CounterFile=\n", 13) = 13
write(3, "KernelFile=\n", 12) = 12
write(3, "APIFilterFile=\n", 15) = 15
write(3, "Verbose=False\n", 14) = 14
write(3, "StartDisabled=False\n", 20) = 20
write(3, "OutputIL=False\n", 15) = 15
write(3, "OutputHSAIL=False\n", 18) = 18
write(3, "OutputISA=False\n", 16) = 16
write(3, "OutputCL=False\n", 15) = 15
write(3, "PerfCounter=True\n", 17) = 17
write(3, "Trace=False\n", 12) = 12
write(3, "HSATrace=False\n", 15) = 15
write(3, "HSAPMC=False\n", 13) = 13
write(3, "SinglePassPMC=False\n", 20) = 20
write(3, "GPUTimePMC=True\n", 16) = 16
write(3, "TimeOut=True\n", 13) = 13
write(3, "QueryRetStat=False\n", 19) = 19
write(3, "CollapseClGetEventInfo=True\n", 28) = 28
write(3, "Interval=100\n", 13) = 13
write(3, "Separator=,\n", 12) = 12
write(3, "UserTimerIsUsed=False\n", 22) = 22
write(3, "UserTimerDLLFileName=\n", 22) = 22
write(3, "UserTimerFunctionName=\n", 23) = 23
write(3, "UserTimerInitFunctionName=\n", 27) = 27
write(3, "UserTimerDestroyFunctionName=\n", 30) = 30
write(3, "UserPMC=False\n", 14) = 14
write(3, "CompatibilityMode=False\n", 24) = 24
write(3, "UserPMCLibPath=\n", 16) = 16
write(3, "StackTrace=False\n", 17) = 17
write(3, "MaxNumOfAPICalls=1000000\n", 25) = 25
write(3, "MaxKernels=100000\n", 18) = 18
write(3, "KernelOccupancy=False\n", 22) = 22
write(3, "GMTrace=False\n", 14) = 14
write(3, "FullEnvBlock=False\n", 19) = 19
write(3, "StartDelayEnabled=False\n", 24) = 24
write(3, "ProfilerDurationEnabled=False\n", 30) = 30
write(3, "StartDelaySeconds=0\n", 20) = 20
write(3, "ProfileDuration=0\n", 18) = 18
write(3, "ForceSingleGPU=False\n", 21) = 21
write(3, "ForcedGpuIndex=0\n", 17) = 17
write(3, "AqlPacketTracing=False\n", 23) = 23
write(3, "HSADisableKernelDemangle=False\n", 31) = 31
write(3, "NoHSATransferTime=False\n", 24) = 24
close(3) = 0
openat(AT_FDCWD, "/home/mila/.rcpdata.amdtperfmarker", O_WRONLY|O_CREAT|O_TRUNC, 0666) = 3
write(3, "TimeOut=True\n", 13) = 13
write(3, "PerfMarkerTempFileBaseName=/home"..., 39) = 39
write(3, "PerfMarkerOutputFileName=/home/m"..., 74) = 74
close(3) = 0
unlink("/home/mila/.rcpcltable") = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/home/mila/source/training/./regression/polynome/pytorch/run.sh", O_RDONLY) = 3
lseek(3, 0, SEEK_END) = 123
lseek(3, 0, SEEK_CUR) = 123
lseek(3, 0, SEEK_SET) = 0
read(3, "#!/bin/bash\n\nSCRIPT_PATH=$(dirna"..., 8191) = 123
close(3) = 0
stat("/home/mila/source/training/./regression/polynome/pytorch/run.sh", {st_mode=S_IFREG|0777, st_size=123, ...}) = 0
stat("/sys/class/drm/card0", {st_mode=S_IFDIR|0755, st_size=0, ...}) = 0
stat("/sys/class/drm/card0/device/power_dpm_force_performance_level", 0x7ffed9d13b00) = -1 ENOENT (No such file or directory)
clone(child_stack=NULL, flags=CLONE_CHILD_CLEARTID|CLONE_CHILD_SETTID|SIGCHLD, child_tidptr=0x7fd17ab20a10) = 4777
wait4(4777, No module named 'comet_ml'
--------------------------------------------------------------------------------
batch_size: 4096
cuda: True
workers: 0
seed: 0
devices: 1
jr_id: 0
vcd: 0
cpu_cores: 0
repeat: 10
number: 2
report: /home/mila/datasets/mlperf/output/bench_results
--------------------------------------------------------------------------------
[ 0/ 10] | ETA: 6.20 min | Batch Loss 15.0591
[ 1/ 10] | ETA: 0.00 min | Batch Loss 15.5790
[ 2/ 10] | ETA: 0.00 min | Batch Loss 14.7557
[ 3/ 10] | ETA: 0.00 min | Batch Loss 14.6686
[ 4/ 10] | ETA: 0.00 min | Batch Loss 15.5824
[ 5/ 10] | ETA: 0.00 min | Batch Loss 14.5039
[ 6/ 10] | ETA: 0.00 min | Batch Loss 14.6122
[ 7/ 10] | ETA: 0.00 min | Batch Loss 15.1097
[ 8/ 10] | ETA: 0.00 min | Batch Loss 15.5762
[ 9/ 10] | ETA: 0.00 min | Batch Loss 13.4211
==> Learned function: y = -0.07 x^4 +0.35 x^3 -0.49 x^2 +0.13 x^1 -0.28
==> Actual function: y = -0.73 x^4 -1.51 x^3 -4.99 x^2 +4.83 x^1 -3.89
--------------------------------------------------------------------------------
{
"batch_loss": [
15.186650276184082,
15.059094429016113,
15.376214027404785,
15.579010963439941,
15.46472454071045,
14.755709648132324,
15.025228500366211,
14.668600082397461,
12.463979721069336,
15.582362174987793,
14.454885482788086,
14.503859519958496,
14.339473724365234,
14.612238883972168,
13.658197402954102,
15.109685897827148,
13.81052017211914,
15.576239585876465,
14.470664024353027,
13.421065330505371
],
"batch_size": 4096,
"cpu_cores": 10,
"cuda": true,
"devices": 1,
"epoch_loss": [],
"gpu": "Vega 20",
"hostname": "RTX1",
"jr_id": 0,
"metrics": {},
"name": "regression_polynome_pytorch_main.py",
"number": 2,
"repeat": 10,
"train": {
"avg": 0.004000425338745117,
"count": 1,
"max": 0.004000425338745117,
"min": 0.004000425338745117,
"sd": 0.0,
"unit": "s"
},
"train_item": {
"avg": 2047782.249716908,
"max": 2047782.249716908,
"min": 2047782.249716908,
"range": 0.0,
"unit": "items/sec"
},
"unique_id": "87846bd3bd589384511d515fa2630547d784bec4d59faa14b89d870fb95ab6a3",
"vcd": 0,
"version": "308a5984e9",
"workers": 0
}
--------------------------------------------------------------------------------
[{WIFEXITED(s) && WEXITSTATUS(s) == 0}], 0, NULL) = 4777
--- SIGCHLD {si_signo=SIGCHLD, si_code=CLD_EXITED, si_pid=4777, si_uid=1000, si_status=0, si_utime=3597, si_stime=1596} ---
readlink("/proc/self/exe", "/home/mila/source/rcp/bin/rcprof", 4095) = 32
clone(child_stack=NULL, flags=CLONE_CHILD_CLEARTID|CLONE_CHILD_SETTID|SIGCHLD, child_tidptr=0x7fd17ab20a10) = 4941
wait4(4941, NULL, 0, NULL) = 4941
--- SIGCHLD {si_signo=SIGCHLD, si_code=CLD_EXITED, si_pid=4941, si_uid=1000, si_status=127, si_utime=0, si_stime=0} ---
rt_sigaction(SIGINT, {sa_handler=SIG_DFL, sa_mask=[INT], sa_flags=SA_RESTORER|SA_RESTART, sa_restorer=0x7fd17960bf20}, {sa_handler=SIG_DFL, sa_mask=[], sa_flags=0}, 8) = 0
rt_sigaction(SIGINT, {sa_handler=SIG_DFL, sa_mask=[INT], sa_flags=SA_RESTORER|SA_RESTART, sa_restorer=0x7fd17960bf20}, {sa_handler=SIG_DFL, sa_mask=[INT], sa_flags=SA_RESTORER|SA_RESTART, sa_restorer=0x7fd17960bf20}, 8) = 0
openat(AT_FDCWD, "/home/mila/source/training/result.csv", O_RDONLY) = -1 ENOENT (No such file or directory)
fstat(1, {st_mode=S_IFCHR|0620, st_rdev=makedev(136, 5), ...}) = 0
write(1, "Failed to generate profile resul"..., 73Failed to generate profile result /home/mila/source/training/result.csv.
) = 73
unlink("/home/mila/.rcpdata") = 0
unlink("/home/mila/.rcpdata.amdtperfmarker") = 0
exit_group(0) = ?
+++ exited with 0 +++
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment