Created
May 24, 2023 16:08
-
-
Save liuliu/f80ceaebe36b177c4d50598ad27c782b to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
CCV_NNC_GEMM_FORWARD [1]: [3] -> [1] (0) | |
|-> 1. 0x1438bd420 (0x285d90fc0:0) [2x320] 0.517578 0.953613 -0.921875 .. | |
|-> 2. 0x1438bd570 (0x285d841c0:0) [1280x320] -0.001888 0.001598 0.001110 .. | |
|-> 3. 0x1438bd5e0 (0x285d84280:0) [1280] -0.019775 0.008278 0.010788 .. | |
|<- 1. 0x1438a0000 (0x285da5600:0) [2x1280] 0.044556 -0.020798 0.078064 .. | |
CCV_NNC_SWISH_FORWARD [2]: [1] -> [1] (0) | |
|-> 1. 0x1438a0000 (0x285da5600:0) [2x1280] 0.044556 -0.020798 0.078064 .. | |
|<- 1. 0x1438a0000 (0x285da5600:0) [2x1280] 0.022781 -0.010292 0.040558 .. | |
CCV_NNC_GEMM_FORWARD [3]: [3] -> [1] (0) | |
|-> 1. 0x1438a0000 (0x285da5600:0) [2x1280] 0.022781 -0.010292 0.040558 .. | |
|-> 2. 0x1438bd650 (0x285d84b80:0) [1280x1280] 0.002268 0.001678 -0.003374 .. | |
|-> 3. 0x1438bd6c0 (0x285d85300:0) [1280] 0.006294 0.001841 -0.010101 .. | |
|<- 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.068420 -0.037476 -0.015541 .. | |
CCV_NNC_CONVOLUTION_FORWARD [4]: [3] -> [1] (1) | |
Wait: (1, 0) | |
|-> 1. 0x1438bd3b0 (0x285d90d00:0) [2x64x64x4] 1.300781 0.501465 0.404785 .. | |
|-> 2. 0x1438bd730 (0x285d85340:0) [320x4x3x3] -0.030701 0.085693 0.096252 .. | |
|-> 3. 0x1438bd7a0 (0x285d84440:0) [320] -0.096619 -0.114014 0.106323 .. | |
|<- 1. 0x14390db70 (0x285f78ac0:0) [2x64x64x320] -0.319092 -0.406982 0.225342 .. | |
CCV_NNC_GEMM_FORWARD [5]: [2] -> [1] (2) | |
Wait: (2, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438be290 (0x285d842c0:0) [320x768] 0.050140 0.022263 -0.017365 .. | |
|<- 1. 0x1438a1500 (0x285da5b80:0) [2x133x320] -0.231689 -0.019897 8.742188 .. | |
CCV_NNC_TRANSPOSE_FORWARD [6]: [1] -> [1] (2) | |
|-> 1. 0x1438d4ba0 (0x285da5b80:0) [2x133x8x40] -0.231689 -0.019897 8.742188 .. | |
|<- 1. 0x1438a1570 (0x285da5bc0:0) [2x8x133x40] -0.231689 -0.019897 8.742188 .. | |
Emit: (2, 6) | |
CCV_NNC_GEMM_FORWARD [7]: [2] -> [1] (3) | |
Wait: (3, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438be300 (0x285d84380:0) [320x768] -0.017517 -0.007912 -0.000061 .. | |
|<- 1. 0x1438a16c0 (0x285da5c40:0) [2x133x320] 0.030670 -0.073059 -0.036987 .. | |
CCV_NNC_TRANSPOSE_FORWARD [8]: [1] -> [1] (3) | |
|-> 1. 0x1438d4cf0 (0x285da5c40:0) [2x133x8x40] 0.030670 -0.073059 -0.036987 .. | |
|<- 1. 0x1438a1730 (0x285da5c80:0) [2x8x133x40] 0.030670 -0.073059 -0.036987 .. | |
Emit: (3, 7) | |
CCV_NNC_GEMM_FORWARD [9]: [2] -> [1] (4) | |
Wait: (4, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438bf330 (0x285d85800:0) [320x768] 0.037933 -0.010902 -0.072021 .. | |
|<- 1. 0x1438a3020 (0x285da5f00:0) [2x133x320] -0.131592 -0.084351 1.820312 .. | |
CCV_NNC_TRANSPOSE_FORWARD [10]: [1] -> [1] (4) | |
|-> 1. 0x1438d8b30 (0x285da5f00:0) [2x133x8x40] -0.131592 -0.084351 1.820312 .. | |
|<- 1. 0x1438a3090 (0x285da5f40:0) [2x8x133x40] -0.131592 -0.084351 1.820312 .. | |
Emit: (4, 14) | |
CCV_NNC_GEMM_FORWARD [11]: [2] -> [1] (5) | |
Wait: (5, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438bf3a0 (0x285d85840:0) [320x768] 0.004913 -0.008904 -0.008820 .. | |
|<- 1. 0x1438a31e0 (0x285da5f80:0) [2x133x320] 0.014427 -0.034271 -0.016800 .. | |
CCV_NNC_TRANSPOSE_FORWARD [12]: [1] -> [1] (5) | |
|-> 1. 0x1438d8c80 (0x285da5f80:0) [2x133x8x40] 0.014427 -0.034271 -0.016800 .. | |
|<- 1. 0x1438a3250 (0x285da5fc0:0) [2x8x133x40] 0.014427 -0.034271 -0.016800 .. | |
Emit: (5, 15) | |
CCV_NNC_GEMM_FORWARD [13]: [2] -> [1] (6) | |
Wait: (6, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c0590 (0x285d86280:0) [640x768] -0.077393 0.060516 -0.058655 .. | |
|<- 1. 0x1438a4b40 (0x285da6540:0) [2x133x640] 0.370605 -0.183228 -1.733398 .. | |
CCV_NNC_TRANSPOSE_FORWARD [14]: [1] -> [1] (6) | |
|-> 1. 0x1438dcac0 (0x285da6540:0) [2x133x8x80] 0.370605 -0.183228 -1.733398 .. | |
|<- 1. 0x1438a4bb0 (0x285da6580:0) [2x8x133x80] 0.370605 -0.183228 -1.733398 .. | |
Emit: (6, 24) | |
CCV_NNC_GEMM_FORWARD [15]: [2] -> [1] (7) | |
Wait: (7, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c0600 (0x285d862c0:0) [640x768] -0.010658 -0.064941 -0.039856 .. | |
|<- 1. 0x1438a4d00 (0x285da6600:0) [2x133x640] 0.013397 0.017731 0.048828 .. | |
CCV_NNC_TRANSPOSE_FORWARD [16]: [1] -> [1] (7) | |
|-> 1. 0x1438dcc10 (0x285da6600:0) [2x133x8x80] 0.013397 0.017731 0.048828 .. | |
|<- 1. 0x1438a4d70 (0x285da6640:0) [2x8x133x80] 0.013397 0.017731 0.048828 .. | |
Emit: (7, 25) | |
CCV_NNC_GEMM_FORWARD [17]: [2] -> [1] (8) | |
Wait: (8, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c1630 (0x285d86c00:0) [640x768] 0.046356 0.060303 0.039642 .. | |
|<- 1. 0x1438a6660 (0x285da6b40:0) [2x133x640] -0.381836 -0.479736 0.379883 .. | |
CCV_NNC_TRANSPOSE_FORWARD [18]: [1] -> [1] (8) | |
|-> 1. 0x1438e0a50 (0x285da6b40:0) [2x133x8x80] -0.381836 -0.479736 0.379883 .. | |
|<- 1. 0x1438a66d0 (0x285da6b80:0) [2x8x133x80] -0.381836 -0.479736 0.379883 .. | |
Emit: (8, 32) | |
CCV_NNC_GEMM_FORWARD [19]: [2] -> [1] (9) | |
Wait: (9, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c16a0 (0x285d86c40:0) [640x768] -0.002068 0.001761 0.008499 .. | |
|<- 1. 0x1438a6820 (0x285da6c00:0) [2x133x640] 0.031586 0.014740 -0.047302 .. | |
CCV_NNC_TRANSPOSE_FORWARD [20]: [1] -> [1] (9) | |
|-> 1. 0x1438e0ba0 (0x285da6c00:0) [2x133x8x80] 0.031586 0.014740 -0.047302 .. | |
|<- 1. 0x1438a6890 (0x285da6c40:0) [2x8x133x80] 0.031586 0.014740 -0.047302 .. | |
Emit: (9, 33) | |
CCV_NNC_GEMM_FORWARD [21]: [2] -> [1] (10) | |
Wait: (10, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c2890 (0x285d87680:0) [1280x768] 0.049530 -0.013351 0.006092 .. | |
|<- 1. 0x1438a8180 (0x285da7180:0) [2x133x1280] -0.213623 0.277832 -0.094299 .. | |
CCV_NNC_TRANSPOSE_FORWARD [22]: [1] -> [1] (10) | |
|-> 1. 0x1438e49e0 (0x285da7180:0) [2x133x8x160] -0.213623 0.277832 -0.094299 .. | |
|<- 1. 0x1438a81f0 (0x285da71c0:0) [2x8x133x160] -0.213623 0.277832 -0.094299 .. | |
Emit: (10, 42) | |
CCV_NNC_GEMM_FORWARD [23]: [2] -> [1] (11) | |
Wait: (11, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c2900 (0x285d876c0:0) [1280x768] -0.006660 -0.087158 0.025131 .. | |
|<- 1. 0x1438a8340 (0x285da7240:0) [2x133x1280] -0.006889 -0.040039 0.008888 .. | |
CCV_NNC_TRANSPOSE_FORWARD [24]: [1] -> [1] (11) | |
|-> 1. 0x1438e4b30 (0x285da7240:0) [2x133x8x160] -0.006889 -0.040039 0.008888 .. | |
|<- 1. 0x1438a83b0 (0x285da7280:0) [2x8x133x160] -0.006889 -0.040039 0.008888 .. | |
Emit: (11, 43) | |
CCV_NNC_GEMM_FORWARD [25]: [2] -> [1] (12) | |
Wait: (12, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c3930 (0x285d8ce00:0) [1280x768] 0.059662 0.042114 0.031982 .. | |
|<- 1. 0x1438a9ca0 (0x285da7640:0) [2x133x1280] 0.191650 0.108704 -0.219238 .. | |
CCV_NNC_TRANSPOSE_FORWARD [26]: [1] -> [1] (12) | |
|-> 1. 0x1438e8970 (0x285da7640:0) [2x133x8x160] 0.191650 0.108704 -0.219238 .. | |
|<- 1. 0x1438a9d10 (0x285da7680:0) [2x8x133x160] 0.191650 0.108704 -0.219238 .. | |
Emit: (12, 50) | |
CCV_NNC_GEMM_FORWARD [27]: [2] -> [1] (13) | |
Wait: (13, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c39a0 (0x285d8f800:0) [1280x768] 0.045746 0.000335 -0.000800 .. | |
|<- 1. 0x1438a9e60 (0x285da7700:0) [2x133x1280] -0.091675 0.026260 0.035645 .. | |
CCV_NNC_TRANSPOSE_FORWARD [28]: [1] -> [1] (13) | |
|-> 1. 0x1438e8ac0 (0x285da7700:0) [2x133x8x160] -0.091675 0.026260 0.035645 .. | |
|<- 1. 0x1438a9ed0 (0x285da7740:0) [2x8x133x160] -0.091675 0.026260 0.035645 .. | |
Emit: (13, 51) | |
CCV_NNC_GEMM_FORWARD [29]: [2] -> [1] (14) | |
Wait: (14, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c5370 (0x285e696c0:0) [1280x768] 0.050659 -0.016159 -0.011871 .. | |
|<- 1. 0x1438abfa0 (0x285da7f80:0) [2x133x1280] -0.178467 0.800293 -1.226562 .. | |
CCV_NNC_TRANSPOSE_FORWARD [30]: [1] -> [1] (14) | |
|-> 1. 0x1438ec9e0 (0x285da7f80:0) [2x133x8x160] -0.178467 0.800293 -1.226562 .. | |
|<- 1. 0x1438ac010 (0x285da7fc0:0) [2x8x133x160] -0.178467 0.800293 -1.226562 .. | |
Emit: (14, 60) | |
CCV_NNC_GEMM_FORWARD [31]: [2] -> [1] (15) | |
Wait: (15, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c53e0 (0x285e6a280:0) [1280x768] 0.026581 -0.126099 0.020554 .. | |
|<- 1. 0x1438ac160 (0x285d850c0:0) [2x133x1280] -0.026199 -0.083679 -0.066772 .. | |
CCV_NNC_TRANSPOSE_FORWARD [32]: [1] -> [1] (15) | |
|-> 1. 0x1438ecb30 (0x285d850c0:0) [2x133x8x160] -0.026199 -0.083679 -0.066772 .. | |
|<- 1. 0x1438ac1d0 (0x285d84540:0) [2x8x133x160] -0.026199 -0.083679 -0.066772 .. | |
Emit: (15, 61) | |
CCV_NNC_GEMM_FORWARD [33]: [2] -> [1] (16) | |
Wait: (16, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c79f0 (0x285d98e40:0) [1280x768] 0.005672 0.008583 -0.108887 .. | |
|<- 1. 0x1438aee00 (0x285d833c0:0) [2x133x1280] -0.494141 0.059296 0.135498 .. | |
CCV_NNC_TRANSPOSE_FORWARD [34]: [1] -> [1] (16) | |
|-> 1. 0x1438f10b0 (0x285d833c0:0) [2x133x8x160] -0.494141 0.059296 0.135498 .. | |
|<- 1. 0x1438aee70 (0x285d83e40:0) [2x8x133x160] -0.494141 0.059296 0.135498 .. | |
Emit: (16, 80) | |
CCV_NNC_GEMM_FORWARD [35]: [2] -> [1] (17) | |
Wait: (17, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c7a60 (0x285d98e80:0) [1280x768] 0.018356 0.016327 -0.031113 .. | |
|<- 1. 0x1438aefc0 (0x285d83f80:0) [2x133x1280] 0.102844 -0.059814 -0.027191 .. | |
CCV_NNC_TRANSPOSE_FORWARD [36]: [1] -> [1] (17) | |
|-> 1. 0x1438f1200 (0x285d83f80:0) [2x133x8x160] 0.102844 -0.059814 -0.027191 .. | |
|<- 1. 0x1438af030 (0x285d83ec0:0) [2x8x133x160] 0.102844 -0.059814 -0.027191 .. | |
Emit: (17, 81) | |
CCV_NNC_GEMM_FORWARD [37]: [2] -> [1] (18) | |
Wait: (18, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c8b70 (0x285d99840:0) [1280x768] -0.063782 -0.024292 0.022858 .. | |
|<- 1. 0x1438b0990 (0x285d83d40:0) [2x133x1280] 0.121155 0.245972 -0.240967 .. | |
CCV_NNC_TRANSPOSE_FORWARD [38]: [1] -> [1] (18) | |
|-> 1. 0x1438f51a0 (0x285d83d40:0) [2x133x8x160] 0.121155 0.245972 -0.240967 .. | |
|<- 1. 0x1438b0a00 (0x285d82b80:0) [2x8x133x160] 0.121155 0.245972 -0.240967 .. | |
Emit: (18, 90) | |
CCV_NNC_GEMM_FORWARD [39]: [2] -> [1] (19) | |
Wait: (19, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c8be0 (0x285d99880:0) [1280x768] -0.043610 0.111389 -0.029739 .. | |
|<- 1. 0x1438b0b50 (0x285d80ec0:0) [2x133x1280] 0.004066 -0.018509 -0.005821 .. | |
CCV_NNC_TRANSPOSE_FORWARD [40]: [1] -> [1] (19) | |
|-> 1. 0x1438f52f0 (0x285d80ec0:0) [2x133x8x160] 0.004066 -0.018509 -0.005821 .. | |
|<- 1. 0x1438b0bc0 (0x285d8f740:0) [2x8x133x160] 0.004066 -0.018509 -0.005821 .. | |
Emit: (19, 91) | |
CCV_NNC_GEMM_FORWARD [41]: [2] -> [1] (20) | |
Wait: (20, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c9cf0 (0x285d9a240:0) [1280x768] -0.001761 0.075928 0.115906 .. | |
|<- 1. 0x1438b2520 (0x285d89bc0:0) [2x133x1280] 0.334717 -0.014442 -0.148804 .. | |
CCV_NNC_TRANSPOSE_FORWARD [42]: [1] -> [1] (20) | |
|-> 1. 0x1438f9290 (0x285d89bc0:0) [2x133x8x160] 0.334717 -0.014442 -0.148804 .. | |
|<- 1. 0x1438b2590 (0x285d89340:0) [2x8x133x160] 0.334717 -0.014442 -0.148804 .. | |
Emit: (20, 100) | |
CCV_NNC_GEMM_FORWARD [43]: [2] -> [1] (21) | |
Wait: (21, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438c9d60 (0x285d9a280:0) [1280x768] -0.041809 -0.037811 0.074951 .. | |
|<- 1. 0x1438b26e0 (0x285d8ac40:0) [2x133x1280] 0.031281 0.007065 -0.043945 .. | |
CCV_NNC_TRANSPOSE_FORWARD [44]: [1] -> [1] (21) | |
|-> 1. 0x1438f93e0 (0x285d8ac40:0) [2x133x8x160] 0.031281 0.007065 -0.043945 .. | |
|<- 1. 0x1438b2750 (0x285d89c80:0) [2x8x133x160] 0.031281 0.007065 -0.043945 .. | |
Emit: (21, 101) | |
CCV_NNC_GEMM_FORWARD [45]: [2] -> [1] (22) | |
Wait: (22, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438caf50 (0x285d9acc0:0) [640x768] -0.113464 0.034241 -0.047577 .. | |
|<- 1. 0x1438b4120 (0x285df6b80:0) [2x133x640] -0.624512 0.743164 -0.471924 .. | |
CCV_NNC_TRANSPOSE_FORWARD [46]: [1] -> [1] (22) | |
|-> 1. 0x1438fd380 (0x285df6b80:0) [2x133x8x80] -0.624512 0.743164 -0.471924 .. | |
|<- 1. 0x1438b4190 (0x285df3a00:0) [2x8x133x80] -0.624512 0.743164 -0.471924 .. | |
Emit: (22, 110) | |
CCV_NNC_GEMM_FORWARD [47]: [2] -> [1] (23) | |
Wait: (23, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438cafc0 (0x285d9ad00:0) [640x768] -0.052460 -0.007027 -0.031403 .. | |
|<- 1. 0x1438b42e0 (0x285df3b40:0) [2x133x640] -0.003769 -0.020844 -0.024673 .. | |
CCV_NNC_TRANSPOSE_FORWARD [48]: [1] -> [1] (23) | |
|-> 1. 0x1438fd4d0 (0x285df3b40:0) [2x133x8x80] -0.003769 -0.020844 -0.024673 .. | |
|<- 1. 0x1438b4350 (0x285df34c0:0) [2x8x133x80] -0.003769 -0.020844 -0.024673 .. | |
Emit: (23, 111) | |
CCV_NNC_GEMM_FORWARD [49]: [2] -> [1] (24) | |
Wait: (24, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438cc0d0 (0x285d9b6c0:0) [640x768] -0.041046 -0.033722 -0.042297 .. | |
|<- 1. 0x1438b5cb0 (0x285df3480:0) [2x133x640] -0.090027 0.466309 0.978516 .. | |
CCV_NNC_TRANSPOSE_FORWARD [50]: [1] -> [1] (24) | |
|-> 1. 0x143901470 (0x285df3480:0) [2x133x8x80] -0.090027 0.466309 0.978516 .. | |
|<- 1. 0x1438b5d20 (0x285df3940:0) [2x8x133x80] -0.090027 0.466309 0.978516 .. | |
Emit: (24, 120) | |
CCV_NNC_GEMM_FORWARD [51]: [2] -> [1] (25) | |
Wait: (25, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438cc140 (0x285d9b700:0) [640x768] -0.016235 -0.003174 -0.023041 .. | |
|<- 1. 0x1438b5e70 (0x285df0a40:0) [2x133x640] -0.021072 0.016312 -0.006813 .. | |
CCV_NNC_TRANSPOSE_FORWARD [52]: [1] -> [1] (25) | |
|-> 1. 0x1439015c0 (0x285df0a40:0) [2x133x8x80] -0.021072 0.016312 -0.006813 .. | |
|<- 1. 0x1438b5ee0 (0x285df0740:0) [2x8x133x80] -0.021072 0.016312 -0.006813 .. | |
Emit: (25, 121) | |
CCV_NNC_GEMM_FORWARD [53]: [2] -> [1] (26) | |
Wait: (26, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438cd250 (0x285d9c0c0:0) [640x768] 0.073486 0.011406 -0.008133 .. | |
|<- 1. 0x1438b7840 (0x285de5780:0) [2x133x640] -0.396484 -0.269043 -0.424072 .. | |
CCV_NNC_TRANSPOSE_FORWARD [54]: [1] -> [1] (26) | |
|-> 1. 0x143905560 (0x285de5780:0) [2x133x8x80] -0.396484 -0.269043 -0.424072 .. | |
|<- 1. 0x1438b78b0 (0x285de7a00:0) [2x8x133x80] -0.396484 -0.269043 -0.424072 .. | |
Emit: (26, 130) | |
CCV_NNC_GEMM_FORWARD [55]: [2] -> [1] (27) | |
Wait: (27, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438cd2c0 (0x285d9c100:0) [640x768] 0.004990 0.025543 0.019318 .. | |
|<- 1. 0x1438b7a00 (0x285de0dc0:0) [2x133x640] 0.022568 -0.025116 -0.027023 .. | |
CCV_NNC_TRANSPOSE_FORWARD [56]: [1] -> [1] (27) | |
|-> 1. 0x1439056b0 (0x285de0dc0:0) [2x133x8x80] 0.022568 -0.025116 -0.027023 .. | |
|<- 1. 0x1438b7a70 (0x285de0e80:0) [2x8x133x80] 0.022568 -0.025116 -0.027023 .. | |
Emit: (27, 131) | |
CCV_NNC_GEMM_FORWARD [57]: [2] -> [1] (28) | |
Wait: (28, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438ce4b0 (0x285d9cb40:0) [320x768] -0.017227 0.046448 0.083008 .. | |
|<- 1. 0x1438b9440 (0x285e2f180:0) [2x133x320] 2.285156 0.156494 -1.203125 .. | |
CCV_NNC_TRANSPOSE_FORWARD [58]: [1] -> [1] (28) | |
|-> 1. 0x143909650 (0x285e2f180:0) [2x133x8x40] 2.285156 0.156494 -1.203125 .. | |
|<- 1. 0x1438b94b0 (0x285e2f300:0) [2x8x133x40] 2.285156 0.156494 -1.203125 .. | |
Emit: (28, 140) | |
CCV_NNC_GEMM_FORWARD [59]: [2] -> [1] (29) | |
Wait: (29, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438ce520 (0x285d9cb80:0) [320x768] 0.019409 0.018814 0.000233 .. | |
|<- 1. 0x1438b9600 (0x285e2fa40:0) [2x133x320] -0.004307 -0.029922 0.005905 .. | |
CCV_NNC_TRANSPOSE_FORWARD [60]: [1] -> [1] (29) | |
|-> 1. 0x1439097a0 (0x285e2fa40:0) [2x133x8x40] -0.004307 -0.029922 0.005905 .. | |
|<- 1. 0x1438b9670 (0x285e2ee80:0) [2x8x133x40] -0.004307 -0.029922 0.005905 .. | |
Emit: (29, 141) | |
CCV_NNC_GEMM_FORWARD [61]: [2] -> [1] (30) | |
Wait: (30, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438cf630 (0x285d9d540:0) [320x768] 0.016708 -0.056610 -0.050446 .. | |
|<- 1. 0x1438bafd0 (0x285ef5940:0) [2x133x320] -1.026367 0.949707 -6.625000 .. | |
CCV_NNC_TRANSPOSE_FORWARD [62]: [1] -> [1] (30) | |
|-> 1. 0x14390d740 (0x285ef5940:0) [2x133x8x40] -1.026367 0.949707 -6.625000 .. | |
|<- 1. 0x1438bb040 (0x285ef41c0:0) [2x8x133x40] -1.026367 0.949707 -6.625000 .. | |
Emit: (30, 150) | |
CCV_NNC_GEMM_FORWARD [63]: [2] -> [1] (31) | |
Wait: (31, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438cf6a0 (0x285d9d580:0) [320x768] 0.001955 -0.014694 -0.003132 .. | |
|<- 1. 0x1438bb190 (0x285ed4f80:0) [2x133x320] 0.047729 0.026077 0.020203 .. | |
CCV_NNC_TRANSPOSE_FORWARD [64]: [1] -> [1] (31) | |
|-> 1. 0x14390d890 (0x285ed4f80:0) [2x133x8x40] 0.047729 0.026077 0.020203 .. | |
|<- 1. 0x1438bb200 (0x285ed54c0:0) [2x8x133x40] 0.047729 0.026077 0.020203 .. | |
Emit: (31, 151) | |
CCV_NNC_GEMM_FORWARD [65]: [2] -> [1] (32) | |
Wait: (32, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438d07b0 (0x285d9df40:0) [320x768] 0.003315 0.021103 0.009254 .. | |
|<- 1. 0x1438bcb60 (0x285f6d480:0) [2x133x320] 0.226440 -0.880859 -0.376221 .. | |
CCV_NNC_TRANSPOSE_FORWARD [66]: [1] -> [1] (32) | |
|-> 1. 0x143911830 (0x285f6d480:0) [2x133x8x40] 0.226440 -0.880859 -0.376221 .. | |
|<- 1. 0x1438bcbd0 (0x285f6d400:0) [2x8x133x40] 0.226440 -0.880859 -0.376221 .. | |
Emit: (32, 160) | |
CCV_NNC_GEMM_FORWARD [67]: [2] -> [1] (33) | |
Wait: (33, 0) | |
|-> 1. 0x1438bd490 (0x285e6c2c0:0) [2x133x768] -0.387939 0.023743 -0.054749 .. | |
|-> 2. 0x1438d0820 (0x285d9df80:0) [320x768] 0.005962 -0.006207 -0.002657 .. | |
|<- 1. 0x1438bcd20 (0x285f6d200:0) [2x133x320] -0.004234 0.009697 0.024551 .. | |
CCV_NNC_TRANSPOSE_FORWARD [68]: [1] -> [1] (33) | |
|-> 1. 0x143911980 (0x285f6d200:0) [2x133x8x40] -0.004234 0.009697 0.024551 .. | |
|<- 1. 0x1438bcd90 (0x285da6ec0:0) [2x8x133x40] -0.004234 0.009697 0.024551 .. | |
Emit: (33, 161) | |
CCV_NNC_SWISH_FORWARD [69]: [1] -> [1] (0) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.068420 -0.037476 -0.015541 .. | |
|<- 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
Emit: (0, 2) | |
CCV_NNC_GROUP_NORM_FORWARD [70]: [3] -> [3] (1) | |
|-> 1. 0x14390db70 (0x285f78ac0:0) [2x64x64x320] -0.319092 -0.406982 0.225342 .. | |
|-> 2. 0x1438bd810 (0x285d84100:0) [1x1x1x320] 0.484131 0.523926 0.366943 .. | |
|-> 3. 0x1438bd880 (0x285d84600:0) [1x1x1x320] -0.007233 -0.079224 -0.075317 .. | |
|<- 1. 0x1438a00e0 (0x285da5680:0) [2x64x64x320] -0.373535 -0.587402 0.132080 .. | |
|<- 2. 0x1438a0150 (0x285da5700:0) [2x1x1x32] -0.007511 -0.001691 0.001145 .. | |
|<- 3. 0x1438a01c0 (0x285da5740:0) [2x1x1x32] 2.427734 2.734375 3.083984 .. | |
CCV_NNC_SWISH_FORWARD [71]: [1] -> [1] (1) | |
|-> 1. 0x1438a00e0 (0x285da5680:0) [2x64x64x320] -0.373535 -0.587402 0.132080 .. | |
|<- 1. 0x1438a00e0 (0x285da5680:0) [2x64x64x320] -0.152344 -0.209839 0.070374 .. | |
CCV_NNC_CONVOLUTION_FORWARD [72]: [3] -> [1] (1) | |
|-> 1. 0x1438a00e0 (0x285da5680:0) [2x64x64x320] -0.152344 -0.209839 0.070374 .. | |
|-> 2. 0x1438bd9d0 (0x285d84500:0) [320x320x3x3] -0.018021 -0.052185 -0.052765 .. | |
|-> 3. 0x1438bda40 (0x285d84780:0) [320] 0.036621 -0.050140 0.015305 .. | |
|<- 1. 0x1438a02a0 (0x285da56c0:0) [2x64x64x320] 0.862793 0.136719 -1.131836 .. | |
Emit: (1, 1) | |
CCV_NNC_GEMM_FORWARD [73]: [3] -> [1] (0) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438bd8f0 (0x285d84400:0) [320x1280] -0.004944 -0.001311 -0.004967 .. | |
|-> 3. 0x1438bd960 (0x285d846c0:0) [320] 0.038757 -0.058807 0.015556 .. | |
|<- 1. 0x1438a0230 (0x285da5780:0) [2x320] 0.389648 0.819824 0.133667 .. | |
CCV_NNC_ADD_FORWARD [74]: [2] -> [1] (0) | |
Wait: (0, 1) | |
|-> 1. 0x1438a02a0 (0x285da56c0:0) [2x64x64x320] 0.862793 0.136719 -1.131836 .. | |
|-> 2. 0x1438d0f90 (0x285da5780:0) [2x1x1x320] 0.389648 0.819824 0.133667 .. | |
|<- 1. 0x1438a02a0 (0x285da56c0:0) [2x64x64x320] 1.251953 0.956543 -0.998047 .. | |
CCV_NNC_GROUP_NORM_FORWARD [75]: [3] -> [3] (0) | |
|-> 1. 0x1438a02a0 (0x285da56c0:0) [2x64x64x320] 1.251953 0.956543 -0.998047 .. | |
|-> 2. 0x1438bdab0 (0x285d84680:0) [1x1x1x320] 0.290283 0.676270 0.381104 .. | |
|-> 3. 0x1438bdb20 (0x285d84740:0) [1x1x1x320] -0.077087 -0.171631 -0.141968 .. | |
|<- 1. 0x1438a0310 (0x285da5680:0) [2x64x64x320] 0.135986 0.244141 -0.208862 .. | |
|<- 2. 0x1438a0380 (0x285da57c0:0) [2x1x1x32] -0.563965 -0.766113 -0.697754 .. | |
|<- 3. 0x1438a03f0 (0x285da5800:0) [2x1x1x32] 0.404297 0.273682 0.777832 .. | |
CCV_NNC_SWISH_FORWARD [76]: [1] -> [1] (0) | |
|-> 1. 0x1438a0310 (0x285da5680:0) [2x64x64x320] 0.135986 0.244141 -0.208862 .. | |
|<- 1. 0x1438a0310 (0x285da5680:0) [2x64x64x320] 0.072632 0.136841 -0.093567 .. | |
CCV_NNC_CONVOLUTION_FORWARD [77]: [3] -> [1] (0) | |
|-> 1. 0x1438a0310 (0x285da5680:0) [2x64x64x320] 0.072632 0.136841 -0.093567 .. | |
|-> 2. 0x1438bdb90 (0x285d84800:0) [320x320x3x3] 0.012184 0.018036 -0.006847 .. | |
|-> 3. 0x1438bdc00 (0x285d84700:0) [320] 0.001400 -0.109863 0.059784 .. | |
|<- 1. 0x1438a0460 (0x285da56c0:0) [2x64x64x320] 0.450928 -1.825195 0.461914 .. | |
CCV_NNC_ADD_FORWARD [78]: [2] -> [1] (0) | |
|-> 1. 0x14390db70 (0x285f78ac0:0) [2x64x64x320] -0.319092 -0.406982 0.225342 .. | |
|-> 2. 0x1438a0460 (0x285da56c0:0) [2x64x64x320] 0.450928 -1.825195 0.461914 .. | |
|<- 1. 0x1438a04d0 (0x285da5840:0) [2x64x64x320] 0.131836 -2.232422 0.687500 .. | |
CCV_NNC_GEMM_FORWARD [79]: [3] -> [1] (34) | |
Wait: (34, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438be990 (0x285d84bc0:0) [320x1280] -0.004845 -0.001458 -0.003963 .. | |
|-> 3. 0x1438bea00 (0x285d85200:0) [320] 0.004868 -0.009079 -0.058716 .. | |
|<- 1. 0x1438a1d50 (0x285da5dc0:0) [2x320] 0.114136 0.382324 -0.697754 .. | |
Emit: (34, 10) | |
CCV_NNC_GEMM_FORWARD [80]: [3] -> [1] (35) | |
Wait: (35, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438bfb10 (0x285d85c80:0) [640x1280] 0.006191 -0.002232 -0.009239 .. | |
|-> 3. 0x1438bfb80 (0x285d85cc0:0) [640] 0.027374 -0.004711 0.019440 .. | |
|<- 1. 0x1438a3870 (0x285da6180:0) [2x640] 0.351318 -0.119873 0.318848 .. | |
Emit: (35, 18) | |
CCV_NNC_GEMM_FORWARD [81]: [3] -> [1] (36) | |
Wait: (36, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438c0c90 (0x285d86680:0) [640x1280] 0.004734 -0.008568 0.008568 .. | |
|-> 3. 0x1438c0d00 (0x285d866c0:0) [640] 0.026276 0.008690 -0.049683 .. | |
|<- 1. 0x1438a5390 (0x285da6840:0) [2x640] 0.087891 -3.085938 0.536621 .. | |
Emit: (36, 28) | |
CCV_NNC_GEMM_FORWARD [82]: [3] -> [1] (37) | |
Wait: (37, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438c1e10 (0x285d87080:0) [1280x1280] -0.006657 0.006611 -0.002247 .. | |
|-> 3. 0x1438c1e80 (0x285d870c0:0) [1280] 0.013191 0.012268 0.008003 .. | |
|<- 1. 0x1438a6eb0 (0x285da6d80:0) [2x1280] 0.093994 0.277832 0.315918 .. | |
Emit: (37, 36) | |
CCV_NNC_GEMM_FORWARD [83]: [3] -> [1] (38) | |
Wait: (38, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438c2f90 (0x285d87a80:0) [1280x1280] -0.005486 -0.005077 -0.003628 .. | |
|-> 3. 0x1438c3000 (0x285d87ac0:0) [1280] 0.044830 -0.016068 0.031052 .. | |
|<- 1. 0x1438a89d0 (0x285da7440:0) [2x1280] 0.601562 -0.082703 0.705078 .. | |
Emit: (38, 46) | |
CCV_NNC_GEMM_FORWARD [84]: [3] -> [1] (39) | |
Wait: (39, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438c4110 (0x285d8a640:0) [1280x1280] -0.007282 -0.001312 0.003534 .. | |
|-> 3. 0x1438c4180 (0x285d8ac00:0) [1280] 0.077209 -0.040894 -0.032227 .. | |
|<- 1. 0x1438aa4f0 (0x285da7940:0) [2x1280] 0.770020 0.276611 0.438477 .. | |
Emit: (39, 54) | |
CCV_NNC_GEMM_FORWARD [85]: [3] -> [1] (40) | |
Wait: (40, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438c4570 (0x285df7340:0) [1280x1280] 0.002802 -0.005547 0.010971 .. | |
|-> 3. 0x1438c45e0 (0x285df7280:0) [1280] -0.076843 0.028809 0.114197 .. | |
|<- 1. 0x1438aa8e0 (0x285da7a80:0) [2x1280] -0.554199 0.637207 0.615234 .. | |
Emit: (40, 55) | |
CCV_NNC_GEMM_FORWARD [86]: [3] -> [1] (41) | |
Wait: (41, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438c49d0 (0x285dfd540:0) [1280x1280] 0.001873 -0.000576 -0.005287 .. | |
|-> 3. 0x1438c4a40 (0x285de0700:0) [1280] 0.076538 0.086609 0.002594 .. | |
|<- 1. 0x1438aacd0 (0x285da7bc0:0) [2x1280] 0.581543 1.150391 0.077393 .. | |
Emit: (41, 56) | |
CCV_NNC_GEMM_FORWARD [87]: [3] -> [1] (42) | |
Wait: (42, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438c5a70 (0x285e6a040:0) [1280x1280] -0.000326 -0.004715 -0.008072 .. | |
|-> 3. 0x1438c5ae0 (0x285e69c00:0) [1280] 0.128540 -0.076782 0.120300 .. | |
|<- 1. 0x1438ac7f0 (0x285d84340:0) [2x1280] 0.444092 0.104248 0.304443 .. | |
Emit: (42, 64) | |
CCV_NNC_GEMM_FORWARD [88]: [3] -> [1] (43) | |
Wait: (43, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438c5ed0 (0x285e69540:0) [1280x1280] -0.006855 -0.009766 -0.000924 .. | |
|-> 3. 0x1438c5f40 (0x285e69c80:0) [1280] 0.033813 0.077148 0.046234 .. | |
|<- 1. 0x1438acc50 (0x285d82bc0:0) [2x1280] 0.063354 0.040497 0.044067 .. | |
Emit: (43, 65) | |
CCV_NNC_GEMM_FORWARD [89]: [3] -> [1] (44) | |
Wait: (44, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438c6410 (0x285d981c0:0) [1280x1280] 0.011826 -0.011513 -0.001285 .. | |
|-> 3. 0x1438c6480 (0x285d98200:0) [1280] 0.017502 -0.009285 -0.049225 .. | |
|<- 1. 0x1438ad120 (0x285d837c0:0) [2x1280] 0.086243 1.029297 0.114319 .. | |
Emit: (44, 68) | |
CCV_NNC_GEMM_FORWARD [90]: [3] -> [1] (45) | |
Wait: (45, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438c6950 (0x285d984c0:0) [1280x1280] 0.004402 -0.006351 0.008255 .. | |
|-> 3. 0x1438c69c0 (0x285d98500:0) [1280] 0.031647 -0.037048 0.060364 .. | |
|<- 1. 0x1438ad5f0 (0x285d800c0:0) [2x1280] 0.105347 -0.784180 0.284912 .. | |
Emit: (45, 71) | |
CCV_NNC_GEMM_FORWARD [91]: [3] -> [1] (46) | |
Wait: (46, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438c6f70 (0x285d98840:0) [1280x1280] -0.003630 0.008698 0.005058 .. | |
|-> 3. 0x1438c6fe0 (0x285d98880:0) [1280] 0.100220 0.082825 0.077271 .. | |
|<- 1. 0x1438adb30 (0x285d83980:0) [2x1280] -0.228027 0.609375 0.654297 .. | |
Emit: (46, 74) | |
CCV_NNC_GEMM_FORWARD [92]: [3] -> [1] (47) | |
Wait: (47, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438c80f0 (0x285d99240:0) [1280x1280] 0.007771 -0.006096 0.009300 .. | |
|-> 3. 0x1438c8160 (0x285d99280:0) [1280] 0.065491 0.066833 -0.015106 .. | |
|<- 1. 0x1438af6c0 (0x285d83f40:0) [2x1280] -0.230713 0.213135 -0.136353 .. | |
Emit: (47, 84) | |
CCV_NNC_GEMM_FORWARD [93]: [3] -> [1] (48) | |
Wait: (48, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438c9270 (0x285d99c40:0) [1280x1280] -0.000185 -0.003536 0.004467 .. | |
|-> 3. 0x1438c92e0 (0x285d99c80:0) [1280] 0.041534 0.008492 0.046967 .. | |
|<- 1. 0x1438b1250 (0x285d8c440:0) [2x1280] 1.041992 0.774902 1.260742 .. | |
Emit: (48, 94) | |
CCV_NNC_GEMM_FORWARD [94]: [3] -> [1] (49) | |
Wait: (49, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438ca4d0 (0x285d9a6c0:0) [640x1280] -0.012924 -0.011131 0.001637 .. | |
|-> 3. 0x1438ca540 (0x285d9a700:0) [640] 0.100769 0.093994 0.061066 .. | |
|<- 1. 0x1438b2e50 (0x285df5b80:0) [2x640] 0.082214 1.164062 0.841797 .. | |
Emit: (49, 104) | |
CCV_NNC_GEMM_FORWARD [95]: [3] -> [1] (50) | |
Wait: (50, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438cb650 (0x285d9b0c0:0) [640x1280] -0.000035 -0.001340 -0.006222 .. | |
|-> 3. 0x1438cb6c0 (0x285d9b100:0) [640] 0.053101 -0.055695 -0.059418 .. | |
|<- 1. 0x1438b49e0 (0x285df3880:0) [2x640] 0.327637 -0.112061 0.204590 .. | |
Emit: (50, 114) | |
CCV_NNC_GEMM_FORWARD [96]: [3] -> [1] (51) | |
Wait: (51, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438cc7d0 (0x285d9bac0:0) [640x1280] 0.007111 -0.001447 0.010307 .. | |
|-> 3. 0x1438cc840 (0x285d9bb00:0) [640] 0.019012 0.010918 0.034790 .. | |
|<- 1. 0x1438b6570 (0x285dffc00:0) [2x640] -0.846680 0.141968 0.290283 .. | |
Emit: (51, 124) | |
CCV_NNC_GEMM_FORWARD [97]: [3] -> [1] (52) | |
Wait: (52, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438cda30 (0x285d9c540:0) [320x1280] 0.001700 -0.003801 -0.004478 .. | |
|-> 3. 0x1438cdaa0 (0x285d9c580:0) [320] -0.004143 0.078064 0.069885 .. | |
|<- 1. 0x1438b8170 (0x285def880:0) [2x320] 0.466797 0.149780 1.849609 .. | |
Emit: (52, 134) | |
CCV_NNC_GEMM_FORWARD [98]: [3] -> [1] (53) | |
Wait: (53, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438cebb0 (0x285d9cf40:0) [320x1280] 0.005024 -0.000107 0.000202 .. | |
|-> 3. 0x1438cec20 (0x285d9cf80:0) [320] 0.031738 -0.058533 0.119751 .. | |
|<- 1. 0x1438b9d00 (0x285e6b440:0) [2x320] 0.176636 -1.454102 0.976562 .. | |
Emit: (53, 144) | |
CCV_NNC_GEMM_FORWARD [99]: [3] -> [1] (54) | |
Wait: (54, 2) | |
|-> 1. 0x1438a0070 (0x285da5640:0) [2x1280] -0.033051 -0.018387 -0.007710 .. | |
|-> 2. 0x1438cfd30 (0x285d9d940:0) [320x1280] -0.006310 0.003212 0.005932 .. | |
|-> 3. 0x1438cfda0 (0x285d9d980:0) [320] -0.016846 -0.054718 0.046021 .. | |
|<- 1. 0x1438bb890 (0x285f65e80:0) [2x320] -0.972656 0.468994 0.141357 .. | |
Emit: (54, 154) | |
CCV_NNC_GROUP_NORM_FORWARD [100]: [3] -> [3] (0) | |
|-> 1. 0x1438a04d0 (0x285da5840:0) [2x64x64x320] 0.131836 -2.232422 0.687500 .. | |
|-> 2. 0x1438bdc70 (0x285d847c0:0) [1x1x1x320] 0.349365 0.203857 0.279053 .. | |
|-> 3. 0x1438bdce0 (0x285d84880:0) [1x1x1x320] -0.073303 0.182617 -0.251465 .. | |
|<- 1. 0x1438a0540 (0x285da5680:0) [2x64x64x320] -0.015656 -0.225952 -0.063171 .. | |
|<- 2. 0x1438a05b0 (0x285da5740:0) [2x1x1x32] -0.048035 -0.275879 0.005417 .. | |
|<- 3. 0x1438a0620 (0x285da5700:0) [2x1x1x32] 0.917480 1.359375 4.316406 .. | |
CCV_NNC_CONVOLUTION_FORWARD [101]: [3] -> [1] (0) | |
|-> 1. 0x1438a0540 (0x285da5680:0) [2x64x64x320] -0.015656 -0.225952 -0.063171 .. | |
|-> 2. 0x1438bdd50 (0x285d84840:0) [320x320x1x1] 0.018326 .. | |
|-> 3. 0x1438bddc0 (0x285d84c40:0) [320] 0.057037 0.063049 -0.028610 .. | |
|<- 1. 0x1438a0690 (0x285da56c0:0) [2x64x64x320] 0.347656 0.462646 -0.141479 .. | |
CCV_NNC_LAYER_NORM_FORWARD [102]: [3] -> [3] (0) | |
|-> 1. 0x1438d1000 (0x285da56c0:0) [2x4096x320] 0.347656 0.462646 -0.141479 .. | |
|-> 2. 0x1438bde30 (0x285d84d00:0) [1x1x320] 0.759766 0.622559 0.730469 .. | |
|-> 3. 0x1438bdea0 (0x285d84c80:0) [1x1x320] 0.039795 -0.103760 -0.001315 .. | |
|<- 1. 0x1438a0700 (0x285da5680:0) [2x4096x320] 1.031250 1.008789 -0.544434 .. | |
|<- 2. 0x1438a0770 (0x285da5880:0) [2x4096x1] 0.036041 .. | |
|<- 3. 0x1438a07e0 (0x285da58c0:0) [2x4096x1] 4.187500 .. | |
Emit: (0, 3) | |
CCV_NNC_GEMM_FORWARD [103]: [2] -> [1] (0) | |
|-> 1. 0x1438a0700 (0x285da5680:0) [2x4096x320] 1.031250 1.008789 -0.544434 .. | |
|-> 2. 0x1438bdf10 (0x285d84c00:0) [320x320] 0.071777 -0.076782 0.022446 .. | |
|<- 1. 0x1438a0850 (0x285da5900:0) [2x4096x320] 1.149414 -1.515625 -0.993164 .. | |
CCV_NNC_SCALAR_MUL_FORWARD [104]: [1] -> [1] (0) | |
|-> 1. 0x1438a0850 (0x285da5900:0) [2x4096x320] 1.149414 -1.515625 -0.993164 .. | |
|<- 1. 0x1438a0850 (0x285da5900:0) [2x4096x320] 0.181641 -0.239624 -0.156982 .. | |
CCV_NNC_TRANSPOSE_FORWARD [105]: [1] -> [1] (0) | |
|-> 1. 0x1438d10e0 (0x285da5900:0) [2x4096x8x40] 0.181641 -0.239624 -0.156982 .. | |
|<- 1. 0x1438a09a0 (0x285da59c0:0) [2x8x4096x40] 0.181641 -0.239624 -0.156982 .. | |
CCV_NNC_GEMM_FORWARD [106]: [2] -> [1] (1) | |
Wait: (1, 3) | |
|-> 1. 0x1438a0700 (0x285da5680:0) [2x4096x320] 1.031250 1.008789 -0.544434 .. | |
|-> 2. 0x1438bdf80 (0x285d84cc0:0) [320x320] -0.111938 -0.047272 -0.020325 .. | |
|<- 1. 0x1438a08c0 (0x285da5940:0) [2x4096x320] 0.471924 -0.942871 0.792969 .. | |
CCV_NNC_TRANSPOSE_FORWARD [107]: [1] -> [1] (1) | |
|-> 1. 0x1438d1070 (0x285da5940:0) [2x4096x8x40] 0.471924 -0.942871 0.792969 .. | |
|<- 1. 0x1438a0930 (0x285da5980:0) [2x8x4096x40] 0.471924 -0.942871 0.792969 .. | |
Emit: (1, 4) | |
CCV_NNC_GEMM_FORWARD [108]: [2] -> [1] (55) | |
Wait: (55, 3) | |
|-> 1. 0x1438a0700 (0x285da5680:0) [2x4096x320] 1.031250 1.008789 -0.544434 .. | |
|-> 2. 0x1438bdff0 (0x285d84d40:0) [320x320] -0.024887 0.011726 -0.073364 .. | |
|<- 1. 0x1438a0a10 (0x285da5a00:0) [2x4096x320] 0.333496 0.162231 0.011147 .. | |
CCV_NNC_TRANSPOSE_FORWARD [109]: [1] -> [1] (55) | |
|-> 1. 0x1438d1230 (0x285da5a00:0) [2x4096x8x40] 0.333496 0.162231 0.011147 .. | |
|<- 1. 0x1438a0af0 (0x285da5a80:0) [2x8x4096x40] 0.333496 0.162231 0.011147 .. | |
Emit: (55, 5) | |
CCV_NNC_GEMM_FORWARD [110]: [2] -> [1] (0) | |
Wait: (0, 4) | |
|-> 1. 0x1438d11c0 (0x285da59c0:0) [1x4096x40] 0.181641 -0.239624 -0.156982 .. | |
|-> 2. 0x1438d1150 (0x285da5980:0) [1x4096x40] 0.471924 -0.942871 0.792969 .. | |
|<- 1. 0x1438a0a80 (0x285da5a40:0) [1x4096x4096] 1.342773 1.739258 0.361328 .. | |
CCV_NNC_SOFTMAX_FORWARD [111]: [1] -> [1] (0) | |
|-> 1. 0x1438d12a0 (0x285da5a40:0) [4096x4096] 1.342773 1.739258 0.361328 .. | |
|<- 1. 0x1438d12a0 (0x285da5a40:0) [4096x4096] 0.000418 0.000622 0.000157 .. | |
CCV_NNC_GEMM_FORWARD [112]: [2] -> [1] (0) | |
Wait: (0, 5) | |
|-> 1. 0x1438d1380 (0x285da5a40:0) [1x4096x4096] 0.000418 0.000622 0.000157 .. | |
|-> 2. 0x1438d1310 (0x285da5a80:0) [1x4096x40] 0.333496 0.162231 0.011147 .. | |
|<- 1. 0x1438d4000 (0x285da5680:0) [1x4096x40] -0.164062 -0.099121 0.168091 .. | |
CCV_NNC_GEMM_FORWARD [113]: [2] -> [1] (0) | |
|-> 1. 0x1438d14a0 (0x285da59c0:0) [1x4096x40] 0.315186 0.172241 -0.090027 .. | |
|-> 2. 0x1438d13f0 (0x285da5980:0) [1x4096x40] 1.596680 -0.960449 0.928711 .. | |
|<- 1. 0x1438a0b60 (0x285da5a40:0) [1x4096x4096] 7.625000 3.019531 3.916016 .. | |
CCV_NNC_SOFTMAX_FORWARD [114]: [1] -> [1] (0) | |
|-> 1. 0x1438d1550 (0x285da5a40:0) [4096x4096] 7.625000 3.019531 3.916016 .. | |
|<- 1. 0x1438d1550 (0x285da5a40:0) [4096x4096] 0.034180 0.000342 0.000838 .. | |
CCV_NNC_GEMM_FORWARD [115]: [2] -> [1] (0) | |
|-> 1. 0x1438d1670 (0x285da5a40:0) [1x4096x4096] 0.034180 0.000342 0.000838 .. | |
|-> 2. 0x1438d15c0 (0x285da5a80:0) [1x4096x40] 0.084656 0.138184 0.002228 .. | |
|<- 1. 0x1438d4070 (0x285da5680:0) [1x4096x40] -0.028610 0.000618 0.013924 .. | |
CCV_NNC_GEMM_FORWARD [116]: [2] -> [1] (0) | |
|-> 1. 0x1438d1790 (0x285da59c0:0) [1x4096x40] -0.071655 -0.121826 -0.061707 .. | |
|-> 2. 0x1438d16e0 (0x285da5980:0) [1x4096x40] -0.478516 -1.603516 -0.821289 .. | |
|<- 1. 0x1438a0bd0 (0x285da5a40:0) [1x4096x4096] 4.460938 2.183594 2.863281 .. | |
CCV_NNC_SOFTMAX_FORWARD [117]: [1] -> [1] (0) | |
|-> 1. 0x1438d1840 (0x285da5a40:0) [4096x4096] 4.460938 2.183594 2.863281 .. | |
|<- 1. 0x1438d1840 (0x285da5a40:0) [4096x4096] 0.017975 0.001843 0.003637 .. | |
CCV_NNC_GEMM_FORWARD [118]: [2] -> [1] (0) | |
|-> 1. 0x1438d1960 (0x285da5a40:0) [1x4096x4096] 0.017975 0.001843 0.003637 .. | |
|-> 2. 0x1438d18b0 (0x285da5a80:0) [1x4096x40] 0.279053 -0.195801 0.358887 .. | |
|<- 1. 0x1438d4120 (0x285da5680:0) [1x4096x40] 0.075317 -0.022110 0.061371 .. | |
CCV_NNC_GEMM_FORWARD [119]: [2] -> [1] (0) | |
|-> 1. 0x1438d1a80 (0x285da59c0:0) [1x4096x40] -0.276611 -0.201660 -0.025070 .. | |
|-> 2. 0x1438d19d0 (0x285da5980:0) [1x4096x40] -0.522949 -0.113892 1.308594 .. | |
|<- 1. 0x1438a0c40 (0x285da5a40:0) [1x4096x4096] 0.968262 1.105469 0.160156 .. | |
CCV_NNC_SOFTMAX_FORWARD [120]: [1] -> [1] (0) | |
|-> 1. 0x1438d1b30 (0x285da5a40:0) [4096x4096] 0.968262 1.105469 0.160156 .. | |
|<- 1. 0x1438d1b30 (0x285da5a40:0) [4096x4096] 0.000864 0.000990 0.000385 .. | |
CCV_NNC_GEMM_FORWARD [121]: [2] -> [1] (0) | |
|-> 1. 0x1438d1c50 (0x285da5a40:0) [1x4096x4096] 0.000864 0.000990 0.000385 .. | |
|-> 2. 0x1438d1ba0 (0x285da5a80:0) [1x4096x40] 0.065002 -0.490479 -0.035065 .. | |
|<- 1. 0x1438d41d0 (0x285da5680:0) [1x4096x40] 0.084290 -0.009338 0.205078 .. | |
CCV_NNC_GEMM_FORWARD [122]: [2] -> [1] (0) | |
|-> 1. 0x1438d1d70 (0x285da59c0:0) [1x4096x40] 0.087524 -0.084839 0.022324 .. | |
|-> 2. 0x1438d1cc0 (0x285da5980:0) [1x4096x40] 1.386719 -0.196899 -1.851562 .. | |
|<- 1. 0x1438a0cb0 (0x285da5a40:0) [1x4096x4096] 4.031250 2.867188 2.191406 .. | |
CCV_NNC_SOFTMAX_FORWARD [123]: [1] -> [1] (0) | |
|-> 1. 0x1438d1e20 (0x285da5a40:0) [4096x4096] 4.031250 2.867188 2.191406 .. | |
|<- 1. 0x1438d1e20 (0x285da5a40:0) [4096x4096] 0.009003 0.002810 0.001430 .. | |
CCV_NNC_GEMM_FORWARD [124]: [2] -> [1] (0) | |
|-> 1. 0x1438d1f40 (0x285da5a40:0) [1x4096x4096] 0.009003 0.002810 0.001430 .. | |
|-> 2. 0x1438d1e90 (0x285da5a80:0) [1x4096x40] -0.168457 0.082825 -0.655273 .. | |
|<- 1. 0x1438d4280 (0x285da5680:0) [1x4096x40] 0.018707 -0.049713 -0.241455 .. | |
CCV_NNC_GEMM_FORWARD [125]: [2] -> [1] (0) | |
|-> 1. 0x1438d2060 (0x285da59c0:0) [1x4096x40] 0.116150 0.235718 0.070007 .. | |
|-> 2. 0x1438d1fb0 (0x285da5980:0) [1x4096x40] -0.277832 -1.186523 0.947266 .. | |
|<- 1. 0x1438a0d20 (0x285da5a40:0) [1x4096x4096] 1.523438 1.729492 1.864258 .. | |
CCV_NNC_SOFTMAX_FORWARD [126]: [1] -> [1] (0) | |
|-> 1. 0x1438d2110 (0x285da5a40:0) [4096x4096] 1.523438 1.729492 1.864258 .. | |
|<- 1. 0x1438d2110 (0x285da5a40:0) [4096x4096] 0.000710 0.000873 0.000998 .. | |
CCV_NNC_GEMM_FORWARD [127]: [2] -> [1] (0) | |
|-> 1. 0x1438d2230 (0x285da5a40:0) [1x4096x4096] 0.000710 0.000873 0.000998 .. | |
|-> 2. 0x1438d2180 (0x285da5a80:0) [1x4096x40] -0.005127 0.099792 0.155029 .. | |
|<- 1. 0x1438d4330 (0x285da5680:0) [1x4096x40] 0.072449 -0.060333 -0.011993 .. | |
CCV_NNC_GEMM_FORWARD [128]: [2] -> [1] (0) | |
|-> 1. 0x1438d2350 (0x285da59c0:0) [1x4096x40] 0.019272 -0.055237 -0.130005 .. | |
|-> 2. 0x1438d22a0 (0x285da5980:0) [1x4096x40] 0.814453 -0.346191 1.026367 .. | |
|<- 1. 0x1438a0d90 (0x285da5a40:0) [1x4096x4096] 8.171875 4.007812 5.050781 .. | |
CCV_NNC_SOFTMAX_FORWARD [129]: [1] -> [1] (0) | |
|-> 1. 0x1438d2400 (0x285da5a40:0) [4096x4096] 8.171875 4.007812 5.050781 .. | |
|<- 1. 0x1438d2400 (0x285da5a40:0) [4096x4096] 0.051697 0.000803 0.002281 .. | |
CCV_NNC_GEMM_FORWARD [130]: [2] -> [1] (0) | |
|-> 1. 0x1438d2520 (0x285da5a40:0) [1x4096x4096] 0.051697 0.000803 0.002281 .. | |
|-> 2. 0x1438d2470 (0x285da5a80:0) [1x4096x40] 0.229004 -0.007763 0.674316 .. | |
|<- 1. 0x1438d43e0 (0x285da5680:0) [1x4096x40] 0.202148 0.293457 0.154907 .. | |
CCV_NNC_GEMM_FORWARD [131]: [2] -> [1] (0) | |
|-> 1. 0x1438d2640 (0x285da59c0:0) [1x4096x40] -0.156494 -0.095947 0.025284 .. | |
|-> 2. 0x1438d2590 (0x285da5980:0) [1x4096x40] -0.095276 0.494385 0.494873 .. | |
|<- 1. 0x1438a0e00 (0x285da5a40:0) [1x4096x4096] -0.452148 -1.506836 -1.910156 .. | |
CCV_NNC_SOFTMAX_FORWARD [132]: [1] -> [1] (0) | |
|-> 1. 0x1438d26f0 (0x285da5a40:0) [4096x4096] -0.452148 -1.506836 -1.910156 .. | |
|<- 1. 0x1438d26f0 (0x285da5a40:0) [4096x4096] 0.000643 0.000224 0.000150 .. | |
CCV_NNC_GEMM_FORWARD [133]: [2] -> [1] (0) | |
|-> 1. 0x1438d2810 (0x285da5a40:0) [1x4096x4096] 0.000643 0.000224 0.000150 .. | |
|-> 2. 0x1438d2760 (0x285da5a80:0) [1x4096x40] 1.302734 -0.050659 -0.475342 .. | |
|<- 1. 0x1438d4490 (0x285da5680:0) [1x4096x40] -0.125122 0.123169 -0.030411 .. | |
CCV_NNC_GEMM_FORWARD [134]: [2] -> [1] (0) | |
|-> 1. 0x1438d2930 (0x285da59c0:0) [1x4096x40] 0.181641 -0.239624 -0.156982 .. | |
|-> 2. 0x1438d2880 (0x285da5980:0) [1x4096x40] 0.471924 -0.942871 0.792969 .. | |
|<- 1. 0x1438a0e70 (0x285da5a40:0) [1x4096x4096] 1.342773 1.739258 0.361328 .. | |
CCV_NNC_SOFTMAX_FORWARD [135]: [1] -> [1] (0) | |
|-> 1. 0x1438d29e0 (0x285da5a40:0) [4096x4096] 1.342773 1.739258 0.361328 .. | |
|<- 1. 0x1438d29e0 (0x285da5a40:0) [4096x4096] 0.000418 0.000622 0.000157 .. | |
CCV_NNC_GEMM_FORWARD [136]: [2] -> [1] (0) | |
|-> 1. 0x1438d2b00 (0x285da5a40:0) [1x4096x4096] 0.000418 0.000622 0.000157 .. | |
|-> 2. 0x1438d2a50 (0x285da5a80:0) [1x4096x40] 0.333496 0.162231 0.011147 .. | |
|<- 1. 0x1438d4540 (0x285da5680:0) [1x4096x40] -0.164062 -0.099121 0.168091 .. | |
CCV_NNC_GEMM_FORWARD [137]: [2] -> [1] (0) | |
|-> 1. 0x1438d2c20 (0x285da59c0:0) [1x4096x40] 0.315186 0.172241 -0.090027 .. | |
|-> 2. 0x1438d2b70 (0x285da5980:0) [1x4096x40] 1.596680 -0.960449 0.928711 .. | |
|<- 1. 0x1438a0ee0 (0x285da5a40:0) [1x4096x4096] 7.625000 3.019531 3.916016 .. | |
CCV_NNC_SOFTMAX_FORWARD [138]: [1] -> [1] (0) | |
|-> 1. 0x1438d2cd0 (0x285da5a40:0) [4096x4096] 7.625000 3.019531 3.916016 .. | |
|<- 1. 0x1438d2cd0 (0x285da5a40:0) [4096x4096] 0.034180 0.000342 0.000838 .. | |
CCV_NNC_GEMM_FORWARD [139]: [2] -> [1] (0) | |
|-> 1. 0x1438d2df0 (0x285da5a40:0) [1x4096x4096] 0.034180 0.000342 0.000838 .. | |
|-> 2. 0x1438d2d40 (0x285da5a80:0) [1x4096x40] 0.084656 0.138184 0.002228 .. | |
|<- 1. 0x1438d45f0 (0x285da5680:0) [1x4096x40] -0.028610 0.000618 0.013924 .. | |
CCV_NNC_GEMM_FORWARD [140]: [2] -> [1] (0) | |
|-> 1. 0x1438d2f10 (0x285da59c0:0) [1x4096x40] -0.071655 -0.121826 -0.061707 .. | |
|-> 2. 0x1438d2e60 (0x285da5980:0) [1x4096x40] -0.478516 -1.603516 -0.821289 .. | |
|<- 1. 0x1438a0f50 (0x285da5a40:0) [1x4096x4096] 4.460938 2.183594 2.863281 .. | |
CCV_NNC_SOFTMAX_FORWARD [141]: [1] -> [1] (0) | |
|-> 1. 0x1438d2fc0 (0x285da5a40:0) [4096x4096] 4.460938 2.183594 2.863281 .. | |
|<- 1. 0x1438d2fc0 (0x285da5a40:0) [4096x4096] 0.017975 0.001843 0.003637 .. | |
CCV_NNC_GEMM_FORWARD [142]: [2] -> [1] (0) | |
|-> 1. 0x1438d30e0 (0x285da5a40:0) [1x4096x4096] 0.017975 0.001843 0.003637 .. | |
|-> 2. 0x1438d3030 (0x285da5a80:0) [1x4096x40] 0.279053 -0.195801 0.358887 .. | |
|<- 1. 0x1438d46a0 (0x285da5680:0) [1x4096x40] 0.075317 -0.022110 0.061371 .. | |
CCV_NNC_GEMM_FORWARD [143]: [2] -> [1] (0) | |
|-> 1. 0x1438d3200 (0x285da59c0:0) [1x4096x40] -0.276611 -0.201660 -0.025070 .. | |
|-> 2. 0x1438d3150 (0x285da5980:0) [1x4096x40] -0.522949 -0.113892 1.308594 .. | |
|<- 1. 0x1438a0fc0 (0x285da5a40:0) [1x4096x4096] 0.968262 1.105469 0.160156 .. | |
CCV_NNC_SOFTMAX_FORWARD [144]: [1] -> [1] (0) | |
|-> 1. 0x1438d32b0 (0x285da5a40:0) [4096x4096] 0.968262 1.105469 0.160156 .. | |
|<- 1. 0x1438d32b0 (0x285da5a40:0) [4096x4096] 0.000864 0.000990 0.000385 .. | |
CCV_NNC_GEMM_FORWARD [145]: [2] -> [1] (0) | |
|-> 1. 0x1438d33d0 (0x285da5a40:0) [1x4096x4096] 0.000864 0.000990 0.000385 .. | |
|-> 2. 0x1438d3320 (0x285da5a80:0) [1x4096x40] 0.065002 -0.490479 -0.035065 .. | |
|<- 1. 0x1438d4750 (0x285da5680:0) [1x4096x40] 0.084290 -0.009338 0.205078 .. | |
CCV_NNC_GEMM_FORWARD [146]: [2] -> [1] (0) | |
|-> 1. 0x1438d34f0 (0x285da59c0:0) [1x4096x40] 0.087524 -0.084839 0.022324 .. | |
|-> 2. 0x1438d3440 (0x285da5980:0) [1x4096x40] 1.386719 -0.196899 -1.851562 .. | |
|<- 1. 0x1438a1030 (0x285da5a40:0) [1x4096x4096] 4.031250 2.867188 2.191406 .. | |
CCV_NNC_SOFTMAX_FORWARD [147]: [1] -> [1] (0) | |
|-> 1. 0x1438d35a0 (0x285da5a40:0) [4096x4096] 4.031250 2.867188 2.191406 .. | |
|<- 1. 0x1438d35a0 (0x285da5a40:0) [4096x4096] 0.009003 0.002810 0.001430 .. | |
CCV_NNC_GEMM_FORWARD [148]: [2] -> [1] (0) | |
|-> 1. 0x1438d36c0 (0x285da5a40:0) [1x4096x4096] 0.009003 0.002810 0.001430 .. | |
|-> 2. 0x1438d3610 (0x285da5a80:0) [1x4096x40] -0.168457 0.082825 -0.655273 .. | |
|<- 1. 0x1438d4800 (0x285da5680:0) [1x4096x40] 0.018707 -0.049713 -0.241455 .. | |
CCV_NNC_GEMM_FORWARD [149]: [2] -> [1] (0) | |
|-> 1. 0x1438d37e0 (0x285da59c0:0) [1x4096x40] 0.116150 0.235718 0.070007 .. | |
|-> 2. 0x1438d3730 (0x285da5980:0) [1x4096x40] -0.277832 -1.186523 0.947266 .. | |
|<- 1. 0x1438a10a0 (0x285da5a40:0) [1x4096x4096] 1.523438 1.729492 1.864258 .. | |
CCV_NNC_SOFTMAX_FORWARD [150]: [1] -> [1] (0) | |
|-> 1. 0x1438d3890 (0x285da5a40:0) [4096x4096] 1.523438 1.729492 1.864258 .. | |
|<- 1. 0x1438d3890 (0x285da5a40:0) [4096x4096] 0.000710 0.000873 0.000998 .. | |
CCV_NNC_GEMM_FORWARD [151]: [2] -> [1] (0) | |
|-> 1. 0x1438d39b0 (0x285da5a40:0) [1x4096x4096] 0.000710 0.000873 0.000998 .. | |
|-> 2. 0x1438d3900 (0x285da5a80:0) [1x4096x40] -0.005127 0.099792 0.155029 .. | |
|<- 1. 0x1438d48b0 (0x285da5680:0) [1x4096x40] 0.072449 -0.060333 -0.011993 .. | |
CCV_NNC_GEMM_FORWARD [152]: [2] -> [1] (0) | |
|-> 1. 0x1438d3ad0 (0x285da59c0:0) [1x4096x40] 0.019272 -0.055237 -0.130005 .. | |
|-> 2. 0x1438d3a20 (0x285da5980:0) [1x4096x40] 0.814453 -0.346191 1.026367 .. | |
|<- 1. 0x1438a1110 (0x285da5a40:0) [1x4096x4096] 8.171875 4.007812 5.050781 .. | |
CCV_NNC_SOFTMAX_FORWARD [153]: [1] -> [1] (0) | |
|-> 1. 0x1438d3b80 (0x285da5a40:0) [4096x4096] 8.171875 4.007812 5.050781 .. | |
|<- 1. 0x1438d3b80 (0x285da5a40:0) [4096x4096] 0.051697 0.000803 0.002281 .. | |
CCV_NNC_GEMM_FORWARD [154]: [2] -> [1] (0) | |
|-> 1. 0x1438d3ca0 (0x285da5a40:0) [1x4096x4096] 0.051697 0.000803 0.002281 .. | |
|-> 2. 0x1438d3bf0 (0x285da5a80:0) [1x4096x40] 0.229004 -0.007763 0.674316 .. | |
|<- 1. 0x1438d4960 (0x285da5680:0) [1x4096x40] 0.202148 0.293457 0.154907 .. | |
CCV_NNC_GEMM_FORWARD [155]: [2] -> [1] (0) | |
|-> 1. 0x1438d3dc0 (0x285da59c0:0) [1x4096x40] -0.156494 -0.095947 0.025284 .. | |
|-> 2. 0x1438d3d10 (0x285da5980:0) [1x4096x40] -0.095276 0.494385 0.494873 .. | |
|<- 1. 0x1438a1180 (0x285da5a40:0) [1x4096x4096] -0.452148 -1.506836 -1.910156 .. | |
CCV_NNC_SOFTMAX_FORWARD [156]: [1] -> [1] (0) | |
|-> 1. 0x1438d3e70 (0x285da5a40:0) [4096x4096] -0.452148 -1.506836 -1.910156 .. | |
|<- 1. 0x1438d3e70 (0x285da5a40:0) [4096x4096] 0.000643 0.000224 0.000150 .. | |
CCV_NNC_GEMM_FORWARD [157]: [2] -> [1] (0) | |
|-> 1. 0x1438d3f90 (0x285da5a40:0) [1x4096x4096] 0.000643 0.000224 0.000150 .. | |
|-> 2. 0x1438d3ee0 (0x285da5a80:0) [1x4096x40] 1.302734 -0.050659 -0.475342 .. | |
|<- 1. 0x1438d4a10 (0x285da5680:0) [1x4096x40] -0.125122 0.123169 -0.030411 .. | |
CCV_NNC_TRANSPOSE_FORWARD [158]: [1] -> [1] (0) | |
|-> 1. 0x1438d4ac0 (0x285da5680:0) [2x8x4096x40] -0.164062 -0.099121 0.168091 .. | |
|<- 1. 0x1438a1260 (0x285da5940:0) [2x4096x8x40] -0.164062 -0.099121 0.168091 .. | |
CCV_NNC_GEMM_FORWARD [159]: [3] -> [1] (0) | |
|-> 1. 0x1438d4b30 (0x285da5940:0) [2x4096x320] -0.164062 -0.099121 0.168091 .. | |
|-> 2. 0x1438be060 (0x285d84e40:0) [320x320] 0.020599 0.010056 -0.034363 .. | |
|-> 3. 0x1438be0d0 (0x285d84e00:0) [320] 0.058563 0.010330 0.046692 .. | |
|<- 1. 0x1438a12d0 (0x285da5ac0:0) [2x4096x320] 0.045868 -0.097534 0.009132 .. | |
CCV_NNC_ADD_FORWARD [160]: [2] -> [1] (0) | |
|-> 1. 0x1438a12d0 (0x285da5ac0:0) [2x4096x320] 0.045868 -0.097534 0.009132 .. | |
|-> 2. 0x1438d1000 (0x285da56c0:0) [2x4096x320] 0.347656 0.462646 -0.141479 .. | |
|<- 1. 0x1438a12d0 (0x285da5ac0:0) [2x4096x320] 0.393555 0.365234 -0.132324 .. | |
CCV_NNC_LAYER_NORM_FORWARD [161]: [3] -> [3] (0) | |
|-> 1. 0x1438a12d0 (0x285da5ac0:0) [2x4096x320] 0.393555 0.365234 -0.132324 .. | |
|-> 2. 0x1438be140 (0x285d84d80:0) [1x1x320] 0.379883 0.422607 0.413086 .. | |
|-> 3. 0x1438be1b0 (0x285d84dc0:0) [1x1x320] -0.121826 -0.066040 -0.111389 .. | |
|<- 1. 0x1438a1340 (0x285da5940:0) [2x4096x320] 0.410400 0.477295 -0.416016 .. | |
|<- 2. 0x1438a13b0 (0x285da5b00:0) [2x4096x1] 0.049011 .. | |
|<- 3. 0x1438a1420 (0x285da5b40:0) [2x4096x1] 4.066406 .. | |
CCV_NNC_GEMM_FORWARD [162]: [2] -> [1] (0) | |
|-> 1. 0x1438a1340 (0x285da5940:0) [2x4096x320] 0.410400 0.477295 -0.416016 .. | |
|-> 2. 0x1438be220 (0x285d84180:0) [320x320] -0.023132 -0.141235 -0.164551 .. | |
|<- 1. 0x1438a1490 (0x285da5900:0) [2x4096x320] -0.523926 -0.234985 1.871094 .. | |
CCV_NNC_SCALAR_MUL_FORWARD [163]: [1] -> [1] (0) | |
|-> 1. 0x1438a1490 (0x285da5900:0) [2x4096x320] -0.523926 -0.234985 1.871094 .. | |
|<- 1. 0x1438a1490 (0x285da5900:0) [2x4096x320] -0.082825 -0.037140 0.295898 .. | |
CCV_NNC_TRANSPOSE_FORWARD [164]: [1] -> [1] (0) | |
|-> 1. 0x1438d4c10 (0x285da5900:0) [2x4096x8x40] -0.082825 -0.037140 0.295898 .. | |
|<- 1. 0x1438a15e0 (0x285da56c0:0) [2x8x4096x40] -0.082825 -0.037140 0.295898 .. | |
CCV_NNC_GEMM_FORWARD [165]: [2] -> [1] (0) | |
Wait: (0, 6) | |
|-> 1. 0x1438a15e0 (0x285da56c0:0) [2x8x4096x40] -0.082825 -0.037140 0.295898 .. | |
|-> 2. 0x1438a1570 (0x285da5bc0:0) [2x8x133x40] -0.231689 -0.019897 8.742188 .. | |
|<- 1. 0x1438a1650 (0x285da5c00:0) [2x8x4096x133] 7.828125 1.667969 -1.150391 .. | |
CCV_NNC_SOFTMAX_FORWARD [166]: [1] -> [1] (0) | |
|-> 1. 0x1438d4c80 (0x285da5c00:0) [65536x133] 7.828125 1.667969 -1.150391 .. | |
|<- 1. 0x1438d4c80 (0x285da5c00:0) [65536x133] 0.928711 0.001961 0.000117 .. | |
CCV_NNC_GEMM_FORWARD [167]: [2] -> [1] (0) | |
Wait: (0, 7) | |
|-> 1. 0x1438d4d60 (0x285da5c00:0) [2x8x4096x133] 0.928711 0.001961 0.000117 .. | |
|-> 2. 0x1438a1730 (0x285da5c80:0) [2x8x133x40] 0.030670 -0.073059 -0.036987 .. | |
|<- 1. 0x1438a17a0 (0x285da56c0:0) [2x8x4096x40] 0.064331 -0.074341 -0.010612 .. | |
CCV_NNC_TRANSPOSE_FORWARD [168]: [1] -> [1] (0) | |
|-> 1. 0x1438d4dd0 (0x285da56c0:0) [2x8x4096x40] 0.064331 -0.074341 -0.010612 .. | |
|<- 1. 0x1438a1810 (0x285da5940:0) [2x4096x8x40] 0.064331 -0.074341 -0.010612 .. | |
CCV_NNC_GEMM_FORWARD [169]: [3] -> [1] (0) | |
|-> 1. 0x1438d4e40 (0x285da5940:0) [2x4096x320] 0.064331 -0.074341 -0.010612 .. | |
|-> 2. 0x1438be370 (0x285d85140:0) [320x320] 0.006714 -0.007145 0.013000 .. | |
|-> 3. 0x1438be3e0 (0x285d849c0:0) [320] 0.037170 -0.006664 0.000309 .. | |
|<- 1. 0x1438a1880 (0x285da5a80:0) [2x4096x320] 0.043182 0.030182 0.011131 .. | |
CCV_NNC_ADD_FORWARD [170]: [2] -> [1] (0) | |
|-> 1. 0x1438a1880 (0x285da5a80:0) [2x4096x320] 0.043182 0.030182 0.011131 .. | |
|-> 2. 0x1438a12d0 (0x285da5ac0:0) [2x4096x320] 0.393555 0.365234 -0.132324 .. | |
|<- 1. 0x1438a1880 (0x285da5a80:0) [2x4096x320] 0.436768 0.395508 -0.121216 .. | |
CCV_NNC_LAYER_NORM_FORWARD [171]: [3] -> [3] (0) | |
|-> 1. 0x1438a1880 (0x285da5a80:0) [2x4096x320] 0.436768 0.395508 -0.121216 .. | |
|-> 2. 0x1438be450 (0x285d84ac0:0) [1x1x320] 0.416260 0.481934 0.441650 .. | |
|-> 3. 0x1438be4c0 (0x285d84a00:0) [1x1x320] -0.141479 -0.019455 0.005322 .. | |
|<- 1. 0x1438a18f0 (0x285da5ac0:0) [2x4096x320] 0.462646 0.604492 -0.288818 .. | |
|<- 2. 0x1438a1960 (0x285da5cc0:0) [2x4096x1] 0.054352 .. | |
|<- 3. 0x1438a19d0 (0x285da5d00:0) [2x4096x1] 3.794922 .. | |
Emit: (0, 8) | |
CCV_NNC_GEMM_FORWARD [172]: [3] -> [1] (0) | |
|-> 1. 0x1438a18f0 (0x285da5ac0:0) [2x4096x320] 0.462646 0.604492 -0.288818 .. | |
|-> 2. 0x1438be530 (0x285d84900:0) [1280x320] 0.018341 -0.062164 0.038361 .. | |
|-> 3. 0x1438be5a0 (0x285d851c0:0) [1280] 0.033142 -0.048279 -0.067139 .. | |
|<- 1. 0x1438a1a40 (0x285da5d40:0) [2x4096x1280] 0.161499 -0.139038 -1.244141 .. | |
CCV_NNC_GELU_FORWARD [173]: [1] -> [1] (0) | |
|-> 1. 0x1438a1a40 (0x285da5d40:0) [2x4096x1280] 0.161499 -0.139038 -1.244141 .. | |
|<- 1. 0x1438a1a40 (0x285da5d40:0) [2x4096x1280] 0.091125 -0.061829 -0.132812 .. | |
CCV_NNC_GEMM_FORWARD [174]: [3] -> [1] (1) | |
Wait: (1, 8) | |
|-> 1. 0x1438a18f0 (0x285da5ac0:0) [2x4096x320] 0.462646 0.604492 -0.288818 .. | |
|-> 2. 0x1438be610 (0x285d84b00:0) [1280x320] -0.035797 0.002018 0.014442 .. | |
|-> 3. 0x1438be680 (0x285d84940:0) [1280] 0.006767 0.075500 0.015762 .. | |
|<- 1. 0x1438a1ab0 (0x285da5d80:0) [2x4096x1280] -0.197021 0.565430 0.207397 .. | |
Emit: (1, 9) | |
CCV_NNC_MUL_FORWARD [175]: [2] -> [1] (0) | |
Wait: (0, 9) | |
|-> 1. 0x1438a1ab0 (0x285da5d80:0) [2x4096x1280] -0.197021 0.565430 0.207397 .. | |
|-> 2. 0x1438a1a40 (0x285da5d40:0) [2x4096x1280] 0.091125 -0.061829 -0.132812 .. | |
|<- 1. 0x1438a1ab0 (0x285da5d80:0) [2x4096x1280] -0.017960 -0.034973 -0.027542 .. | |
CCV_NNC_GEMM_FORWARD [176]: [3] -> [1] (0) | |
|-> 1. 0x1438a1ab0 (0x285da5d80:0) [2x4096x1280] -0.017960 -0.034973 -0.027542 .. | |
|-> 2. 0x1438be6f0 (0x285d84a80:0) [320x1280] 0.078674 0.009918 -0.000766 .. | |
|-> 3. 0x1438be760 (0x285d848c0:0) [320] -0.005562 0.002239 -0.023773 .. | |
|<- 1. 0x1438a1b20 (0x285da56c0:0) [2x4096x320] 0.103027 -0.406494 0.565430 .. | |
CCV_NNC_ADD_FORWARD [177]: [2] -> [1] (0) | |
|-> 1. 0x1438a1b20 (0x285da56c0:0) [2x4096x320] 0.103027 -0.406494 0.565430 .. | |
|-> 2. 0x1438a1880 (0x285da5a80:0) [2x4096x320] 0.436768 0.395508 -0.121216 .. | |
|<- 1. 0x1438a1b20 (0x285da56c0:0) [2x4096x320] 0.540039 -0.010986 0.444336 .. | |
CCV_NNC_CONVOLUTION_FORWARD [178]: [3] -> [1] (0) | |
|-> 1. 0x1438d4eb0 (0x285da56c0:0) [2x64x64x320] 0.540039 -0.010986 0.444336 .. | |
|-> 2. 0x1438be7d0 (0x285d84b40:0) [320x320x1x1] -0.025055 .. | |
|-> 3. 0x1438be840 (0x285d84980:0) [320] -0.039307 -0.017242 -0.024658 .. | |
|<- 1. 0x1438a1b90 (0x285da5680:0) [2x64x64x320] -0.526367 -0.144165 0.465576 .. | |
CCV_NNC_ADD_FORWARD [179]: [2] -> [1] (0) | |
|-> 1. 0x1438a1b90 (0x285da5680:0) [2x64x64x320] -0.526367 -0.144165 0.465576 .. | |
|-> 2. 0x1438a04d0 (0x285da5840:0) [2x64x64x320] 0.131836 -2.232422 0.687500 .. | |
|<- 1. 0x143909a80 (0x285e6d340:0) [2x64x64x320] -0.394531 -2.376953 1.153320 .. | |
CCV_NNC_GROUP_NORM_FORWARD [180]: [3] -> [3] (0) | |
|-> 1. 0x143909a80 (0x285e6d340:0) [2x64x64x320] -0.394531 -2.376953 1.153320 .. | |
|-> 2. 0x1438be8b0 (0x285d84a40:0) [1x1x1x320] 0.416992 0.220825 0.264160 .. | |
|-> 3. 0x1438be920 (0x285d84200:0) [1x1x1x320] -0.109131 0.241455 -0.181763 .. | |
|<- 1. 0x1438a1c00 (0x285da5680:0) [2x64x64x320] -0.260498 -0.254639 0.110901 .. | |
|<- 2. 0x1438a1c70 (0x285da5740:0) [2x1x1x32] -0.012650 -0.262451 -0.010139 .. | |
|<- 3. 0x1438a1ce0 (0x285da5700:0) [2x1x1x32] 0.950195 1.647461 5.222656 .. | |
CCV_NNC_SWISH_FORWARD [181]: [1] -> [1] (0) | |
|-> 1. 0x1438a1c00 (0x285da5680:0) [2x64x64x320] -0.260498 -0.254639 0.110901 .. | |
|<- 1. 0x1438a1c00 (0x285da5680:0) [2x64x64x320] -0.113403 -0.111206 0.058533 .. | |
CCV_NNC_CONVOLUTION_FORWARD [182]: [3] -> [1] (0) | |
|-> 1. 0x1438a1c00 (0x285da5680:0) [2x64x64x320] -0.113403 -0.111206 0.058533 .. | |
|-> 2. 0x1438bea70 (0x285d85180:0) [320x320x3x3] 0.032501 0.068237 0.137939 .. | |
|-> 3. 0x1438beae0 (0x285d843c0:0) [320] 0.019516 0.005825 -0.055542 .. | |
|<- 1. 0x1438a1dc0 (0x285da56c0:0) [2x64x64x320] -0.125488 -0.400635 -0.284424 .. | |
CCV_NNC_ADD_FORWARD [183]: [2] -> [1] (0) | |
Wait: (0, 10) | |
|-> 1. 0x1438a1dc0 (0x285da56c0:0) [2x64x64x320] -0.125488 -0.400635 -0.284424 .. | |
|-> 2. 0x1438d4f20 (0x285da5dc0:0) [2x1x1x320] 0.114136 0.382324 -0.697754 .. | |
|<- 1. 0x1438a1dc0 (0x285da56c0:0) [2x64x64x320] -0.011353 -0.018311 -0.982422 .. | |
CCV_NNC_GROUP_NORM_FORWARD [184]: [3] -> [3] (0) | |
|-> 1. 0x1438a1dc0 (0x285da56c0:0) [2x64x64x320] -0.011353 -0.018311 -0.982422 .. | |
|-> 2. 0x1438beb50 (0x285d852c0:0) [1x1x1x320] 0.733398 0.608398 0.626465 .. | |
|-> 3. 0x1438bebc0 (0x285d853c0:0) [1x1x1x320] -0.231812 -0.169800 -0.094360 .. | |
|<- 1. 0x1438a1e30 (0x285da5680:0) [2x64x64x320] -0.522461 -0.417969 -1.359375 .. | |
|<- 2. 0x1438a1ea0 (0x285da5e00:0) [2x1x1x32] 0.225830 0.153564 0.310059 .. | |
|<- 3. 0x1438a1f10 (0x285da5800:0) [2x1x1x32] 1.670898 1.156250 0.658203 .. | |
CCV_NNC_SWISH_FORWARD [185]: [1] -> [1] (0) | |
|-> 1. 0x1438a1e30 (0x285da5680:0) [2x64x64x320] -0.522461 -0.417969 -1.359375 .. | |
|<- 1. 0x1438a1e30 (0x285da5680:0) [2x64x64x320] -0.194458 -0.165894 -0.277832 .. | |
CCV_NNC_CONVOLUTION_FORWARD [186]: [3] -> [1] (0) | |
|-> 1. 0x1438a1e30 (0x285da5680:0) [2x64x64x320] -0.194458 -0.165894 -0.277832 .. | |
|-> 2. 0x1438bec30 (0x285d85400:0) [320x320x3x3] -0.011002 -0.015823 -0.001194 .. | |
|-> 3. 0x1438beca0 (0x285d85440:0) [320] -0.017487 0.020096 -0.013153 .. | |
|<- 1. 0x1438a1f80 (0x285da56c0:0) [2x64x64x320] -0.270020 0.777832 -0.507324 .. | |
CCV_NNC_ADD_FORWARD [187]: [2] -> [1] (0) | |
|-> 1. 0x143909a80 (0x285e6d340:0) [2x64x64x320] -0.394531 -2.376953 1.153320 .. | |
|-> 2. 0x1438a1f80 (0x285da56c0:0) [2x64x64x320] -0.270020 0.777832 -0.507324 .. | |
|<- 1. 0x1438a1ff0 (0x285da5840:0) [2x64x64x320] -0.664551 -1.599609 0.645996 .. | |
CCV_NNC_GROUP_NORM_FORWARD [188]: [3] -> [3] (0) | |
|-> 1. 0x1438a1ff0 (0x285da5840:0) [2x64x64x320] -0.664551 -1.599609 0.645996 .. | |
|-> 2. 0x1438bed10 (0x285d85480:0) [1x1x1x320] 0.402344 0.316650 0.406982 .. | |
|-> 3. 0x1438bed80 (0x285d854c0:0) [1x1x1x320] -0.076233 0.042206 -0.025192 .. | |
|<- 1. 0x1438a2060 (0x285da5680:0) [2x64x64x320] -0.560059 -0.807617 0.330811 .. | |
|<- 2. 0x1438a20d0 (0x285da5740:0) [2x1x1x32] 0.093933 -0.135376 -0.198242 .. | |
|<- 3. 0x1438a2140 (0x285da5700:0) [2x1x1x32] 1.584961 2.177734 2.802734 .. | |
CCV_NNC_CONVOLUTION_FORWARD [189]: [3] -> [1] (0) | |
|-> 1. 0x1438a2060 (0x285da5680:0) [2x64x64x320] -0.560059 -0.807617 0.330811 .. | |
|-> 2. 0x1438bedf0 (0x285d85500:0) [320x320x1x1] 0.017532 .. | |
|-> 3. 0x1438bee60 (0x285d85540:0) [320] -0.068604 0.206543 -0.054993 .. | |
|<- 1. 0x1438a21b0 (0x285da56c0:0) [2x64x64x320] -0.506348 -0.774414 0.334961 .. | |
CCV_NNC_LAYER_NORM_FORWARD [190]: [3] -> [3] (0) | |
|-> 1. 0x1438d4f90 (0x285da56c0:0) [2x4096x320] -0.506348 -0.774414 0.334961 .. | |
|-> 2. 0x1438beed0 (0x285d85580:0) [1x1x320] 0.716309 0.794922 0.938965 .. | |
|-> 3. 0x1438bef40 (0x285d855c0:0) [1x1x320] 0.058411 -0.022797 -0.025116 .. | |
|<- 1. 0x1438a2220 (0x285da5680:0) [2x4096x320] -0.615234 -1.161133 0.540527 .. | |
|<- 2. 0x1438a2290 (0x285da5e40:0) [2x4096x1] 0.006432 .. | |
|<- 3. 0x1438a2300 (0x285da5880:0) [2x4096x1] 1.833984 .. | |
Emit: (0, 11) | |
CCV_NNC_GEMM_FORWARD [191]: [2] -> [1] (0) | |
|-> 1. 0x1438a2220 (0x285da5680:0) [2x4096x320] -0.615234 -1.161133 0.540527 .. | |
|-> 2. 0x1438befb0 (0x285d85600:0) [320x320] 0.098633 -0.015945 -0.021072 .. | |
|<- 1. 0x1438a2370 (0x285da5900:0) [2x4096x320] -0.845703 0.704590 -1.113281 .. | |
CCV_NNC_SCALAR_MUL_FORWARD [192]: [1] -> [1] (0) | |
|-> 1. 0x1438a2370 (0x285da5900:0) [2x4096x320] -0.845703 0.704590 -1.113281 .. | |
|<- 1. 0x1438a2370 (0x285da5900:0) [2x4096x320] -0.133667 0.111389 -0.176025 .. | |
CCV_NNC_TRANSPOSE_FORWARD [193]: [1] -> [1] (0) | |
|-> 1. 0x1438d5070 (0x285da5900:0) [2x4096x8x40] -0.133667 0.111389 -0.176025 .. | |
|<- 1. 0x1438a24c0 (0x285da5e80:0) [2x8x4096x40] -0.133667 0.111389 -0.176025 .. | |
CCV_NNC_GEMM_FORWARD [194]: [2] -> [1] (1) | |
Wait: (1, 11) | |
|-> 1. 0x1438a2220 (0x285da5680:0) [2x4096x320] -0.615234 -1.161133 0.540527 .. | |
|-> 2. 0x1438bf020 (0x285d85640:0) [320x320] 0.096313 0.077942 0.058289 .. | |
|<- 1. 0x1438a23e0 (0x285da5940:0) [2x4096x320] -1.801758 -0.114258 -0.691895 .. | |
CCV_NNC_TRANSPOSE_FORWARD [195]: [1] -> [1] (1) | |
|-> 1. 0x1438d5000 (0x285da5940:0) [2x4096x8x40] -1.801758 -0.114258 -0.691895 .. | |
|<- 1. 0x1438a2450 (0x285da59c0:0) [2x8x4096x40] -1.801758 -0.114258 -0.691895 .. | |
Emit: (1, 12) | |
CCV_NNC_GEMM_FORWARD [196]: [2] -> [1] (2) | |
Wait: (2, 11) | |
|-> 1. 0x1438a2220 (0x285da5680:0) [2x4096x320] -0.615234 -1.161133 0.540527 .. | |
|-> 2. 0x1438bf090 (0x285d85680:0) [320x320] 0.093872 0.079895 -0.008286 .. | |
|<- 1. 0x1438a2530 (0x285da5ec0:0) [2x4096x320] -1.234375 0.313965 -0.631348 .. | |
CCV_NNC_TRANSPOSE_FORWARD [197]: [1] -> [1] (2) | |
|-> 1. 0x1438d51c0 (0x285da5ec0:0) [2x4096x8x40] -1.234375 0.313965 -0.631348 .. | |
|<- 1. 0x1438a2610 (0x285da5980:0) [2x8x4096x40] -1.234375 0.313965 -0.631348 .. | |
Emit: (2, 13) | |
CCV_NNC_GEMM_FORWARD [198]: [2] -> [1] (0) | |
Wait: (0, 12) | |
|-> 1. 0x1438d5150 (0x285da5e80:0) [1x4096x40] -0.133667 0.111389 -0.176025 .. | |
|-> 2. 0x1438d50e0 (0x285da59c0:0) [1x4096x40] -1.801758 -0.114258 -0.691895 .. | |
|<- 1. 0x1438a25a0 (0x285da5a40:0) [1x4096x4096] 9.351562 8.132812 8.390625 .. | |
CCV_NNC_SOFTMAX_FORWARD [199]: [1] -> [1] (0) | |
|-> 1. 0x1438d5230 (0x285da5a40:0) [4096x4096] 9.351562 8.132812 8.390625 .. | |
|<- 1. 0x1438d5230 (0x285da5a40:0) [4096x4096] 0.011200 0.003311 0.004284 .. | |
CCV_NNC_GEMM_FORWARD [200]: [2] -> [1] (0) | |
Wait: (0, 13) | |
|-> 1. 0x1438d5310 (0x285da5a40:0) [1x4096x4096] 0.011200 0.003311 0.004284 .. | |
|-> 2. 0x1438d52a0 (0x285da5980:0) [1x4096x40] -1.234375 0.313965 -0.631348 .. | |
|<- 1. 0x1438d7f90 (0x285da5680:0) [1x4096x40] -0.480469 -0.030075 -0.577637 .. | |
CCV_NNC_GEMM_FORWARD [201]: [2] -> [1] (0) | |
|-> 1. 0x1438d5430 (0x285da5e80:0) [1x4096x40] 0.036346 -0.232666 -0.030319 .. | |
|-> 2. 0x1438d5380 (0x285da59c0:0) [1x4096x40] 0.977051 -1.407227 1.997070 .. | |
|<- 1. 0x1438a2680 (0x285da5a40:0) [1x4096x4096] 9.007812 7.761719 7.343750 .. | |
CCV_NNC_SOFTMAX_FORWARD [202]: [1] -> [1] (0) | |
|-> 1. 0x1438d54e0 (0x285da5a40:0) [4096x4096] 9.007812 7.761719 7.343750 .. | |
|<- 1. 0x1438d54e0 (0x285da5a40:0) [4096x4096] 0.020401 0.005867 0.003862 .. | |
CCV_NNC_GEMM_FORWARD [203]: [2] -> [1] (0) | |
|-> 1. 0x1438d5600 (0x285da5a40:0) [1x4096x4096] 0.020401 0.005867 0.003862 .. | |
|-> 2. 0x1438d5550 (0x285da5980:0) [1x4096x40] 0.047607 0.135132 0.761719 .. | |
|<- 1. 0x1438d8000 (0x285da5680:0) [1x4096x40] -0.014862 0.101135 0.027740 .. | |
CCV_NNC_GEMM_FORWARD [204]: [2] -> [1] (0) | |
|-> 1. 0x1438d5720 (0x285da5e80:0) [1x4096x40] 0.040222 0.023972 -0.001418 .. | |
|-> 2. 0x1438d5670 (0x285da59c0:0) [1x4096x40] 1.561523 -1.250000 -0.090881 .. | |
|<- 1. 0x1438a26f0 (0x285da5a40:0) [1x4096x4096] 4.054688 4.242188 3.722656 .. | |
CCV_NNC_SOFTMAX_FORWARD [205]: [1] -> [1] (0) | |
|-> 1. 0x1438d57d0 (0x285da5a40:0) [4096x4096] 4.054688 4.242188 3.722656 .. | |
|<- 1. 0x1438d57d0 (0x285da5a40:0) [4096x4096] 0.001454 0.001754 0.001043 .. | |
CCV_NNC_GEMM_FORWARD [206]: [2] -> [1] (0) | |
|-> 1. 0x1438d58f0 (0x285da5a40:0) [1x4096x4096] 0.001454 0.001754 0.001043 .. | |
|-> 2. 0x1438d5840 (0x285da5980:0) [1x4096x40] 0.251709 -0.178223 0.285889 .. | |
|<- 1. 0x1438d80b0 (0x285da5680:0) [1x4096x40] 0.086182 0.041504 0.114563 .. | |
CCV_NNC_GEMM_FORWARD [207]: [2] -> [1] (0) | |
|-> 1. 0x1438d5a10 (0x285da5e80:0) [1x4096x40] 0.019974 -0.073975 0.106140 .. | |
|-> 2. 0x1438d5960 (0x285da59c0:0) [1x4096x40] -0.028793 -1.217773 -0.375977 .. | |
|<- 1. 0x1438a2760 (0x285da5a40:0) [1x4096x4096] 4.730469 3.630859 3.685547 .. | |
CCV_NNC_SOFTMAX_FORWARD [208]: [1] -> [1] (0) | |
|-> 1. 0x1438d5ac0 (0x285da5a40:0) [4096x4096] 4.730469 3.630859 3.685547 .. | |
|<- 1. 0x1438d5ac0 (0x285da5a40:0) [4096x4096] 0.004051 0.001349 0.001425 .. | |
CCV_NNC_GEMM_FORWARD [209]: [2] -> [1] (0) | |
|-> 1. 0x1438d5be0 (0x285da5a40:0) [1x4096x4096] 0.004051 0.001349 0.001425 .. | |
|-> 2. 0x1438d5b30 (0x285da5980:0) [1x4096x40] 0.143555 -0.132324 1.009766 .. | |
|<- 1. 0x1438d8160 (0x285da5680:0) [1x4096x40] 0.039490 0.045532 0.094360 .. | |
CCV_NNC_GEMM_FORWARD [210]: [2] -> [1] (0) | |
|-> 1. 0x1438d5d00 (0x285da5e80:0) [1x4096x40] -0.148804 0.187744 -0.056671 .. | |
|-> 2. 0x1438d5c50 (0x285da59c0:0) [1x4096x40] -0.924316 1.144531 -1.469727 .. | |
|<- 1. 0x1438a27d0 (0x285da5a40:0) [1x4096x4096] 7.554688 5.988281 5.781250 .. | |
CCV_NNC_SOFTMAX_FORWARD [211]: [1] -> [1] (0) | |
|-> 1. 0x1438d5db0 (0x285da5a40:0) [4096x4096] 7.554688 5.988281 5.781250 .. | |
|<- 1. 0x1438d5db0 (0x285da5a40:0) [4096x4096] 0.014046 0.002932 0.002384 .. | |
CCV_NNC_GEMM_FORWARD [212]: [2] -> [1] (0) | |
|-> 1. 0x1438d5ed0 (0x285da5a40:0) [1x4096x4096] 0.014046 0.002932 0.002384 .. | |
|-> 2. 0x1438d5e20 (0x285da5980:0) [1x4096x40] -0.618652 0.281982 0.310791 .. | |
|<- 1. 0x1438d8210 (0x285da5680:0) [1x4096x40] 0.006836 -0.060699 0.176758 .. | |
CCV_NNC_GEMM_FORWARD [213]: [2] -> [1] (0) | |
|-> 1. 0x1438d5ff0 (0x285da5e80:0) [1x4096x40] 0.218262 -0.120422 0.347412 .. | |
|-> 2. 0x1438d5f40 (0x285da59c0:0) [1x4096x40] -0.532715 -0.188354 4.175781 .. | |
|<- 1. 0x1438a2840 (0x285da5a40:0) [1x4096x4096] 10.250000 7.101562 7.339844 .. | |
CCV_NNC_SOFTMAX_FORWARD [214]: [1] -> [1] (0) | |
|-> 1. 0x1438d60a0 (0x285da5a40:0) [4096x4096] 10.250000 7.101562 7.339844 .. | |
|<- 1. 0x1438d60a0 (0x285da5a40:0) [4096x4096] 0.023895 0.001026 0.001302 .. | |
CCV_NNC_GEMM_FORWARD [215]: [2] -> [1] (0) | |
|-> 1. 0x1438d61c0 (0x285da5a40:0) [1x4096x4096] 0.023895 0.001026 0.001302 .. | |
|-> 2. 0x1438d6110 (0x285da5980:0) [1x4096x40] -0.437500 0.525391 -0.966309 .. | |
|<- 1. 0x1438d82c0 (0x285da5680:0) [1x4096x40] -0.296143 0.230469 -0.135742 .. | |
CCV_NNC_GEMM_FORWARD [216]: [2] -> [1] (0) | |
|-> 1. 0x1438d62e0 (0x285da5e80:0) [1x4096x40] -0.085999 0.054932 -0.167969 .. | |
|-> 2. 0x1438d6230 (0x285da59c0:0) [1x4096x40] -0.529297 -0.944824 -0.623047 .. | |
|<- 1. 0x1438a28b0 (0x285da5a40:0) [1x4096x4096] 7.566406 6.777344 6.683594 .. | |
CCV_NNC_SOFTMAX_FORWARD [217]: [1] -> [1] (0) | |
|-> 1. 0x1438d6390 (0x285da5a40:0) [4096x4096] 7.566406 6.777344 6.683594 .. | |
|<- 1. 0x1438d6390 (0x285da5a40:0) [4096x4096] 0.010353 0.004704 0.004280 .. | |
CCV_NNC_GEMM_FORWARD [218]: [2] -> [1] (0) | |
|-> 1. 0x1438d64b0 (0x285da5a40:0) [1x4096x4096] 0.010353 0.004704 0.004280 .. | |
|-> 2. 0x1438d6400 (0x285da5980:0) [1x4096x40] -0.015900 1.032227 -0.623047 .. | |
|<- 1. 0x1438d8370 (0x285da5680:0) [1x4096x40] 0.037140 0.132935 -0.143066 .. | |
CCV_NNC_GEMM_FORWARD [219]: [2] -> [1] (0) | |
|-> 1. 0x1438d65d0 (0x285da5e80:0) [1x4096x40] 0.319580 0.124512 -0.062927 .. | |
|-> 2. 0x1438d6520 (0x285da59c0:0) [1x4096x40] 1.286133 0.171265 0.064270 .. | |
|<- 1. 0x1438a2920 (0x285da5a40:0) [1x4096x4096] 6.781250 6.187500 5.871094 .. | |
CCV_NNC_SOFTMAX_FORWARD [220]: [1] -> [1] (0) | |
|-> 1. 0x1438d6680 (0x285da5a40:0) [4096x4096] 6.781250 6.187500 5.871094 .. | |
|<- 1. 0x1438d6680 (0x285da5a40:0) [4096x4096] 0.008736 0.004826 0.003517 .. | |
CCV_NNC_GEMM_FORWARD [221]: [2] -> [1] (0) | |
|-> 1. 0x1438d67a0 (0x285da5a40:0) [1x4096x4096] 0.008736 0.004826 0.003517 .. | |
|-> 2. 0x1438d66f0 (0x285da5980:0) [1x4096x40] 0.427734 1.020508 -0.391602 .. | |
|<- 1. 0x1438d8420 (0x285da5680:0) [1x4096x40] 0.159302 0.101929 0.190674 .. | |
CCV_NNC_GEMM_FORWARD [222]: [2] -> [1] (0) | |
|-> 1. 0x1438d68c0 (0x285da5e80:0) [1x4096x40] -0.121582 0.141235 -0.150635 .. | |
|-> 2. 0x1438d6810 (0x285da59c0:0) [1x4096x40] -1.795898 0.127197 -0.631836 .. | |
|<- 1. 0x1438a2990 (0x285da5a40:0) [1x4096x4096] 9.343750 7.875000 8.054688 .. | |
CCV_NNC_SOFTMAX_FORWARD [223]: [1] -> [1] (0) | |
|-> 1. 0x1438d6970 (0x285da5a40:0) [4096x4096] 9.343750 7.875000 8.054688 .. | |
|<- 1. 0x1438d6970 (0x285da5a40:0) [4096x4096] 0.013000 0.002993 0.003582 .. | |
CCV_NNC_GEMM_FORWARD [224]: [2] -> [1] (0) | |
|-> 1. 0x1438d6a90 (0x285da5a40:0) [1x4096x4096] 0.013000 0.002993 0.003582 .. | |
|-> 2. 0x1438d69e0 (0x285da5980:0) [1x4096x40] -1.347656 0.064209 -0.540039 .. | |
|<- 1. 0x1438d84d0 (0x285da5680:0) [1x4096x40] -0.609375 -0.265625 -0.527832 .. | |
CCV_NNC_GEMM_FORWARD [225]: [2] -> [1] (0) | |
|-> 1. 0x1438d6bb0 (0x285da5e80:0) [1x4096x40] 0.030289 -0.225830 -0.026382 .. | |
|-> 2. 0x1438d6b00 (0x285da59c0:0) [1x4096x40] 1.179688 -1.460938 2.224609 .. | |
|<- 1. 0x1438a2a00 (0x285da5a40:0) [1x4096x4096] 8.429688 7.464844 6.949219 .. | |
CCV_NNC_SOFTMAX_FORWARD [226]: [1] -> [1] (0) | |
|-> 1. 0x1438d6c60 (0x285da5a40:0) [4096x4096] 8.429688 7.464844 6.949219 .. | |
|<- 1. 0x1438d6c60 (0x285da5a40:0) [4096x4096] 0.012314 0.004692 0.002802 .. | |
CCV_NNC_GEMM_FORWARD [227]: [2] -> [1] (0) | |
|-> 1. 0x1438d6d80 (0x285da5a40:0) [1x4096x4096] 0.012314 0.004692 0.002802 .. | |
|-> 2. 0x1438d6cd0 (0x285da5980:0) [1x4096x40] 0.073669 0.051788 0.720703 .. | |
|<- 1. 0x1438d8580 (0x285da5680:0) [1x4096x40] 0.076477 0.103088 -0.050232 .. | |
CCV_NNC_GEMM_FORWARD [228]: [2] -> [1] (0) | |
|-> 1. 0x1438d6ea0 (0x285da5e80:0) [1x4096x40] 0.018051 0.040741 0.011230 .. | |
|-> 2. 0x1438d6df0 (0x285da59c0:0) [1x4096x40] 1.687500 -1.275391 -0.047729 .. | |
|<- 1. 0x1438a2a70 (0x285da5a40:0) [1x4096x4096] 3.875000 3.882812 3.503906 .. | |
CCV_NNC_SOFTMAX_FORWARD [229]: [1] -> [1] (0) | |
|-> 1. 0x1438d6f50 (0x285da5a40:0) [4096x4096] 3.875000 3.882812 3.503906 .. | |
|<- 1. 0x1438d6f50 (0x285da5a40:0) [4096x4096] 0.001207 0.001217 0.000833 .. | |
CCV_NNC_GEMM_FORWARD [230]: [2] -> [1] (0) | |
|-> 1. 0x1438d7070 (0x285da5a40:0) [1x4096x4096] 0.001207 0.001217 0.000833 .. | |
|-> 2. 0x1438d6fc0 (0x285da5980:0) [1x4096x40] 0.242554 -0.054993 0.248047 .. | |
|<- 1. 0x1438d8630 (0x285da5680:0) [1x4096x40] -0.027039 0.208130 0.120972 .. | |
CCV_NNC_GEMM_FORWARD [231]: [2] -> [1] (0) | |
|-> 1. 0x1438d7190 (0x285da5e80:0) [1x4096x40] 0.043915 -0.065063 0.132202 .. | |
|-> 2. 0x1438d70e0 (0x285da59c0:0) [1x4096x40] 0.310303 -1.222656 -0.413330 .. | |
|<- 1. 0x1438a2ae0 (0x285da5a40:0) [1x4096x4096] 4.406250 3.453125 3.429688 .. | |
CCV_NNC_SOFTMAX_FORWARD [232]: [1] -> [1] (0) | |
|-> 1. 0x1438d7240 (0x285da5a40:0) [4096x4096] 4.406250 3.453125 3.429688 .. | |
|<- 1. 0x1438d7240 (0x285da5a40:0) [4096x4096] 0.003157 0.001217 0.001189 .. | |
CCV_NNC_GEMM_FORWARD [233]: [2] -> [1] (0) | |
|-> 1. 0x1438d7360 (0x285da5a40:0) [1x4096x4096] 0.003157 0.001217 0.001189 .. | |
|-> 2. 0x1438d72b0 (0x285da5980:0) [1x4096x40] 0.327148 -0.010162 0.989258 .. | |
|<- 1. 0x1438d86e0 (0x285da5680:0) [1x4096x40] 0.274902 0.059875 0.136841 .. | |
CCV_NNC_GEMM_FORWARD [234]: [2] -> [1] (0) | |
|-> 1. 0x1438d7480 (0x285da5e80:0) [1x4096x40] -0.153931 0.160278 -0.040253 .. | |
|-> 2. 0x1438d73d0 (0x285da59c0:0) [1x4096x40] -0.802246 1.071289 -1.416016 .. | |
|<- 1. 0x1438a2b50 (0x285da5a40:0) [1x4096x4096] 7.312500 5.859375 5.621094 .. | |
CCV_NNC_SOFTMAX_FORWARD [235]: [1] -> [1] (0) | |
|-> 1. 0x1438d7530 (0x285da5a40:0) [4096x4096] 7.312500 5.859375 5.621094 .. | |
|<- 1. 0x1438d7530 (0x285da5a40:0) [4096x4096] 0.010078 0.002357 0.001858 .. | |
CCV_NNC_GEMM_FORWARD [236]: [2] -> [1] (0) | |
|-> 1. 0x1438d7650 (0x285da5a40:0) [1x4096x4096] 0.010078 0.002357 0.001858 .. | |
|-> 2. 0x1438d75a0 (0x285da5980:0) [1x4096x40] -0.635742 0.504883 0.295898 .. | |
|<- 1. 0x1438d8790 (0x285da5680:0) [1x4096x40] -0.069641 0.125977 0.092590 .. | |
CCV_NNC_GEMM_FORWARD [237]: [2] -> [1] (0) | |
|-> 1. 0x1438d7770 (0x285da5e80:0) [1x4096x40] 0.232300 -0.134033 0.339844 .. | |
|-> 2. 0x1438d76c0 (0x285da59c0:0) [1x4096x40] -0.541992 -0.197754 4.132812 .. | |
|<- 1. 0x1438a2bc0 (0x285da5a40:0) [1x4096x4096] 9.828125 6.730469 6.972656 .. | |
CCV_NNC_SOFTMAX_FORWARD [238]: [1] -> [1] (0) | |
|-> 1. 0x1438d7820 (0x285da5a40:0) [4096x4096] 9.828125 6.730469 6.972656 .. | |
|<- 1. 0x1438d7820 (0x285da5a40:0) [4096x4096] 0.019714 0.000890 0.001135 .. | |
CCV_NNC_GEMM_FORWARD [239]: [2] -> [1] (0) | |
|-> 1. 0x1438d7940 (0x285da5a40:0) [1x4096x4096] 0.019714 0.000890 0.001135 .. | |
|-> 2. 0x1438d7890 (0x285da5980:0) [1x4096x40] -0.355225 0.519043 -0.960938 .. | |
|<- 1. 0x1438d8840 (0x285da5680:0) [1x4096x40] -0.189331 0.215210 -0.134521 .. | |
CCV_NNC_GEMM_FORWARD [240]: [2] -> [1] (0) | |
|-> 1. 0x1438d7a60 (0x285da5e80:0) [1x4096x40] -0.090820 0.027908 -0.152954 .. | |
|-> 2. 0x1438d79b0 (0x285da59c0:0) [1x4096x40] -0.628418 -1.050781 -0.554199 .. | |
|<- 1. 0x1438a2c30 (0x285da5a40:0) [1x4096x4096] 7.300781 6.683594 6.578125 .. | |
CCV_NNC_SOFTMAX_FORWARD [241]: [1] -> [1] (0) | |
|-> 1. 0x1438d7b10 (0x285da5a40:0) [4096x4096] 7.300781 6.683594 6.578125 .. | |
|<- 1. 0x1438d7b10 (0x285da5a40:0) [4096x4096] 0.007607 0.004105 0.003693 .. | |
CCV_NNC_GEMM_FORWARD [242]: [2] -> [1] (0) | |
|-> 1. 0x1438d7c30 (0x285da5a40:0) [1x4096x4096] 0.007607 0.004105 0.003693 .. | |
|-> 2. 0x1438d7b80 (0x285da5980:0) [1x4096x40] -0.047211 1.030273 -0.604980 .. | |
|<- 1. 0x1438d88f0 (0x285da5680:0) [1x4096x40] 0.035095 0.157349 -0.082520 .. | |
CCV_NNC_GEMM_FORWARD [243]: [2] -> [1] (0) | |
|-> 1. 0x1438d7d50 (0x285da5e80:0) [1x4096x40] 0.318115 0.130615 -0.016373 .. | |
|-> 2. 0x1438d7ca0 (0x285da59c0:0) [1x4096x40] 1.349609 0.178345 0.092834 .. | |
|<- 1. 0x1438a2ca0 (0x285da5a40:0) [1x4096x4096] 6.468750 5.933594 5.675781 .. | |
CCV_NNC_SOFTMAX_FORWARD [244]: [1] -> [1] (0) | |
|-> 1. 0x1438d7e00 (0x285da5a40:0) [4096x4096] 6.468750 5.933594 5.675781 .. | |
|<- 1. 0x1438d7e00 (0x285da5a40:0) [4096x4096] 0.006683 0.003914 0.003025 .. | |
CCV_NNC_GEMM_FORWARD [245]: [2] -> [1] (0) | |
|-> 1. 0x1438d7f20 (0x285da5a40:0) [1x4096x4096] 0.006683 0.003914 0.003025 .. | |
|-> 2. 0x1438d7e70 (0x285da5980:0) [1x4096x40] 0.369629 1.071289 -0.148315 .. | |
|<- 1. 0x1438d89a0 (0x285da5680:0) [1x4096x40] 0.111816 0.073914 0.389160 .. | |
CCV_NNC_TRANSPOSE_FORWARD [246]: [1] -> [1] (0) | |
|-> 1. 0x1438d8a50 (0x285da5680:0) [2x8x4096x40] -0.480469 -0.030075 -0.577637 .. | |
|<- 1. 0x1438a2d80 (0x285da5940:0) [2x4096x8x40] -0.480469 -0.030075 -0.577637 .. | |
CCV_NNC_GEMM_FORWARD [247]: [3] -> [1] (0) | |
|-> 1. 0x1438d8ac0 (0x285da5940:0) [2x4096x320] -0.480469 -0.030075 -0.577637 .. | |
|-> 2. 0x1438bf100 (0x285d856c0:0) [320x320] -0.011864 0.022491 0.002018 .. | |
|-> 3. 0x1438bf170 (0x285d85700:0) [320] -0.023834 0.402588 -0.052490 .. | |
|<- 1. 0x1438a2df0 (0x285da5680:0) [2x4096x320] -0.020523 0.836426 -0.084534 .. | |
CCV_NNC_ADD_FORWARD [248]: [2] -> [1] (0) | |
|-> 1. 0x1438a2df0 (0x285da5680:0) [2x4096x320] -0.020523 0.836426 -0.084534 .. | |
|-> 2. 0x1438d4f90 (0x285da56c0:0) [2x4096x320] -0.506348 -0.774414 0.334961 .. | |
|<- 1. 0x1438a2df0 (0x285da5680:0) [2x4096x320] -0.526855 0.062012 0.250488 .. | |
CCV_NNC_LAYER_NORM_FORWARD [249]: [3] -> [3] (0) | |
|-> 1. 0x1438a2df0 (0x285da5680:0) [2x4096x320] -0.526855 0.062012 0.250488 .. | |
|-> 2. 0x1438bf1e0 (0x285d85740:0) [1x1x320] 0.270508 0.379883 0.366699 .. | |
|-> 3. 0x1438bf250 (0x285d85780:0) [1x1x320] -0.055328 -0.174805 -0.028580 .. | |
|<- 1. 0x1438a2e60 (0x285da5940:0) [2x4096x320] -0.341553 -0.124695 0.159546 .. | |
|<- 2. 0x1438a2ed0 (0x285da5b40:0) [2x4096x1] -0.003223 .. | |
|<- 3. 0x1438a2f40 (0x285da5b00:0) [2x4096x1] 2.021484 .. | |
CCV_NNC_GEMM_FORWARD [250]: [2] -> [1] (0) | |
|-> 1. 0x1438a2e60 (0x285da5940:0) [2x4096x320] -0.341553 -0.124695 0.159546 .. | |
|-> 2. 0x1438bf2c0 (0x285d857c0:0) [320x320] 0.007980 0.001403 0.000995 .. | |
|<- 1. 0x1438a2fb0 (0x285da5900:0) [2x4096x320] -0.100891 -0.179932 -0.498535 .. | |
CCV_NNC_SCALAR_MUL_FORWARD [251]: [1] -> [1] (0) | |
|-> 1. 0x1438a2fb0 (0x285da5900:0) [2x4096x320] -0.100891 -0.179932 -0.498535 .. | |
|<- 1. 0x1438a2fb0 (0x285da5900:0) [2x4096x320] -0.015945 -0.028442 -0.078796 .. | |
CCV_NNC_TRANSPOSE_FORWARD [252]: [1] -> [1] (0) | |
|-> 1. 0x1438d8ba0 (0x285da5900:0) [2x4096x8x40] -0.015945 -0.028442 -0.078796 .. | |
|<- 1. 0x1438a3100 (0x285da56c0:0) [2x8x4096x40] -0.015945 -0.028442 -0.078796 .. | |
CCV_NNC_GEMM_FORWARD [253]: [2] -> [1] (0) | |
Wait: (0, 14) | |
|-> 1. 0x1438a3100 (0x285da56c0:0) [2x8x4096x40] -0.015945 -0.028442 -0.078796 .. | |
|-> 2. 0x1438a3090 (0x285da5f40:0) [2x8x133x40] -0.131592 -0.084351 1.820312 .. | |
|<- 1. 0x1438a3170 (0x285da5c00:0) [2x8x4096x133] 4.199219 2.185547 1.363281 .. | |
CCV_NNC_SOFTMAX_FORWARD [254]: [1] -> [1] (0) | |
|-> 1. 0x1438d8c10 (0x285da5c00:0) [65536x133] 4.199219 2.185547 1.363281 .. | |
|<- 1. 0x1438d8c10 (0x285da5c00:0) [65536x133] 0.349121 0.046631 0.020493 .. | |
CCV_NNC_GEMM_FORWARD [255]: [2] -> [1] (0) | |
Wait: (0, 15) | |
|-> 1. 0x1438d8cf0 (0x285da5c00:0) [2x8x4096x133] 0.349121 0.046631 0.020493 .. | |
|-> 2. 0x1438a3250 (0x285da5fc0:0) [2x8x133x40] 0.014427 -0.034271 -0.016800 .. | |
|<- 1. 0x1438a32c0 (0x285da56c0:0) [2x8x4096x40] -0.003622 -0.073608 -0.039703 .. | |
CCV_NNC_TRANSPOSE_FORWARD [256]: [1] -> [1] (0) | |
|-> 1. 0x1438d8d60 (0x285da56c0:0) [2x8x4096x40] -0.003622 -0.073608 -0.039703 .. | |
|<- 1. 0x1438a3330 (0x285da5940:0) [2x4096x8x40] -0.003622 -0.073608 -0.039703 .. | |
CCV_NNC_GEMM_FORWARD [257]: [3] -> [1] (0) | |
|-> 1. 0x1438d8dd0 (0x285da5940:0) [2x4096x320] -0.003622 -0.073608 -0.039703 .. | |
|-> 2. 0x1438bf410 (0x285d85880:0) [320x320] -0.001719 0.002342 0.004265 .. | |
|-> 3. 0x1438bf480 (0x285d858c0:0) [320] 0.001342 0.312988 0.043030 .. | |
|<- 1. 0x1438a33a0 (0x285da5ac0:0) [2x4096x320] 0.007706 0.598145 0.029892 .. | |
CCV_NNC_ADD_FORWARD [258]: [2] -> [1] (0) | |
|-> 1. 0x1438a33a0 (0x285da5ac0:0) [2x4096x320] 0.007706 0.598145 0.029892 .. | |
|-> 2. 0x1438a2df0 (0x285da5680:0) [2x4096x320] -0.526855 0.062012 0.250488 .. | |
|<- 1. 0x1438a33a0 (0x285da5ac0:0) [2x4096x320] -0.519043 0.660156 0.280273 .. | |
CCV_NNC_LAYER_NORM_FORWARD [259]: [3] -> [3] (0) | |
|-> 1. 0x1438a33a0 (0x285da5ac0:0) [2x4096x320] -0.519043 0.660156 0.280273 .. | |
|-> 2. 0x1438bf4f0 (0x285d85900:0) [1x1x320] 0.512207 0.289551 0.570312 .. | |
|-> 3. 0x1438bf560 (0x285d85940:0) [1x1x320] 0.000493 -0.209961 -0.087341 .. | |
|<- 1. 0x1438a3410 (0x285da6000:0) [2x4096x320] -0.515137 0.178833 0.246826 .. | |
|<- 2. 0x1438a3480 (0x285da6040:0) [2x4096x1] -0.013893 .. | |
|<- 3. 0x1438a34f0 (0x285da6080:0) [2x4096x1] 1.992188 .. | |
Emit: (0, 16) | |
CCV_NNC_GEMM_FORWARD [260]: [3] -> [1] (0) | |
|-> 1. 0x1438a3410 (0x285da6000:0) [2x4096x320] -0.515137 0.178833 0.246826 .. | |
|-> 2. 0x1438bf5d0 (0x285d85980:0) [1280x320] -0.038788 0.038239 0.032745 .. | |
|-> 3. 0x1438bf640 (0x285d859c0:0) [1280] 0.097046 0.036072 0.077148 .. | |
|<- 1. 0x1438a3560 (0x285da5d40:0) [2x4096x1280] 0.205566 0.226318 0.549316 .. | |
CCV_NNC_GELU_FORWARD [261]: [1] -> [1] (0) | |
|-> 1. 0x1438a3560 (0x285da5d40:0) [2x4096x1280] 0.205566 0.226318 0.549316 .. | |
|<- 1. 0x1438a3560 (0x285da5d40:0) [2x4096x1280] 0.119507 0.133423 0.389160 .. | |
CCV_NNC_GEMM_FORWARD [262]: [3] -> [1] (1) | |
Wait: (1, 16) | |
|-> 1. 0x1438a3410 (0x285da6000:0) [2x4096x320] -0.515137 0.178833 0.246826 .. | |
|-> 2. 0x1438bf6b0 (0x285d85a00:0) [1280x320] -0.009453 -0.016190 0.016663 .. | |
|-> 3. 0x1438bf720 (0x285d85a40:0) [1280] -0.011093 -0.059692 -0.029694 .. | |
|<- 1. 0x1438a35d0 (0x285da5d80:0) [2x4096x1280] -0.123535 0.455322 -0.136108 .. | |
Emit: (1, 17) | |
CCV_NNC_MUL_FORWARD [263]: [2] -> [1] (0) | |
Wait: (0, 17) | |
|-> 1. 0x1438a35d0 (0x285da5d80:0) [2x4096x1280] -0.123535 0.455322 -0.136108 .. | |
|-> 2. 0x1438a3560 (0x285da5d40:0) [2x4096x1280] 0.119507 0.133423 0.389160 .. | |
|<- 1. 0x1438a35d0 (0x285da5d80:0) [2x4096x1280] -0.014763 0.060760 -0.052979 .. | |
CCV_NNC_GEMM_FORWARD [264]: [3] -> [1] (0) | |
|-> 1. 0x1438a35d0 (0x285da5d80:0) [2x4096x1280] -0.014763 0.060760 -0.052979 .. | |
|-> 2. 0x1438bf790 (0x285d85a80:0) [320x1280] 0.064453 0.011925 -0.068970 .. | |
|-> 3. 0x1438bf800 (0x285d85ac0:0) [320] -0.027100 -0.310547 -0.016296 .. | |
|<- 1. 0x1438a3640 (0x285da56c0:0) [2x4096x320] -0.001959 -0.343994 -0.374268 .. | |
CCV_NNC_ADD_FORWARD [265]: [2] -> [1] (0) | |
|-> 1. 0x1438a3640 (0x285da56c0:0) [2x4096x320] -0.001959 -0.343994 -0.374268 .. | |
|-> 2. 0x1438a33a0 (0x285da5ac0:0) [2x4096x320] -0.519043 0.660156 0.280273 .. | |
|<- 1. 0x1438a3640 (0x285da56c0:0) [2x4096x320] -0.520996 0.316162 -0.093994 .. | |
CCV_NNC_CONVOLUTION_FORWARD [266]: [3] -> [1] (0) | |
|-> 1. 0x1438d8e40 (0x285da56c0:0) [2x64x64x320] -0.520996 0.316162 -0.093994 .. | |
|-> 2. 0x1438bf870 (0x285d85b00:0) [320x320x1x1] -0.055328 .. | |
|-> 3. 0x1438bf8e0 (0x285d85b40:0) [320] 0.022568 0.040405 -0.043579 .. | |
|<- 1. 0x1438a36b0 (0x285da5ac0:0) [2x64x64x320] 0.085571 0.700684 0.460449 .. | |
CCV_NNC_ADD_FORWARD [267]: [2] -> [1] (0) | |
|-> 1. 0x1438a36b0 (0x285da5ac0:0) [2x64x64x320] 0.085571 0.700684 0.460449 .. | |
|-> 2. 0x1438a1ff0 (0x285da5840:0) [2x64x64x320] -0.664551 -1.599609 0.645996 .. | |
|<- 1. 0x143905990 (0x285de0a40:0) [2x64x64x320] -0.579102 -0.898926 1.106445 .. | |
CCV_NNC_CONVOLUTION_FORWARD [268]: [3] -> [1] (0) | |
|-> 1. 0x143905990 (0x285de0a40:0) [2x64x64x320] -0.579102 -0.898926 1.106445 .. | |
|-> 2. 0x1438bf950 (0x285d85b80:0) [320x320x3x3] 0.000292 -0.000571 -0.037109 .. | |
|-> 3. 0x1438bf9c0 (0x285d85bc0:0) [320] 0.000891 -0.006954 -0.006714 .. | |
|<- 1. 0x1439018a0 (0x285df0000:0) [2x32x32x320] 0.989258 0.309814 0.657715 .. | |
Emit: (0, 19) | |
CCV_NNC_GROUP_NORM_FORWARD [269]: [3] -> [3] (0) | |
|-> 1. 0x1439018a0 (0x285df0000:0) [2x32x32x320] 0.989258 0.309814 0.657715 .. | |
|-> 2. 0x1438bfa30 (0x285d85c00:0) [1x1x1x320] 0.254639 0.270996 0.242065 .. | |
|-> 3. 0x1438bfaa0 (0x285d85c40:0) [1x1x1x320] 0.009743 0.018799 0.027435 .. | |
|<- 1. 0x1438a3720 (0x285da60c0:0) [2x32x32x320] 0.219238 0.100952 0.165161 .. | |
|<- 2. 0x1438a3790 (0x285da6100:0) [2x1x1x32] -0.086548 0.030014 0.079834 .. | |
|<- 3. 0x1438a3800 (0x285da6140:0) [2x1x1x32] 0.764648 1.391602 1.579102 .. | |
CCV_NNC_SWISH_FORWARD [270]: [1] -> [1] (0) | |
|-> 1. 0x1438a3720 (0x285da60c0:0) [2x32x32x320] 0.219238 0.100952 0.165161 .. | |
|<- 1. 0x1438a3720 (0x285da60c0:0) [2x32x32x320] 0.121582 0.053009 0.089355 .. | |
CCV_NNC_CONVOLUTION_FORWARD [271]: [3] -> [1] (0) | |
|-> 1. 0x1438a3720 (0x285da60c0:0) [2x32x32x320] 0.121582 0.053009 0.089355 .. | |
|-> 2. 0x1438bfbf0 (0x285d85d00:0) [640x320x3x3] -0.003166 -0.036407 -0.039703 .. | |
|-> 3. 0x1438bfc60 (0x285d85d40:0) [640] 0.025604 0.001693 0.020493 .. | |
|<- 1. 0x1438a38e0 (0x285da61c0:0) [2x32x32x640] -0.563965 -0.265381 0.013863 .. | |
CCV_NNC_ADD_FORWARD [272]: [2] -> [1] (0) | |
Wait: (0, 18) | |
|-> 1. 0x1438a38e0 (0x285da61c0:0) [2x32x32x640] -0.563965 -0.265381 0.013863 .. | |
|-> 2. 0x1438d8eb0 (0x285da6180:0) [2x1x1x640] 0.351318 -0.119873 0.318848 .. | |
|<- 1. 0x1438a38e0 (0x285da61c0:0) [2x32x32x640] -0.212646 -0.385254 0.332764 .. | |
CCV_NNC_GROUP_NORM_FORWARD [273]: [3] -> [3] (0) | |
|-> 1. 0x1438a38e0 (0x285da61c0:0) [2x32x32x640] -0.212646 -0.385254 0.332764 .. | |
|-> 2. 0x1438bfcd0 (0x285d85d80:0) [1x1x1x640] 0.268799 0.246338 0.254639 .. | |
|-> 3. 0x1438bfd40 (0x285d85dc0:0) [1x1x1x640] -0.096436 -0.092163 -0.112000 .. | |
|<- 1. 0x1438a3950 (0x285da6200:0) [2x32x32x640] -0.117004 -0.155640 0.014198 .. | |
|<- 2. 0x1438a39c0 (0x285da6240:0) [2x1x1x32] -0.139771 0.230103 0.045135 .. | |
|<- 3. 0x1438a3a30 (0x285da6280:0) [2x1x1x32] 1.048828 2.091797 1.273438 .. | |
CCV_NNC_SWISH_FORWARD [274]: [1] -> [1] (0) | |
|-> 1. 0x1438a3950 (0x285da6200:0) [2x32x32x640] -0.117004 -0.155640 0.014198 .. | |
|<- 1. 0x1438a3950 (0x285da6200:0) [2x32x32x640] -0.055084 -0.071777 0.007149 .. | |
CCV_NNC_CONVOLUTION_FORWARD [275]: [3] -> [1] (0) | |
|-> 1. 0x1438a3950 (0x285da6200:0) [2x32x32x640] -0.055084 -0.071777 0.007149 .. | |
|-> 2. 0x1438bfdb0 (0x285d85e00:0) [640x640x3x3] -0.040833 -0.005260 0.009308 .. | |
|-> 3. 0x1438bfe20 (0x285d85e40:0) [640] 0.005589 0.024704 0.081360 .. | |
|<- 1. 0x1438a3aa0 (0x285da61c0:0) [2x32x32x640] -0.117065 0.945312 0.622070 .. | |
CCV_NNC_CONVOLUTION_FORWARD [276]: [3] -> [1] (1) | |
Wait: (1, 19) | |
|-> 1. 0x1439018a0 (0x285df0000:0) [2x32x32x320] 0.989258 0.309814 0.657715 .. | |
|-> 2. 0x1438bfe90 (0x285d85e80:0) [640x320x1x1] 0.000690 .. | |
|-> 3. 0x1438bff00 (0x285d85ec0:0) [640] 0.021500 0.020828 0.086731 .. | |
|<- 1. 0x1438a3b10 (0x285da62c0:0) [2x32x32x640] -1.510742 -0.214111 -0.177734 .. | |
Emit: (1, 20) | |
CCV_NNC_ADD_FORWARD [277]: [2] -> [1] (0) | |
Wait: (0, 20) | |
|-> 1. 0x1438a3b10 (0x285da62c0:0) [2x32x32x640] -1.510742 -0.214111 -0.177734 .. | |
|-> 2. 0x1438a3aa0 (0x285da61c0:0) [2x32x32x640] -0.117065 0.945312 0.622070 .. | |
|<- 1. 0x1438a3b10 (0x285da62c0:0) [2x32x32x640] -1.627930 0.731445 0.444336 .. | |
CCV_NNC_GROUP_NORM_FORWARD [278]: [3] -> [3] (0) | |
|-> 1. 0x1438a3b10 (0x285da62c0:0) [2x32x32x640] -1.627930 0.731445 0.444336 .. | |
|-> 2. 0x1438bff70 (0x285d85f00:0) [1x1x1x640] 0.250977 0.392822 0.360107 .. | |
|-> 3. 0x1438bffe0 (0x285d85f40:0) [1x1x1x640] -0.014748 -0.003046 0.059326 .. | |
|<- 1. 0x1438a3b80 (0x285da6200:0) [2x32x32x640] -0.317383 0.351807 0.292236 .. | |
|<- 2. 0x1438a3bf0 (0x285da6100:0) [2x1x1x32] -0.279297 0.080261 -0.018372 .. | |
|<- 3. 0x1438a3c60 (0x285da6140:0) [2x1x1x32] 0.894043 1.658203 1.358398 .. | |
CCV_NNC_CONVOLUTION_FORWARD [279]: [3] -> [1] (0) | |
|-> 1. 0x1438a3b80 (0x285da6200:0) [2x32x32x640] -0.317383 0.351807 0.292236 .. | |
|-> 2. 0x1438c0050 (0x285d85f80:0) [640x640x1x1] 0.002949 .. | |
|-> 3. 0x1438c00c0 (0x285d85fc0:0) [640] 0.040070 -0.046509 -0.025711 .. | |
|<- 1. 0x1438a3cd0 (0x285da61c0:0) [2x32x32x640] 0.011711 0.003101 0.220581 .. | |
CCV_NNC_LAYER_NORM_FORWARD [280]: [3] -> [3] (0) | |
|-> 1. 0x1438d8f20 (0x285da61c0:0) [2x1024x640] 0.011711 0.003101 0.220581 .. | |
|-> 2. 0x1438c0130 (0x285d86000:0) [1x1x640] 0.505859 0.574707 0.518555 .. | |
|-> 3. 0x1438c01a0 (0x285d86040:0) [1x1x640] -0.050354 0.034210 -0.035522 .. | |
|<- 1. 0x1438a3d40 (0x285da6300:0) [2x1024x640] -0.038330 0.039764 0.153809 .. | |
|<- 2. 0x1438a3db0 (0x285da6340:0) [2x1024x1] -0.002829 .. | |
|<- 3. 0x1438a3e20 (0x285da6380:0) [2x1024x1] 1.633789 .. | |
Emit: (0, 21) | |
CCV_NNC_GEMM_FORWARD [281]: [2] -> [1] (0) | |
|-> 1. 0x1438a3d40 (0x285da6300:0) [2x1024x640] -0.038330 0.039764 0.153809 .. | |
|-> 2. 0x1438c0210 (0x285d86080:0) [640x640] 0.021545 0.046692 -0.021286 .. | |
|<- 1. 0x1438a3e90 (0x285da63c0:0) [2x1024x640] -0.520996 -1.092773 -0.407471 .. | |
CCV_NNC_SCALAR_MUL_FORWARD [282]: [1] -> [1] (0) | |
|-> 1. 0x1438a3e90 (0x285da63c0:0) [2x1024x640] -0.520996 -1.092773 -0.407471 .. | |
|<- 1. 0x1438a3e90 (0x285da63c0:0) [2x1024x640] -0.058258 -0.122192 -0.045563 .. | |
CCV_NNC_TRANSPOSE_FORWARD [283]: [1] -> [1] (0) | |
|-> 1. 0x1438d9000 (0x285da63c0:0) [2x1024x8x80] -0.058258 -0.122192 -0.045563 .. | |
|<- 1. 0x1438a3fe0 (0x285da6480:0) [2x8x1024x80] -0.058258 -0.122192 -0.045563 .. | |
CCV_NNC_GEMM_FORWARD [284]: [2] -> [1] (1) | |
Wait: (1, 21) | |
|-> 1. 0x1438a3d40 (0x285da6300:0) [2x1024x640] -0.038330 0.039764 0.153809 .. | |
|-> 2. 0x1438c0280 (0x285d860c0:0) [640x640] 0.084473 -0.108582 0.039673 .. | |
|<- 1. 0x1438a3f00 (0x285da6400:0) [2x1024x640] -0.410889 -0.769531 -0.632812 .. | |
CCV_NNC_TRANSPOSE_FORWARD [285]: [1] -> [1] (1) | |
|-> 1. 0x1438d8f90 (0x285da6400:0) [2x1024x8x80] -0.410889 -0.769531 -0.632812 .. | |
|<- 1. 0x1438a3f70 (0x285da6440:0) [2x8x1024x80] -0.410889 -0.769531 -0.632812 .. | |
Emit: (1, 22) | |
CCV_NNC_GEMM_FORWARD [286]: [2] -> [1] (2) | |
Wait: (2, 21) | |
|-> 1. 0x1438a3d40 (0x285da6300:0) [2x1024x640] -0.038330 0.039764 0.153809 .. | |
|-> 2. 0x1438c02f0 (0x285d86100:0) [640x640] -0.016006 0.012390 -0.068909 .. | |
|<- 1. 0x1438a4050 (0x285da64c0:0) [2x1024x640] -0.335938 0.587891 0.184082 .. | |
CCV_NNC_TRANSPOSE_FORWARD [287]: [1] -> [1] (2) | |
|-> 1. 0x1438d9150 (0x285da64c0:0) [2x1024x8x80] -0.335938 0.587891 0.184082 .. | |
|<- 1. 0x1438a4130 (0x285da6200:0) [2x8x1024x80] -0.335938 0.587891 0.184082 .. | |
Emit: (2, 23) | |
CCV_NNC_GEMM_FORWARD [288]: [2] -> [1] (0) | |
Wait: (0, 22) | |
|-> 1. 0x1438d90e0 (0x285da6480:0) [1x1024x80] -0.058258 -0.122192 -0.045563 .. | |
|-> 2. 0x1438d9070 (0x285da6440:0) [1x1024x80] -0.410889 -0.769531 -0.632812 .. | |
|<- 1. 0x1438a40c0 (0x285da6500:0) [1x1024x1024] 5.570312 5.574219 5.335938 .. | |
CCV_NNC_SOFTMAX_FORWARD [289]: [1] -> [1] (0) | |
|-> 1. 0x1438d91c0 (0x285da6500:0) [1024x1024] 5.570312 5.574219 5.335938 .. | |
|<- 1. 0x1438d91c0 (0x285da6500:0) [1024x1024] 0.017990 0.018066 0.014236 .. | |
CCV_NNC_GEMM_FORWARD [290]: [2] -> [1] (0) | |
Wait: (0, 23) | |
|-> 1. 0x1438d92a0 (0x285da6500:0) [1x1024x1024] 0.017990 0.018066 0.014236 .. | |
|-> 2. 0x1438d9230 (0x285da6200:0) [1x1024x80] -0.335938 0.587891 0.184082 .. | |
|<- 1. 0x1438dbf20 (0x285da6300:0) [1x1024x80] -0.361084 0.128540 -0.017471 .. | |
CCV_NNC_GEMM_FORWARD [291]: [2] -> [1] (0) | |
|-> 1. 0x1438d93c0 (0x285da6480:0) [1x1024x80] 0.183472 -0.044678 -0.124023 .. | |
|-> 2. 0x1438d9310 (0x285da6440:0) [1x1024x80] 1.311523 -1.477539 -0.934082 .. | |
|<- 1. 0x1438a41a0 (0x285da6500:0) [1x1024x1024] 8.023438 2.181641 4.316406 .. | |
CCV_NNC_SOFTMAX_FORWARD [292]: [1] -> [1] (0) | |
|-> 1. 0x1438d9470 (0x285da6500:0) [1024x1024] 8.023438 2.181641 4.316406 .. | |
|<- 1. 0x1438d9470 (0x285da6500:0) [1024x1024] 0.016083 0.000047 0.000395 .. | |
CCV_NNC_GEMM_FORWARD [293]: [2] -> [1] (0) | |
|-> 1. 0x1438d9590 (0x285da6500:0) [1x1024x1024] 0.016083 0.000047 0.000395 .. | |
|-> 2. 0x1438d94e0 (0x285da6200:0) [1x1024x80] -0.179077 0.330566 -0.060211 .. | |
|<- 1. 0x1438dbf90 (0x285da6300:0) [1x1024x80] 0.000919 0.247803 -0.168701 .. | |
CCV_NNC_GEMM_FORWARD [294]: [2] -> [1] (0) | |
|-> 1. 0x1438d96b0 (0x285da6480:0) [1x1024x80] -0.057922 -0.082520 -0.039917 .. | |
|-> 2. 0x1438d9600 (0x285da6440:0) [1x1024x80] -1.572266 -1.166992 0.088196 .. | |
|<- 1. 0x1438a4210 (0x285da6500:0) [1x1024x1024] 5.429688 3.023438 3.111328 .. | |
CCV_NNC_SOFTMAX_FORWARD [295]: [1] -> [1] (0) | |
|-> 1. 0x1438d9760 (0x285da6500:0) [1024x1024] 5.429688 3.023438 3.111328 .. | |
|<- 1. 0x1438d9760 (0x285da6500:0) [1024x1024] 0.052948 0.004772 0.005211 .. | |
CCV_NNC_GEMM_FORWARD [296]: [2] -> [1] (0) | |
|-> 1. 0x1438d9880 (0x285da6500:0) [1x1024x1024] 0.052948 0.004772 0.005211 .. | |
|-> 2. 0x1438d97d0 (0x285da6200:0) [1x1024x80] -0.742676 -0.222290 -0.208740 .. | |
|<- 1. 0x1438dc040 (0x285da6300:0) [1x1024x80] -0.292725 -0.001611 0.300781 .. | |
CCV_NNC_GEMM_FORWARD [297]: [2] -> [1] (0) | |
|-> 1. 0x1438d99a0 (0x285da6480:0) [1x1024x80] 0.012566 -0.013527 -0.073425 .. | |
|-> 2. 0x1438d98f0 (0x285da6440:0) [1x1024x80] -2.072266 -0.619141 -1.301758 .. | |
|<- 1. 0x1438a4280 (0x285da6500:0) [1x1024x1024] 8.476562 8.156250 9.359375 .. | |
CCV_NNC_SOFTMAX_FORWARD [298]: [1] -> [1] (0) | |
|-> 1. 0x1438d9a50 (0x285da6500:0) [1024x1024] 8.476562 8.156250 9.359375 .. | |
|<- 1. 0x1438d9a50 (0x285da6500:0) [1024x1024] 0.003235 0.002348 0.007820 .. | |
CCV_NNC_GEMM_FORWARD [299]: [2] -> [1] (0) | |
|-> 1. 0x1438d9b70 (0x285da6500:0) [1x1024x1024] 0.003235 0.002348 0.007820 .. | |
|-> 2. 0x1438d9ac0 (0x285da6200:0) [1x1024x80] 0.027679 0.418701 -0.992676 .. | |
|<- 1. 0x1438dc0f0 (0x285da6300:0) [1x1024x80] -0.282227 0.398438 -0.941895 .. | |
CCV_NNC_GEMM_FORWARD [300]: [2] -> [1] (0) | |
|-> 1. 0x1438d9c90 (0x285da6480:0) [1x1024x80] -0.044586 -0.031982 -0.024704 .. | |
|-> 2. 0x1438d9be0 (0x285da6440:0) [1x1024x80] 1.074219 0.126831 1.488281 .. | |
|<- 1. 0x1438a42f0 (0x285da6500:0) [1x1024x1024] 0.976562 1.429688 1.472656 .. | |
CCV_NNC_SOFTMAX_FORWARD [301]: [1] -> [1] (0) | |
|-> 1. 0x1438d9d40 (0x285da6500:0) [1024x1024] 0.976562 1.429688 1.472656 .. | |
|<- 1. 0x1438d9d40 (0x285da6500:0) [1024x1024] 0.001372 0.002159 0.002253 .. | |
CCV_NNC_GEMM_FORWARD [302]: [2] -> [1] (0) | |
|-> 1. 0x1438d9e60 (0x285da6500:0) [1x1024x1024] 0.001372 0.002159 0.002253 .. | |
|-> 2. 0x1438d9db0 (0x285da6200:0) [1x1024x80] 0.544922 0.029510 0.598633 .. | |
|<- 1. 0x1438dc1a0 (0x285da6300:0) [1x1024x80] 0.154419 0.206909 0.036774 .. | |
CCV_NNC_GEMM_FORWARD [303]: [2] -> [1] (0) | |
|-> 1. 0x1438d9f80 (0x285da6480:0) [1x1024x80] 0.044128 0.020248 0.016449 .. | |
|-> 2. 0x1438d9ed0 (0x285da6440:0) [1x1024x80] -0.579102 -0.297852 -0.833984 .. | |
|<- 1. 0x1438a4360 (0x285da6500:0) [1x1024x1024] 0.775391 -0.621094 -0.245117 .. | |
CCV_NNC_SOFTMAX_FORWARD [304]: [1] -> [1] (0) | |
|-> 1. 0x1438da030 (0x285da6500:0) [1024x1024] 0.775391 -0.621094 -0.245117 .. | |
|<- 1. 0x1438da030 (0x285da6500:0) [1024x1024] 0.003210 0.000794 0.001157 .. | |
CCV_NNC_GEMM_FORWARD [305]: [2] -> [1] (0) | |
|-> 1. 0x1438da150 (0x285da6500:0) [1x1024x1024] 0.003210 0.000794 0.001157 .. | |
|-> 2. 0x1438da0a0 (0x285da6200:0) [1x1024x80] -0.126099 0.404541 -0.460449 .. | |
|<- 1. 0x1438dc250 (0x285da6300:0) [1x1024x80] -0.294922 0.374512 0.024796 .. | |
CCV_NNC_GEMM_FORWARD [306]: [2] -> [1] (0) | |
|-> 1. 0x1438da270 (0x285da6480:0) [1x1024x80] 0.011032 -0.000726 -0.145264 .. | |
|-> 2. 0x1438da1c0 (0x285da6440:0) [1x1024x80] -1.261719 1.200195 -1.605469 .. | |
|<- 1. 0x1438a43d0 (0x285da6500:0) [1x1024x1024] 5.765625 3.843750 3.955078 .. | |
CCV_NNC_SOFTMAX_FORWARD [307]: [1] -> [1] (0) | |
|-> 1. 0x1438da320 (0x285da6500:0) [1024x1024] 5.765625 3.843750 3.955078 .. | |
|<- 1. 0x1438da320 (0x285da6500:0) [1024x1024] 0.034363 0.005028 0.005619 .. | |
CCV_NNC_GEMM_FORWARD [308]: [2] -> [1] (0) | |
|-> 1. 0x1438da440 (0x285da6500:0) [1x1024x1024] 0.034363 0.005028 0.005619 .. | |
|-> 2. 0x1438da390 (0x285da6200:0) [1x1024x80] -0.669922 -0.351074 -0.237671 .. | |
|<- 1. 0x1438dc300 (0x285da6300:0) [1x1024x80] -0.017807 -0.226807 -0.214600 .. | |
CCV_NNC_GEMM_FORWARD [309]: [2] -> [1] (0) | |
|-> 1. 0x1438da560 (0x285da6480:0) [1x1024x80] 0.061798 -0.091064 0.092712 .. | |
|-> 2. 0x1438da4b0 (0x285da6440:0) [1x1024x80] -1.122070 0.973633 2.224609 .. | |
|<- 1. 0x1438a4440 (0x285da6500:0) [1x1024x1024] 6.023438 4.640625 4.320312 .. | |
CCV_NNC_SOFTMAX_FORWARD [310]: [1] -> [1] (0) | |
|-> 1. 0x1438da610 (0x285da6500:0) [1024x1024] 6.023438 4.640625 4.320312 .. | |
|<- 1. 0x1438da610 (0x285da6500:0) [1024x1024] 0.064880 0.016281 0.011818 .. | |
CCV_NNC_GEMM_FORWARD [311]: [2] -> [1] (0) | |
|-> 1. 0x1438da730 (0x285da6500:0) [1x1024x1024] 0.064880 0.016281 0.011818 .. | |
|-> 2. 0x1438da680 (0x285da6200:0) [1x1024x80] -0.178711 1.040039 -0.553711 .. | |
|<- 1. 0x1438dc3b0 (0x285da6300:0) [1x1024x80] -0.082153 0.366699 -0.263428 .. | |
CCV_NNC_GEMM_FORWARD [312]: [2] -> [1] (0) | |
|-> 1. 0x1438da850 (0x285da6480:0) [1x1024x80] -0.038757 -0.099304 -0.036530 .. | |
|-> 2. 0x1438da7a0 (0x285da6440:0) [1x1024x80] -0.388428 -1.009766 -0.566895 .. | |
|<- 1. 0x1438a44b0 (0x285da6500:0) [1x1024x1024] 5.679688 5.593750 5.460938 .. | |
CCV_NNC_SOFTMAX_FORWARD [313]: [1] -> [1] (0) | |
|-> 1. 0x1438da900 (0x285da6500:0) [1024x1024] 5.679688 5.593750 5.460938 .. | |
|<- 1. 0x1438da900 (0x285da6500:0) [1024x1024] 0.021042 0.019318 0.016907 .. | |
CCV_NNC_GEMM_FORWARD [314]: [2] -> [1] (0) | |
|-> 1. 0x1438daa20 (0x285da6500:0) [1x1024x1024] 0.021042 0.019318 0.016907 .. | |
|-> 2. 0x1438da970 (0x285da6200:0) [1x1024x80] -0.329834 0.572266 0.132324 .. | |
|<- 1. 0x1438dc460 (0x285da6300:0) [1x1024x80] -0.384521 0.130493 -0.053589 .. | |
CCV_NNC_GEMM_FORWARD [315]: [2] -> [1] (0) | |
|-> 1. 0x1438dab40 (0x285da6480:0) [1x1024x80] 0.178711 -0.053009 -0.130005 .. | |
|-> 2. 0x1438daa90 (0x285da6440:0) [1x1024x80] 1.332031 -1.637695 -0.878906 .. | |
|<- 1. 0x1438a4520 (0x285da6500:0) [1x1024x1024] 7.808594 2.779297 4.605469 .. | |
CCV_NNC_SOFTMAX_FORWARD [316]: [1] -> [1] (0) | |
|-> 1. 0x1438dabf0 (0x285da6500:0) [1024x1024] 7.808594 2.779297 4.605469 .. | |
|<- 1. 0x1438dabf0 (0x285da6500:0) [1024x1024] 0.013405 0.000088 0.000545 .. | |
CCV_NNC_GEMM_FORWARD [317]: [2] -> [1] (0) | |
|-> 1. 0x1438dad10 (0x285da6500:0) [1x1024x1024] 0.013405 0.000088 0.000545 .. | |
|-> 2. 0x1438dac60 (0x285da6200:0) [1x1024x80] -0.192017 0.287109 -0.053925 .. | |
|<- 1. 0x1438dc510 (0x285da6300:0) [1x1024x80] 0.139404 0.192505 -0.123840 .. | |
CCV_NNC_GEMM_FORWARD [318]: [2] -> [1] (0) | |
|-> 1. 0x1438dae30 (0x285da6480:0) [1x1024x80] -0.055725 -0.087036 -0.044281 .. | |
|-> 2. 0x1438dad80 (0x285da6440:0) [1x1024x80] -1.325195 -1.289062 0.051819 .. | |
|<- 1. 0x1438a4590 (0x285da6500:0) [1x1024x1024] 5.421875 3.320312 3.195312 .. | |
CCV_NNC_SOFTMAX_FORWARD [319]: [1] -> [1] (0) | |
|-> 1. 0x1438daee0 (0x285da6500:0) [1024x1024] 5.421875 3.320312 3.195312 .. | |
|<- 1. 0x1438daee0 (0x285da6500:0) [1024x1024] 0.057922 0.007080 0.006248 .. | |
CCV_NNC_GEMM_FORWARD [320]: [2] -> [1] (0) | |
|-> 1. 0x1438db000 (0x285da6500:0) [1x1024x1024] 0.057922 0.007080 0.006248 .. | |
|-> 2. 0x1438daf50 (0x285da6200:0) [1x1024x80] -0.742188 -0.330811 -0.071472 .. | |
|<- 1. 0x1438dc5c0 (0x285da6300:0) [1x1024x80] -0.361084 -0.045593 0.334473 .. | |
CCV_NNC_GEMM_FORWARD [321]: [2] -> [1] (0) | |
|-> 1. 0x1438db120 (0x285da6480:0) [1x1024x80] 0.014198 0.003281 -0.079468 .. | |
|-> 2. 0x1438db070 (0x285da6440:0) [1x1024x80] -2.187500 -0.302734 -1.355469 .. | |
|<- 1. 0x1438a4600 (0x285da6500:0) [1x1024x1024] 8.507812 8.203125 9.304688 .. | |
CCV_NNC_SOFTMAX_FORWARD [322]: [1] -> [1] (0) | |
|-> 1. 0x1438db1d0 (0x285da6500:0) [1024x1024] 8.507812 8.203125 9.304688 .. | |
|<- 1. 0x1438db1d0 (0x285da6500:0) [1024x1024] 0.003477 0.002563 0.007713 .. | |
CCV_NNC_GEMM_FORWARD [323]: [2] -> [1] (0) | |
|-> 1. 0x1438db2f0 (0x285da6500:0) [1x1024x1024] 0.003477 0.002563 0.007713 .. | |
|-> 2. 0x1438db240 (0x285da6200:0) [1x1024x80] 0.006760 0.414062 -0.980957 .. | |
|<- 1. 0x1438dc670 (0x285da6300:0) [1x1024x80] -0.318848 0.344482 -0.938965 .. | |
CCV_NNC_GEMM_FORWARD [324]: [2] -> [1] (0) | |
|-> 1. 0x1438db410 (0x285da6480:0) [1x1024x80] -0.034363 -0.038727 -0.018570 .. | |
|-> 2. 0x1438db360 (0x285da6440:0) [1x1024x80] 0.910156 0.247681 1.322266 .. | |
|<- 1. 0x1438a4670 (0x285da6500:0) [1x1024x1024] 1.238281 1.551758 1.779297 .. | |
CCV_NNC_SOFTMAX_FORWARD [325]: [1] -> [1] (0) | |
|-> 1. 0x1438db4c0 (0x285da6500:0) [1024x1024] 1.238281 1.551758 1.779297 .. | |
|<- 1. 0x1438db4c0 (0x285da6500:0) [1024x1024] 0.001794 0.002455 0.003080 .. | |
CCV_NNC_GEMM_FORWARD [326]: [2] -> [1] (0) | |
|-> 1. 0x1438db5e0 (0x285da6500:0) [1x1024x1024] 0.001794 0.002455 0.003080 .. | |
|-> 2. 0x1438db530 (0x285da6200:0) [1x1024x80] 0.464355 0.148926 0.725098 .. | |
|<- 1. 0x1438dc720 (0x285da6300:0) [1x1024x80] 0.254883 0.322021 0.157227 .. | |
CCV_NNC_GEMM_FORWARD [327]: [2] -> [1] (0) | |
|-> 1. 0x1438db700 (0x285da6480:0) [1x1024x80] 0.039307 0.029373 -0.006130 .. | |
|-> 2. 0x1438db650 (0x285da6440:0) [1x1024x80] -0.614258 -0.156738 -0.780273 .. | |
|<- 1. 0x1438a46e0 (0x285da6500:0) [1x1024x1024] 0.920410 -0.377930 -0.031647 .. | |
CCV_NNC_SOFTMAX_FORWARD [328]: [1] -> [1] (0) | |
|-> 1. 0x1438db7b0 (0x285da6500:0) [1024x1024] 0.920410 -0.377930 -0.031647 .. | |
|<- 1. 0x1438db7b0 (0x285da6500:0) [1024x1024] 0.002964 0.000809 0.001144 .. | |
CCV_NNC_GEMM_FORWARD [329]: [2] -> [1] (0) | |
|-> 1. 0x1438db8d0 (0x285da6500:0) [1x1024x1024] 0.002964 0.000809 0.001144 .. | |
|-> 2. 0x1438db820 (0x285da6200:0) [1x1024x80] -0.185791 0.209961 -0.484375 .. | |
|<- 1. 0x1438dc7d0 (0x285da6300:0) [1x1024x80] -0.371338 0.261719 0.041748 .. | |
CCV_NNC_GEMM_FORWARD [330]: [2] -> [1] (0) | |
|-> 1. 0x1438db9f0 (0x285da6480:0) [1x1024x80] 0.001505 -0.010872 -0.146973 .. | |
|-> 2. 0x1438db940 (0x285da6440:0) [1x1024x80] -1.353516 1.194336 -1.552734 .. | |
|<- 1. 0x1438a4750 (0x285da6500:0) [1x1024x1024] 5.667969 3.976562 4.187500 .. | |
CCV_NNC_SOFTMAX_FORWARD [331]: [1] -> [1] (0) | |
|-> 1. 0x1438dbaa0 (0x285da6500:0) [1024x1024] 5.667969 3.976562 4.187500 .. | |
|<- 1. 0x1438dbaa0 (0x285da6500:0) [1024x1024] 0.036499 0.006725 0.008308 .. | |
CCV_NNC_GEMM_FORWARD [332]: [2] -> [1] (0) | |
|-> 1. 0x1438dbbc0 (0x285da6500:0) [1x1024x1024] 0.036499 0.006725 0.008308 .. | |
|-> 2. 0x1438dbb10 (0x285da6200:0) [1x1024x80] -0.753906 -0.347900 -0.301025 .. | |
|<- 1. 0x1438dc880 (0x285da6300:0) [1x1024x80] -0.161499 -0.282471 -0.173218 .. | |
CCV_NNC_GEMM_FORWARD [333]: [2] -> [1] (0) | |
|-> 1. 0x1438dbce0 (0x285da6480:0) [1x1024x80] 0.087769 -0.096741 0.088684 .. | |
|-> 2. 0x1438dbc30 (0x285da6440:0) [1x1024x80] -1.050781 1.060547 2.183594 .. | |
|<- 1. 0x1438a47c0 (0x285da6500:0) [1x1024x1024] 6.304688 5.085938 4.675781 .. | |
CCV_NNC_SOFTMAX_FORWARD [334]: [1] -> [1] (0) | |
|-> 1. 0x1438dbd90 (0x285da6500:0) [1024x1024] 6.304688 5.085938 4.675781 .. | |
|<- 1. 0x1438dbd90 (0x285da6500:0) [1024x1024] 0.075073 0.022186 0.014725 .. | |
CCV_NNC_GEMM_FORWARD [335]: [2] -> [1] (0) | |
|-> 1. 0x1438dbeb0 (0x285da6500:0) [1x1024x1024] 0.075073 0.022186 0.014725 .. | |
|-> 2. 0x1438dbe00 (0x285da6200:0) [1x1024x80] -0.238281 1.119141 -0.505859 .. | |
|<- 1. 0x1438dc930 (0x285da6300:0) [1x1024x80] -0.135010 0.397217 -0.234375 .. | |
CCV_NNC_TRANSPOSE_FORWARD [336]: [1] -> [1] (0) | |
|-> 1. 0x1438dc9e0 (0x285da6300:0) [2x8x1024x80] -0.361084 0.128540 -0.017471 .. | |
|<- 1. 0x1438a48a0 (0x285da6200:0) [2x1024x8x80] -0.361084 0.128540 -0.017471 .. | |
CCV_NNC_GEMM_FORWARD [337]: [3] -> [1] (0) | |
|-> 1. 0x1438dca50 (0x285da6200:0) [2x1024x640] -0.361084 0.128540 -0.017471 .. | |
|-> 2. 0x1438c0360 (0x285d86140:0) [640x640] -0.028152 -0.005211 0.069153 .. | |
|-> 3. 0x1438c03d0 (0x285d86180:0) [640] 0.000637 0.002556 -0.041992 .. | |
|<- 1. 0x1438a4910 (0x285da6300:0) [2x1024x640] 0.014832 -0.139160 -0.882812 .. | |
CCV_NNC_ADD_FORWARD [338]: [2] -> [1] (0) | |
|-> 1. 0x1438a4910 (0x285da6300:0) [2x1024x640] 0.014832 -0.139160 -0.882812 .. | |
|-> 2. 0x1438d8f20 (0x285da61c0:0) [2x1024x640] 0.011711 0.003101 0.220581 .. | |
|<- 1. 0x1438a4910 (0x285da6300:0) [2x1024x640] 0.026550 -0.136108 -0.662109 .. | |
CCV_NNC_LAYER_NORM_FORWARD [339]: [3] -> [3] (0) | |
|-> 1. 0x1438a4910 (0x285da6300:0) [2x1024x640] 0.026550 -0.136108 -0.662109 .. | |
|-> 2. 0x1438c0440 (0x285d861c0:0) [1x1x640] 0.403564 0.457031 0.463867 .. | |
|-> 3. 0x1438c04b0 (0x285d86200:0) [1x1x640] 0.034668 -0.095215 -0.043091 .. | |
|<- 1. 0x1438a4980 (0x285da61c0:0) [2x1024x640] 0.045197 -0.222778 -0.630371 .. | |
|<- 2. 0x1438a49f0 (0x285da6380:0) [2x1024x1] 0.012642 .. | |
|<- 3. 0x1438a4a60 (0x285da6340:0) [2x1024x1] 1.876953 .. | |
CCV_NNC_GEMM_FORWARD [340]: [2] -> [1] (0) | |
|-> 1. 0x1438a4980 (0x285da61c0:0) [2x1024x640] 0.045197 -0.222778 -0.630371 .. | |
|-> 2. 0x1438c0520 (0x285d86240:0) [640x640] -0.068909 -0.063782 0.046234 .. | |
|<- 1. 0x1438a4ad0 (0x285da6200:0) [2x1024x640] -0.490234 -1.106445 -0.379150 .. | |
CCV_NNC_SCALAR_MUL_FORWARD [341]: [1] -> [1] (0) | |
|-> 1. 0x1438a4ad0 (0x285da6200:0) [2x1024x640] -0.490234 -1.106445 -0.379150 .. | |
|<- 1. 0x1438a4ad0 (0x285da6200:0) [2x1024x640] -0.054810 -0.123718 -0.042389 .. | |
CCV_NNC_TRANSPOSE_FORWARD [342]: [1] -> [1] (0) | |
|-> 1. 0x1438dcb30 (0x285da6200:0) [2x1024x8x80] -0.054810 -0.123718 -0.042389 .. | |
|<- 1. 0x1438a4c20 (0x285da6440:0) [2x8x1024x80] -0.054810 -0.123718 -0.042389 .. | |
CCV_NNC_GEMM_FORWARD [343]: [2] -> [1] (0) | |
Wait: (0, 24) | |
|-> 1. 0x1438a4c20 (0x285da6440:0) [2x8x1024x80] -0.054810 -0.123718 -0.042389 .. | |
|-> 2. 0x1438a4bb0 (0x285da6580:0) [2x8x133x80] 0.370605 -0.183228 -1.733398 .. | |
|<- 1. 0x1438a4c90 (0x285da65c0:0) [2x8x1024x133] 6.578125 -0.109436 -0.457764 .. | |
CCV_NNC_SOFTMAX_FORWARD [344]: [1] -> [1] (0) | |
|-> 1. 0x1438dcba0 (0x285da65c0:0) [16384x133] 6.578125 -0.109436 -0.457764 .. | |
|<- 1. 0x1438dcba0 (0x285da65c0:0) [16384x133] 0.646973 0.000806 0.000569 .. | |
CCV_NNC_GEMM_FORWARD [345]: [2] -> [1] (0) | |
Wait: (0, 25) | |
|-> 1. 0x1438dcc80 (0x285da65c0:0) [2x8x1024x133] 0.646973 0.000806 0.000569 .. | |
|-> 2. 0x1438a4d70 (0x285da6640:0) [2x8x133x80] 0.013397 0.017731 0.048828 .. | |
|<- 1. 0x1438a4de0 (0x285da6440:0) [2x8x1024x80] 0.079773 0.100769 -0.193115 .. | |
CCV_NNC_TRANSPOSE_FORWARD [346]: [1] -> [1] (0) | |
|-> 1. 0x1438dccf0 (0x285da6440:0) [2x8x1024x80] 0.079773 0.100769 -0.193115 .. | |
|<- 1. 0x1438a4e50 (0x285da61c0:0) [2x1024x8x80] 0.079773 0.100769 -0.193115 .. | |
CCV_NNC_GEMM_FORWARD [347]: [3] -> [1] (0) | |
|-> 1. 0x1438dcd60 (0x285da61c0:0) [2x1024x640] 0.079773 0.100769 -0.193115 .. | |
|-> 2. 0x1438c0670 (0x285d86300:0) [640x640] -0.001424 0.000917 -0.006500 .. | |
|-> 3. 0x1438c06e0 (0x285d86340:0) [640] -0.015472 0.013123 -0.070862 .. | |
|<- 1. 0x1438a4ec0 (0x285da6400:0) [2x1024x640] 0.012054 0.027100 -0.074219 .. | |
CCV_NNC_ADD_FORWARD [348]: [2] -> [1] (0) | |
|-> 1. 0x1438a4ec0 (0x285da6400:0) [2x1024x640] 0.012054 0.027100 -0.074219 .. | |
|-> 2. 0x1438a4910 (0x285da6300:0) [2x1024x640] 0.026550 -0.136108 -0.662109 .. | |
|<- 1. 0x1438a4ec0 (0x285da6400:0) [2x1024x640] 0.038605 -0.109009 -0.736328 .. | |
CCV_NNC_LAYER_NORM_FORWARD [349]: [3] -> [3] (0) | |
|-> 1. 0x1438a4ec0 (0x285da6400:0) [2x1024x640] 0.038605 -0.109009 -0.736328 .. | |
|-> 2. 0x1438c0750 (0x285d86380:0) [1x1x640] 0.307373 0.304199 0.304932 .. | |
|-> 3. 0x1438c07c0 (0x285d863c0:0) [1x1x640] 0.016418 -0.054840 0.052734 .. | |
|<- 1. 0x1438a4f30 (0x285da6680:0) [2x1024x640] 0.031403 -0.121338 -0.360352 .. | |
|<- 2. 0x1438a4fa0 (0x285da66c0:0) [2x1024x1] 0.011696 .. | |
|<- 3. 0x1438a5010 (0x285da6700:0) [2x1024x1] 1.811523 .. | |
Emit: (0, 26) | |
CCV_NNC_GEMM_FORWARD [350]: [3] -> [1] (0) | |
|-> 1. 0x1438a4f30 (0x285da6680:0) [2x1024x640] 0.031403 -0.121338 -0.360352 .. | |
|-> 2. 0x1438c0830 (0x285d86400:0) [2560x640] -0.052673 -0.019516 -0.017975 .. | |
|-> 3. 0x1438c08a0 (0x285d86440:0) [2560] -0.304199 0.028854 0.045166 .. | |
|<- 1. 0x1438a5080 (0x285da6740:0) [2x1024x2560] -0.736328 0.725098 -0.290527 .. | |
CCV_NNC_GELU_FORWARD [351]: [1] -> [1] (0) | |
|-> 1. 0x1438a5080 (0x285da6740:0) [2x1024x2560] -0.736328 0.725098 -0.290527 .. | |
|<- 1. 0x1438a5080 (0x285da6740:0) [2x1024x2560] -0.169922 0.555176 -0.112061 .. | |
CCV_NNC_GEMM_FORWARD [352]: [3] -> [1] (1) | |
Wait: (1, 26) | |
|-> 1. 0x1438a4f30 (0x285da6680:0) [2x1024x640] 0.031403 -0.121338 -0.360352 .. | |
|-> 2. 0x1438c0910 (0x285d86480:0) [2560x640] 0.075134 0.030365 0.000856 .. | |
|-> 3. 0x1438c0980 (0x285d864c0:0) [2560] -0.089661 0.030685 -0.067871 .. | |
|<- 1. 0x1438a50f0 (0x285da6780:0) [2x1024x2560] -0.932617 0.306396 -1.067383 .. | |
Emit: (1, 27) | |
CCV_NNC_MUL_FORWARD [353]: [2] -> [1] (0) | |
Wait: (0, 27) | |
|-> 1. 0x1438a50f0 (0x285da6780:0) [2x1024x2560] -0.932617 0.306396 -1.067383 .. | |
|-> 2. 0x1438a5080 (0x285da6740:0) [2x1024x2560] -0.169922 0.555176 -0.112061 .. | |
|<- 1. 0x1438a50f0 (0x285da6780:0) [2x1024x2560] 0.158447 0.170044 0.119629 .. | |
CCV_NNC_GEMM_FORWARD [354]: [3] -> [1] (0) | |
|-> 1. 0x1438a50f0 (0x285da6780:0) [2x1024x2560] 0.158447 0.170044 0.119629 .. | |
|-> 2. 0x1438c09f0 (0x285d86500:0) [640x2560] 0.039215 -0.043976 0.050629 .. | |
|-> 3. 0x1438c0a60 (0x285d86540:0) [640] -0.002060 0.010002 -0.000533 .. | |
|<- 1. 0x1438a5160 (0x285da6680:0) [2x1024x640] -0.767578 -0.584961 0.454346 .. | |
CCV_NNC_ADD_FORWARD [355]: [2] -> [1] (0) | |
|-> 1. 0x1438a5160 (0x285da6680:0) [2x1024x640] -0.767578 -0.584961 0.454346 .. | |
|-> 2. 0x1438a4ec0 (0x285da6400:0) [2x1024x640] 0.038605 -0.109009 -0.736328 .. | |
|<- 1. 0x1438a5160 (0x285da6680:0) [2x1024x640] -0.729004 -0.693848 -0.281982 .. | |
CCV_NNC_CONVOLUTION_FORWARD [356]: [3] -> [1] (0) | |
|-> 1. 0x1438dcdd0 (0x285da6680:0) [2x32x32x640] -0.729004 -0.693848 -0.281982 .. | |
|-> 2. 0x1438c0ad0 (0x285d86580:0) [640x640x1x1] 0.023605 .. | |
|-> 3. 0x1438c0b40 (0x285d865c0:0) [640] -0.031860 -0.006199 -0.021896 .. | |
|<- 1. 0x1438a51d0 (0x285da6480:0) [2x32x32x640] -1.019531 -0.302734 0.253906 .. | |
CCV_NNC_ADD_FORWARD [357]: [2] -> [1] (0) | |
|-> 1. 0x1438a51d0 (0x285da6480:0) [2x32x32x640] -1.019531 -0.302734 0.253906 .. | |
|-> 2. 0x1438a3b10 (0x285da62c0:0) [2x32x32x640] -1.627930 0.731445 0.444336 .. | |
|<- 1. 0x1438fd7b0 (0x285da5980:0) [2x32x32x640] -2.648438 0.428711 0.698242 .. | |
CCV_NNC_GROUP_NORM_FORWARD [358]: [3] -> [3] (0) | |
|-> 1. 0x1438fd7b0 (0x285da5980:0) [2x32x32x640] -2.648438 0.428711 0.698242 .. | |
|-> 2. 0x1438c0bb0 (0x285d86600:0) [1x1x1x640] 0.208496 0.307617 0.281494 .. | |
|-> 3. 0x1438c0c20 (0x285d86640:0) [1x1x1x640] -0.066956 -0.038818 -0.037933 .. | |
|<- 1. 0x1438a5240 (0x285da6480:0) [2x32x32x640] -0.544922 0.127075 0.183716 .. | |
|<- 2. 0x1438a52b0 (0x285da67c0:0) [2x1x1x32] -0.157104 0.148926 0.143311 .. | |
|<- 3. 0x1438a5320 (0x285da6800:0) [2x1x1x32] 0.920410 1.851562 1.354492 .. | |
CCV_NNC_SWISH_FORWARD [359]: [1] -> [1] (0) | |
|-> 1. 0x1438a5240 (0x285da6480:0) [2x32x32x640] -0.544922 0.127075 0.183716 .. | |
|<- 1. 0x1438a5240 (0x285da6480:0) [2x32x32x640] -0.199951 0.067566 0.100281 .. | |
CCV_NNC_CONVOLUTION_FORWARD [360]: [3] -> [1] (0) | |
|-> 1. 0x1438a5240 (0x285da6480:0) [2x32x32x640] -0.199951 0.067566 0.100281 .. | |
|-> 2. 0x1438c0d70 (0x285d86700:0) [640x640x3x3] -0.004822 -0.019791 -0.021057 .. | |
|-> 3. 0x1438c0de0 (0x285d86740:0) [640] 0.027176 0.012741 -0.054749 .. | |
|<- 1. 0x1438a5400 (0x285da62c0:0) [2x32x32x640] 1.653320 -0.888184 1.012695 .. | |
CCV_NNC_ADD_FORWARD [361]: [2] -> [1] (0) | |
Wait: (0, 28) | |
|-> 1. 0x1438a5400 (0x285da62c0:0) [2x32x32x640] 1.653320 -0.888184 1.012695 .. | |
|-> 2. 0x1438dce40 (0x285da6840:0) [2x1x1x640] 0.087891 -3.085938 0.536621 .. | |
|<- 1. 0x1438a5400 (0x285da62c0:0) [2x32x32x640] 1.741211 -3.974609 1.548828 .. | |
CCV_NNC_GROUP_NORM_FORWARD [362]: [3] -> [3] (0) | |
|-> 1. 0x1438a5400 (0x285da62c0:0) [2x32x32x640] 1.741211 -3.974609 1.548828 .. | |
|-> 2. 0x1438c0e50 (0x285d86780:0) [1x1x1x640] 0.551270 0.692871 0.686035 .. | |
|-> 3. 0x1438c0ec0 (0x285d867c0:0) [1x1x1x640] -0.276367 -0.065369 -0.252930 .. | |
|<- 1. 0x1438a5470 (0x285da6480:0) [2x32x32x640] 0.421875 -2.527344 0.504395 .. | |
|<- 2. 0x1438a54e0 (0x285da6880:0) [2x1x1x32] 0.239380 0.424561 0.679199 .. | |
|<- 3. 0x1438a5550 (0x285da68c0:0) [2x1x1x32] 0.843262 1.119141 1.365234 .. | |
CCV_NNC_SWISH_FORWARD [363]: [1] -> [1] (0) | |
|-> 1. 0x1438a5470 (0x285da6480:0) [2x32x32x640] 0.421875 -2.527344 0.504395 .. | |
|<- 1. 0x1438a5470 (0x285da6480:0) [2x32x32x640] 0.254883 -0.186890 0.314453 .. | |
CCV_NNC_CONVOLUTION_FORWARD [364]: [3] -> [1] (0) | |
|-> 1. 0x1438a5470 (0x285da6480:0) [2x32x32x640] 0.254883 -0.186890 0.314453 .. | |
|-> 2. 0x1438c0f30 (0x285d86800:0) [640x640x3x3] 0.033478 0.012352 -0.008667 .. | |
|-> 3. 0x1438c0fa0 (0x285d86840:0) [640] -0.000833 -0.002270 0.024445 .. | |
|<- 1. 0x1438a55c0 (0x285da6900:0) [2x32x32x640] -0.551270 -0.381836 0.529785 .. | |
CCV_NNC_ADD_FORWARD [365]: [2] -> [1] (0) | |
|-> 1. 0x1438fd7b0 (0x285da5980:0) [2x32x32x640] -2.648438 0.428711 0.698242 .. | |
|-> 2. 0x1438a55c0 (0x285da6900:0) [2x32x32x640] -0.551270 -0.381836 0.529785 .. | |
|<- 1. 0x1438a5630 (0x285da62c0:0) [2x32x32x640] -3.199219 0.046875 1.228516 .. | |
CCV_NNC_GROUP_NORM_FORWARD [366]: [3] -> [3] (0) | |
|-> 1. 0x1438a5630 (0x285da62c0:0) [2x32x32x640] -3.199219 0.046875 1.228516 .. | |
|-> 2. 0x1438c1010 (0x285d86880:0) [1x1x1x640] 0.291504 0.381348 0.403564 .. | |
|-> 3. 0x1438c1080 (0x285d868c0:0) [1x1x1x640] -0.014030 0.044952 0.045532 .. | |
|<- 1. 0x1438a56a0 (0x285da6900:0) [2x32x32x640] -0.937988 0.169678 0.691406 .. | |
|<- 2. 0x1438a5710 (0x285da5700:0) [2x1x1x32] -0.256836 0.051575 0.174438 .. | |
|<- 3. 0x1438a5780 (0x285da5740:0) [2x1x1x32] 1.077148 1.314453 1.291016 .. | |
CCV_NNC_CONVOLUTION_FORWARD [367]: [3] -> [1] (0) | |
|-> 1. 0x1438a56a0 (0x285da6900:0) [2x32x32x640] -0.937988 0.169678 0.691406 .. | |
|-> 2. 0x1438c10f0 (0x285d86900:0) [640x640x1x1] -0.072144 .. | |
|-> 3. 0x1438c1160 (0x285d86940:0) [640] 0.026093 -0.050903 -0.041107 .. | |
|<- 1. 0x1438a57f0 (0x285da6480:0) [2x32x32x640] -0.096313 0.765625 0.216919 .. | |
CCV_NNC_LAYER_NORM_FORWARD [368]: [3] -> [3] (0) | |
|-> 1. 0x1438dceb0 (0x285da6480:0) [2x1024x640] -0.096313 0.765625 0.216919 .. | |
|-> 2. 0x1438c11d0 (0x285d86980:0) [1x1x640] 0.543457 0.561523 0.567383 .. | |
|-> 3. 0x1438c1240 (0x285d869c0:0) [1x1x640] 0.066528 0.015854 0.001546 .. | |
|<- 1. 0x1438a5860 (0x285da6900:0) [2x1024x640] 0.049316 0.431396 0.142700 .. | |
|<- 2. 0x1438a58d0 (0x285da6940:0) [2x1024x1] -0.060944 .. | |
|<- 3. 0x1438a5940 (0x285da6980:0) [2x1024x1] 0.895508 .. | |
Emit: (0, 29) | |
CCV_NNC_GEMM_FORWARD [369]: [2] -> [1] (0) | |
|-> 1. 0x1438a5860 (0x285da6900:0) [2x1024x640] 0.049316 0.431396 0.142700 .. | |
|-> 2. 0x1438c12b0 (0x285d86a00:0) [640x640] 0.032898 0.015129 0.023300 .. | |
|<- 1. 0x1438a59b0 (0x285da69c0:0) [2x1024x640] 0.834961 -1.231445 1.248047 .. | |
CCV_NNC_SCALAR_MUL_FORWARD [370]: [1] -> [1] (0) | |
|-> 1. 0x1438a59b0 (0x285da69c0:0) [2x1024x640] 0.834961 -1.231445 1.248047 .. | |
|<- 1. 0x1438a59b0 (0x285da69c0:0) [2x1024x640] 0.093384 -0.137695 0.139526 .. | |
CCV_NNC_TRANSPOSE_FORWARD [371]: [1] -> [1] (0) | |
|-> 1. 0x1438dcf90 (0x285da69c0:0) [2x1024x8x80] 0.093384 -0.137695 0.139526 .. | |
|<- 1. 0x1438a5b00 (0x285da61c0:0) [2x8x1024x80] 0.093384 -0.137695 0.139526 .. | |
CCV_NNC_GEMM_FORWARD [372]: [2] -> [1] (1) | |
Wait: (1, 29) | |
|-> 1. 0x1438a5860 (0x285da6900:0) [2x1024x640] 0.049316 0.431396 0.142700 .. | |
|-> 2. 0x1438c1320 (0x285d86a40:0) [640x640] -0.020447 0.138306 -0.020874 .. | |
|<- 1. 0x1438a5a20 (0x285da63c0:0) [2x1024x640] 0.753906 -2.132812 -1.050781 .. | |
CCV_NNC_TRANSPOSE_FORWARD [373]: [1] -> [1] (1) | |
|-> 1. 0x1438dcf20 (0x285da63c0:0) [2x1024x8x80] 0.753906 -2.132812 -1.050781 .. | |
|<- 1. 0x1438a5a90 (0x285da6a00:0) [2x8x1024x80] 0.753906 -2.132812 -1.050781 .. | |
Emit: (1, 30) | |
CCV_NNC_GEMM_FORWARD [374]: [2] -> [1] (2) | |
Wait: (2, 29) | |
|-> 1. 0x1438a5860 (0x285da6900:0) [2x1024x640] 0.049316 0.431396 0.142700 .. | |
|-> 2. 0x1438c1390 (0x285d86a80:0) [640x640] 0.008591 -0.076965 0.013618 .. | |
|<- 1. 0x1438a5b70 (0x285da64c0:0) [2x1024x640] 0.223389 0.438232 -1.061523 .. | |
CCV_NNC_TRANSPOSE_FORWARD [375]: [1] -> [1] (2) | |
|-> 1. 0x1438dd0e0 (0x285da64c0:0) [2x1024x8x80] 0.223389 0.438232 -1.061523 .. | |
|<- 1. 0x1438a5c50 (0x285da6a80:0) [2x8x1024x80] 0.223389 0.438232 -1.061523 .. | |
Emit: (2, 31) | |
CCV_NNC_GEMM_FORWARD [376]: [2] -> [1] (0) | |
Wait: (0, 30) | |
|-> 1. 0x1438dd070 (0x285da61c0:0) [1x1024x80] 0.093384 -0.137695 0.139526 .. | |
|-> 2. 0x1438dd000 (0x285da6a00:0) [1x1024x80] 0.753906 -2.132812 -1.050781 .. | |
|<- 1. 0x1438a5be0 (0x285da6a40:0) [1x1024x1024] 3.708984 2.576172 2.929688 .. | |
CCV_NNC_SOFTMAX_FORWARD [377]: [1] -> [1] (0) | |
|-> 1. 0x1438dd150 (0x285da6a40:0) [1024x1024] 3.708984 2.576172 2.929688 .. | |
|<- 1. 0x1438dd150 (0x285da6a40:0) [1024x1024] 0.005600 0.001803 0.002567 .. | |
CCV_NNC_GEMM_FORWARD [378]: [2] -> [1] (0) | |
Wait: (0, 31) | |
|-> 1. 0x1438dd230 (0x285da6a40:0) [1x1024x1024] 0.005600 0.001803 0.002567 .. | |
|-> 2. 0x1438dd1c0 (0x285da6a80:0) [1x1024x80] 0.223389 0.438232 -1.061523 .. | |
|<- 1. 0x1438dfeb0 (0x285da6900:0) [1x1024x80] 0.265381 0.010628 -0.298096 .. | |
CCV_NNC_GEMM_FORWARD [379]: [2] -> [1] (0) | |
|-> 1. 0x1438dd350 (0x285da61c0:0) [1x1024x80] -0.102234 0.056061 -0.065491 .. | |
|-> 2. 0x1438dd2a0 (0x285da6a00:0) [1x1024x80] -0.977051 0.231567 -0.533691 .. | |
|<- 1. 0x1438a5cc0 (0x285da6a40:0) [1x1024x1024] 1.554688 1.155273 1.335938 .. | |
CCV_NNC_SOFTMAX_FORWARD [380]: [1] -> [1] (0) | |
|-> 1. 0x1438dd400 (0x285da6a40:0) [1024x1024] 1.554688 1.155273 1.335938 .. | |
|<- 1. 0x1438dd400 (0x285da6a40:0) [1024x1024] 0.003613 0.002422 0.002903 .. | |
CCV_NNC_GEMM_FORWARD [381]: [2] -> [1] (0) | |
|-> 1. 0x1438dd520 (0x285da6a40:0) [1x1024x1024] 0.003613 0.002422 0.002903 .. | |
|-> 2. 0x1438dd470 (0x285da6a80:0) [1x1024x80] -0.706543 0.345947 0.224121 .. | |
|<- 1. 0x1438dff20 (0x285da6900:0) [1x1024x80] -0.127441 0.074585 0.045319 .. | |
CCV_NNC_GEMM_FORWARD [382]: [2] -> [1] (0) | |
|-> 1. 0x1438dd640 (0x285da61c0:0) [1x1024x80] -0.036591 0.026779 -0.229492 .. | |
|-> 2. 0x1438dd590 (0x285da6a00:0) [1x1024x80] -2.191406 1.556641 0.182617 .. | |
|<- 1. 0x1438a5d30 (0x285da6a40:0) [1x1024x1024] 4.519531 3.941406 3.863281 .. | |
CCV_NNC_SOFTMAX_FORWARD [383]: [1] -> [1] (0) | |
|-> 1. 0x1438dd6f0 (0x285da6a40:0) [1024x1024] 4.519531 3.941406 3.863281 .. | |
|<- 1. 0x1438dd6f0 (0x285da6a40:0) [1024x1024] 0.004894 0.002745 0.002539 .. | |
CCV_NNC_GEMM_FORWARD [384]: [2] -> [1] (0) | |
|-> 1. 0x1438dd810 (0x285da6a40:0) [1x1024x1024] 0.004894 0.002745 0.002539 .. | |
|-> 2. 0x1438dd760 (0x285da6a80:0) [1x1024x80] 0.266602 0.398438 0.144409 .. | |
|<- 1. 0x1438dffd0 (0x285da6900:0) [1x1024x80] 0.065369 0.208862 0.217651 .. | |
CCV_NNC_GEMM_FORWARD [385]: [2] -> [1] (0) | |
|-> 1. 0x1438dd930 (0x285da61c0:0) [1x1024x80] 0.041473 -0.001205 -0.115967 .. | |
|-> 2. 0x1438dd880 (0x285da6a00:0) [1x1024x80] 1.298828 -0.989746 -0.521973 .. | |
|<- 1. 0x1438a5da0 (0x285da6a40:0) [1x1024x1024] 3.648438 1.824219 1.376953 .. | |
CCV_NNC_SOFTMAX_FORWARD [386]: [1] -> [1] (0) | |
|-> 1. 0x1438dd9e0 (0x285da6a40:0) [1024x1024] 3.648438 1.824219 1.376953 .. | |
|<- 1. 0x1438dd9e0 (0x285da6a40:0) [1024x1024] 0.024292 0.003918 0.002506 .. | |
CCV_NNC_GEMM_FORWARD [387]: [2] -> [1] (0) | |
|-> 1. 0x1438ddb00 (0x285da6a40:0) [1x1024x1024] 0.024292 0.003918 0.002506 .. | |
|-> 2. 0x1438dda50 (0x285da6a80:0) [1x1024x80] 0.635254 0.037811 0.057648 .. | |
|<- 1. 0x1438e0080 (0x285da6900:0) [1x1024x80] 0.120483 0.097351 0.052246 .. | |
CCV_NNC_GEMM_FORWARD [388]: [2] -> [1] (0) | |
|-> 1. 0x1438ddc20 (0x285da61c0:0) [1x1024x80] -0.129639 -0.012672 -0.145508 .. | |
|-> 2. 0x1438ddb70 (0x285da6a00:0) [1x1024x80] -2.470703 -1.506836 -2.023438 .. | |
|<- 1. 0x1438a5e10 (0x285da6a40:0) [1x1024x1024] 4.156250 1.927734 2.832031 .. | |
CCV_NNC_SOFTMAX_FORWARD [389]: [1] -> [1] (0) | |
|-> 1. 0x1438ddcd0 (0x285da6a40:0) [1024x1024] 4.156250 1.927734 2.832031 .. | |
|<- 1. 0x1438ddcd0 (0x285da6a40:0) [1024x1024] 0.020737 0.002234 0.005516 .. | |
CCV_NNC_GEMM_FORWARD [390]: [2] -> [1] (0) | |
|-> 1. 0x1438dddf0 (0x285da6a40:0) [1x1024x1024] 0.020737 0.002234 0.005516 .. | |
|-> 2. 0x1438ddd40 (0x285da6a80:0) [1x1024x80] 0.094360 0.555664 0.795898 .. | |
|<- 1. 0x1438e0130 (0x285da6900:0) [1x1024x80] 0.042542 0.075012 -0.051636 .. | |
CCV_NNC_GEMM_FORWARD [391]: [2] -> [1] (0) | |
|-> 1. 0x1438ddf10 (0x285da61c0:0) [1x1024x80] 0.051453 -0.110107 -0.027237 .. | |
|-> 2. 0x1438dde60 (0x285da6a00:0) [1x1024x80] -0.833008 1.696289 -1.751953 .. | |
|<- 1. 0x1438a5e80 (0x285da6a40:0) [1x1024x1024] 6.093750 4.109375 5.015625 .. | |
CCV_NNC_SOFTMAX_FORWARD [392]: [1] -> [1] (0) | |
|-> 1. 0x1438ddfc0 (0x285da6a40:0) [1024x1024] 6.093750 4.109375 5.015625 .. | |
|<- 1. 0x1438ddfc0 (0x285da6a40:0) [1024x1024] 0.035126 0.004829 0.011955 .. | |
CCV_NNC_GEMM_FORWARD [393]: [2] -> [1] (0) | |
|-> 1. 0x1438de0e0 (0x285da6a40:0) [1x1024x1024] 0.035126 0.004829 0.011955 .. | |
|-> 2. 0x1438de030 (0x285da6a80:0) [1x1024x80] 0.095581 -0.037384 -0.475098 .. | |
|<- 1. 0x1438e01e0 (0x285da6900:0) [1x1024x80] 0.146240 -0.027695 -0.245850 .. | |
CCV_NNC_GEMM_FORWARD [394]: [2] -> [1] (0) | |
|-> 1. 0x1438de200 (0x285da61c0:0) [1x1024x80] -0.039215 -0.091675 -0.002338 .. | |
|-> 2. 0x1438de150 (0x285da6a00:0) [1x1024x80] -1.115234 -1.572266 1.486328 .. | |
|<- 1. 0x1438a5ef0 (0x285da6a40:0) [1x1024x1024] 5.199219 2.582031 2.798828 .. | |
CCV_NNC_SOFTMAX_FORWARD [395]: [1] -> [1] (0) | |
|-> 1. 0x1438de2b0 (0x285da6a40:0) [1024x1024] 5.199219 2.582031 2.798828 .. | |
|<- 1. 0x1438de2b0 (0x285da6a40:0) [1024x1024] 0.042633 0.003113 0.003866 .. | |
CCV_NNC_GEMM_FORWARD [396]: [2] -> [1] (0) | |
|-> 1. 0x1438de3d0 (0x285da6a40:0) [1x1024x1024] 0.042633 0.003113 0.003866 .. | |
|-> 2. 0x1438de320 (0x285da6a80:0) [1x1024x80] 0.318115 0.350098 -0.006535 .. | |
|<- 1. 0x1438e0290 (0x285da6900:0) [1x1024x80] -0.154907 0.117798 0.120850 .. | |
CCV_NNC_GEMM_FORWARD [397]: [2] -> [1] (0) | |
|-> 1. 0x1438de4f0 (0x285da61c0:0) [1x1024x80] -0.017166 -0.081970 0.087646 .. | |
|-> 2. 0x1438de440 (0x285da6a00:0) [1x1024x80] 1.744141 -0.133789 1.097656 .. | |
|<- 1. 0x1438a5f60 (0x285da6a40:0) [1x1024x1024] 3.775391 2.425781 2.640625 .. | |
CCV_NNC_SOFTMAX_FORWARD [398]: [1] -> [1] (0) | |
|-> 1. 0x1438de5a0 (0x285da6a40:0) [1024x1024] 3.775391 2.425781 2.640625 .. | |
|<- 1. 0x1438de5a0 (0x285da6a40:0) [1024x1024] 0.020065 0.005203 0.006451 .. | |
CCV_NNC_GEMM_FORWARD [399]: [2] -> [1] (0) | |
|-> 1. 0x1438de6c0 (0x285da6a40:0) [1x1024x1024] 0.020065 0.005203 0.006451 .. | |
|-> 2. 0x1438de610 (0x285da6a80:0) [1x1024x80] -0.410400 0.046173 0.415527 .. | |
|<- 1. 0x1438e0340 (0x285da6900:0) [1x1024x80] -0.011215 0.166138 0.009338 .. | |
CCV_NNC_GEMM_FORWARD [400]: [2] -> [1] (0) | |
|-> 1. 0x1438de7e0 (0x285da61c0:0) [1x1024x80] 0.087097 -0.124390 0.137573 .. | |
|-> 2. 0x1438de730 (0x285da6a00:0) [1x1024x80] 0.666016 -1.976562 -1.167969 .. | |
|<- 1. 0x1438a5fd0 (0x285da6a40:0) [1x1024x1024] 3.236328 2.248047 2.550781 .. | |
CCV_NNC_SOFTMAX_FORWARD [401]: [1] -> [1] (0) | |
|-> 1. 0x1438de890 (0x285da6a40:0) [1024x1024] 3.236328 2.248047 2.550781 .. | |
|<- 1. 0x1438de890 (0x285da6a40:0) [1024x1024] 0.005947 0.002214 0.002996 .. | |
CCV_NNC_GEMM_FORWARD [402]: [2] -> [1] (0) | |
|-> 1. 0x1438de9b0 (0x285da6a40:0) [1x1024x1024] 0.005947 0.002214 0.002996 .. | |
|-> 2. 0x1438de900 (0x285da6a80:0) [1x1024x80] 0.152222 0.447998 -0.931152 .. | |
|<- 1. 0x1438e03f0 (0x285da6900:0) [1x1024x80] 0.197144 0.156372 -0.209839 .. | |
CCV_NNC_GEMM_FORWARD [403]: [2] -> [1] (0) | |
|-> 1. 0x1438dead0 (0x285da61c0:0) [1x1024x80] -0.092834 0.040253 -0.051239 .. | |
|-> 2. 0x1438dea20 (0x285da6a00:0) [1x1024x80] -0.705566 0.117432 -0.708008 .. | |
|<- 1. 0x1438a6040 (0x285da6a40:0) [1x1024x1024] 1.405273 1.069336 1.289062 .. | |
CCV_NNC_SOFTMAX_FORWARD [404]: [1] -> [1] (0) | |
|-> 1. 0x1438deb80 (0x285da6a40:0) [1024x1024] 1.405273 1.069336 1.289062 .. | |
|<- 1. 0x1438deb80 (0x285da6a40:0) [1024x1024] 0.002813 0.002010 0.002504 .. | |
CCV_NNC_GEMM_FORWARD [405]: [2] -> [1] (0) | |
|-> 1. 0x1438deca0 (0x285da6a40:0) [1x1024x1024] 0.002813 0.002010 0.002504 .. | |
|-> 2. 0x1438debf0 (0x285da6a80:0) [1x1024x80] -0.702148 0.228027 0.257080 .. | |
|<- 1. 0x1438e04a0 (0x285da6900:0) [1x1024x80] -0.105469 0.167114 0.158203 .. | |
CCV_NNC_GEMM_FORWARD [406]: [2] -> [1] (0) | |
|-> 1. 0x1438dedc0 (0x285da61c0:0) [1x1024x80] -0.032654 -0.016022 -0.220581 .. | |
|-> 2. 0x1438ded10 (0x285da6a00:0) [1x1024x80] -2.205078 1.277344 0.299072 .. | |
|<- 1. 0x1438a60b0 (0x285da6a40:0) [1x1024x1024] 4.171875 3.775391 3.832031 .. | |
CCV_NNC_SOFTMAX_FORWARD [407]: [1] -> [1] (0) | |
|-> 1. 0x1438dee70 (0x285da6a40:0) [1024x1024] 4.171875 3.775391 3.832031 .. | |
|<- 1. 0x1438dee70 (0x285da6a40:0) [1024x1024] 0.004757 0.003199 0.003386 .. | |
CCV_NNC_GEMM_FORWARD [408]: [2] -> [1] (0) | |
|-> 1. 0x1438def90 (0x285da6a40:0) [1x1024x1024] 0.004757 0.003199 0.003386 .. | |
|-> 2. 0x1438deee0 (0x285da6a80:0) [1x1024x80] 0.172607 0.293945 0.113037 .. | |
|<- 1. 0x1438e0550 (0x285da6900:0) [1x1024x80] -0.015930 0.073975 0.182617 .. | |
CCV_NNC_GEMM_FORWARD [409]: [2] -> [1] (0) | |
|-> 1. 0x1438df0b0 (0x285da61c0:0) [1x1024x80] 0.027542 0.017517 -0.111816 .. | |
|-> 2. 0x1438df000 (0x285da6a00:0) [1x1024x80] 1.426758 -0.935059 -0.490967 .. | |
|<- 1. 0x1438a6120 (0x285da6a40:0) [1x1024x1024] 3.460938 1.697266 1.443359 .. | |
CCV_NNC_SOFTMAX_FORWARD [410]: [1] -> [1] (0) | |
|-> 1. 0x1438df160 (0x285da6a40:0) [1024x1024] 3.460938 1.697266 1.443359 .. | |
|<- 1. 0x1438df160 (0x285da6a40:0) [1024x1024] 0.018478 0.003166 0.002457 .. | |
CCV_NNC_GEMM_FORWARD [411]: [2] -> [1] (0) | |
|-> 1. 0x1438df280 (0x285da6a40:0) [1x1024x1024] 0.018478 0.003166 0.002457 .. | |
|-> 2. 0x1438df1d0 (0x285da6a80:0) [1x1024x80] 0.607910 0.047882 0.110474 .. | |
|<- 1. 0x1438e0600 (0x285da6900:0) [1x1024x80] 0.119263 0.173218 0.064758 .. | |
CCV_NNC_GEMM_FORWARD [412]: [2] -> [1] (0) | |
|-> 1. 0x1438df3a0 (0x285da61c0:0) [1x1024x80] -0.106445 -0.013931 -0.134888 .. | |
|-> 2. 0x1438df2f0 (0x285da6a00:0) [1x1024x80] -2.423828 -1.475586 -2.005859 .. | |
|<- 1. 0x1438a6190 (0x285da6a40:0) [1x1024x1024] 4.218750 2.298828 3.312500 .. | |
CCV_NNC_SOFTMAX_FORWARD [413]: [1] -> [1] (0) | |
|-> 1. 0x1438df450 (0x285da6a40:0) [1024x1024] 4.218750 2.298828 3.312500 .. | |
|<- 1. 0x1438df450 (0x285da6a40:0) [1024x1024] 0.017838 0.002615 0.007206 .. | |
CCV_NNC_GEMM_FORWARD [414]: [2] -> [1] (0) | |
|-> 1. 0x1438df570 (0x285da6a40:0) [1x1024x1024] 0.017838 0.002615 0.007206 .. | |
|-> 2. 0x1438df4c0 (0x285da6a80:0) [1x1024x80] 0.096375 0.453369 0.812500 .. | |
|<- 1. 0x1438e06b0 (0x285da6900:0) [1x1024x80] 0.111572 0.018936 0.000479 .. | |
CCV_NNC_GEMM_FORWARD [415]: [2] -> [1] (0) | |
|-> 1. 0x1438df690 (0x285da61c0:0) [1x1024x80] 0.038483 -0.093567 -0.032227 .. | |
|-> 2. 0x1438df5e0 (0x285da6a00:0) [1x1024x80] -0.815918 1.705078 -1.846680 .. | |
|<- 1. 0x1438a6200 (0x285da6a40:0) [1x1024x1024] 5.933594 4.253906 4.980469 .. | |
CCV_NNC_SOFTMAX_FORWARD [416]: [1] -> [1] (0) | |
|-> 1. 0x1438df740 (0x285da6a40:0) [1024x1024] 5.933594 4.253906 4.980469 .. | |
|<- 1. 0x1438df740 (0x285da6a40:0) [1024x1024] 0.033173 0.006184 0.012787 .. | |
CCV_NNC_GEMM_FORWARD [417]: [2] -> [1] (0) | |
|-> 1. 0x1438df860 (0x285da6a40:0) [1x1024x1024] 0.033173 0.006184 0.012787 .. | |
|-> 2. 0x1438df7b0 (0x285da6a80:0) [1x1024x80] -0.008102 0.009789 -0.357422 .. | |
|<- 1. 0x1438e0760 (0x285da6900:0) [1x1024x80] 0.023224 -0.078186 -0.232178 .. | |
CCV_NNC_GEMM_FORWARD [418]: [2] -> [1] (0) | |
|-> 1. 0x1438df980 (0x285da61c0:0) [1x1024x80] -0.027267 -0.082520 0.016251 .. | |
|-> 2. 0x1438df8d0 (0x285da6a00:0) [1x1024x80] -0.986328 -1.624023 1.705078 .. | |
|<- 1. 0x1438a6270 (0x285da6a40:0) [1x1024x1024] 4.851562 2.693359 2.812500 .. | |
CCV_NNC_SOFTMAX_FORWARD [419]: [1] -> [1] (0) | |
|-> 1. 0x1438dfa30 (0x285da6a40:0) [1024x1024] 4.851562 2.693359 2.812500 .. | |
|<- 1. 0x1438dfa30 (0x285da6a40:0) [1024x1024] 0.029175 0.003372 0.003798 .. | |
CCV_NNC_GEMM_FORWARD [420]: [2] -> [1] (0) | |
|-> 1. 0x1438dfb50 (0x285da6a40:0) [1x1024x1024] 0.029175 0.003372 0.003798 .. | |
|-> 2. 0x1438dfaa0 (0x285da6a80:0) [1x1024x80] 0.325195 0.280273 0.072632 .. | |
|<- 1. 0x1438e0810 (0x285da6900:0) [1x1024x80] -0.245361 0.074158 0.215332 .. | |
CCV_NNC_GEMM_FORWARD [421]: [2] -> [1] (0) | |
|-> 1. 0x1438dfc70 (0x285da61c0:0) [1x1024x80] -0.017166 -0.070496 0.091309 .. | |
|-> 2. 0x1438dfbc0 (0x285da6a00:0) [1x1024x80] 1.819336 -0.112854 1.263672 .. | |
|<- 1. 0x1438a62e0 (0x285da6a40:0) [1x1024x1024] 3.550781 2.378906 2.474609 .. | |
CCV_NNC_SOFTMAX_FORWARD [422]: [1] -> [1] (0) | |
|-> 1. 0x1438dfd20 (0x285da6a40:0) [1024x1024] 3.550781 2.378906 2.474609 .. | |
|<- 1. 0x1438dfd20 (0x285da6a40:0) [1024x1024] 0.017593 0.005447 0.005997 .. | |
CCV_NNC_GEMM_FORWARD [423]: [2] -> [1] (0) | |
|-> 1. 0x1438dfe40 (0x285da6a40:0) [1x1024x1024] 0.017593 0.005447 0.005997 .. | |
|-> 2. 0x1438dfd90 (0x285da6a80:0) [1x1024x80] -0.548340 0.207520 0.329590 .. | |
|<- 1. 0x1438e08c0 (0x285da6900:0) [1x1024x80] -0.087341 0.180542 0.006233 .. | |
CCV_NNC_TRANSPOSE_FORWARD [424]: [1] -> [1] (0) | |
|-> 1. 0x1438e0970 (0x285da6900:0) [2x8x1024x80] 0.265381 0.010628 -0.298096 .. | |
|<- 1. 0x1438a63c0 (0x285da6a80:0) [2x1024x8x80] 0.265381 0.010628 -0.298096 .. | |
CCV_NNC_GEMM_FORWARD [425]: [3] -> [1] (0) | |
|-> 1. 0x1438e09e0 (0x285da6a80:0) [2x1024x640] 0.265381 0.010628 -0.298096 .. | |
|-> 2. 0x1438c1400 (0x285d86ac0:0) [640x640] 0.014511 -0.044617 -0.003338 .. | |
|-> 3. 0x1438c1470 (0x285d86b00:0) [640] 0.025314 -0.092285 0.005138 .. | |
|<- 1. 0x1438a6430 (0x285da6900:0) [2x1024x640] 0.065735 -0.153809 0.075806 .. | |
CCV_NNC_ADD_FORWARD [426]: [2] -> [1] (0) | |
|-> 1. 0x1438a6430 (0x285da6900:0) [2x1024x640] 0.065735 -0.153809 0.075806 .. | |
|-> 2. 0x1438dceb0 (0x285da6480:0) [2x1024x640] -0.096313 0.765625 0.216919 .. | |
|<- 1. 0x1438a6430 (0x285da6900:0) [2x1024x640] -0.030579 0.611816 0.292725 .. | |
CCV_NNC_LAYER_NORM_FORWARD [427]: [3] -> [3] (0) | |
|-> 1. 0x1438a6430 (0x285da6900:0) [2x1024x640] -0.030579 0.611816 0.292725 .. | |
|-> 2. 0x1438c14e0 (0x285d86b40:0) [1x1x640] 0.397217 0.405762 0.360596 .. | |
|-> 3. 0x1438c1550 (0x285d86b80:0) [1x1x640] 0.145630 0.032623 -0.199097 .. | |
|<- 1. 0x1438a64a0 (0x285da6480:0) [2x1024x640] 0.158325 0.280273 -0.082581 .. | |
|<- 2. 0x1438a6510 (0x285da6ac0:0) [2x1024x1] -0.065979 .. | |
|<- 3. 0x1438a6580 (0x285da6b00:0) [2x1024x1] 0.900879 .. | |
CCV_NNC_GEMM_FORWARD [428]: [2] -> [1] (0) | |
|-> 1. 0x1438a64a0 (0x285da6480:0) [2x1024x640] 0.158325 0.280273 -0.082581 .. | |
|-> 2. 0x1438c15c0 (0x285d86bc0:0) [640x640] -0.017227 0.001777 -0.034637 .. | |
|<- 1. 0x1438a65f0 (0x285da6a00:0) [2x1024x640] -0.191772 0.359131 -0.877441 .. | |
CCV_NNC_SCALAR_MUL_FORWARD [429]: [1] -> [1] (0) | |
|-> 1. 0x1438a65f0 (0x285da6a00:0) [2x1024x640] -0.191772 0.359131 -0.877441 .. | |
|<- 1. 0x1438a65f0 (0x285da6a00:0) [2x1024x640] -0.021439 0.040161 -0.098083 .. | |
CCV_NNC_TRANSPOSE_FORWARD [430]: [1] -> [1] (0) | |
|-> 1. 0x1438e0ac0 (0x285da6a00:0) [2x1024x8x80] -0.021439 0.040161 -0.098083 .. | |
|<- 1. 0x1438a6740 (0x285da6a80:0) [2x8x1024x80] -0.021439 0.040161 -0.098083 .. | |
CCV_NNC_GEMM_FORWARD [431]: [2] -> [1] (0) | |
Wait: (0, 32) | |
|-> 1. 0x1438a6740 (0x285da6a80:0) [2x8x1024x80] -0.021439 0.040161 -0.098083 .. | |
|-> 2. 0x1438a66d0 (0x285da6b80:0) [2x8x133x80] -0.381836 -0.479736 0.379883 .. | |
|<- 1. 0x1438a67b0 (0x285da6bc0:0) [2x8x1024x133] 7.480469 0.335205 1.155273 .. | |
CCV_NNC_SOFTMAX_FORWARD [432]: [1] -> [1] (0) | |
|-> 1. 0x1438e0b30 (0x285da6bc0:0) [16384x133] 7.480469 0.335205 1.155273 .. | |
|<- 1. 0x1438e0b30 (0x285da6bc0:0) [16384x133] 0.817871 0.000645 0.001464 .. | |
CCV_NNC_GEMM_FORWARD [433]: [2] -> [1] (0) | |
Wait: (0, 33) | |
|-> 1. 0x1438e0c10 (0x285da6bc0:0) [2x8x1024x133] 0.817871 0.000645 0.001464 .. | |
|-> 2. 0x1438a6890 (0x285da6c40:0) [2x8x133x80] 0.031586 0.014740 -0.047302 .. | |
|<- 1. 0x1438a6900 (0x285da6a80:0) [2x8x1024x80] 0.018341 0.024033 -0.024689 .. | |
CCV_NNC_TRANSPOSE_FORWARD [434]: [1] -> [1] (0) | |
|-> 1. 0x1438e0c80 (0x285da6a80:0) [2x8x1024x80] 0.018341 0.024033 -0.024689 .. | |
|<- 1. 0x1438a6970 (0x285da6480:0) [2x1024x8x80] 0.018341 0.024033 -0.024689 .. | |
CCV_NNC_GEMM_FORWARD [435]: [3] -> [1] (0) | |
|-> 1. 0x1438e0cf0 (0x285da6480:0) [2x1024x640] 0.018341 0.024033 -0.024689 .. | |
|-> 2. 0x1438c1710 (0x285d86c80:0) [640x640] 0.006489 0.004543 -0.020630 .. | |
|-> 3. 0x1438c1780 (0x285d86cc0:0) [640] -0.030243 -0.027390 -0.015312 .. | |
|<- 1. 0x1438a69e0 (0x285da69c0:0) [2x1024x640] 0.121094 -0.053955 -0.106079 .. | |
CCV_NNC_ADD_FORWARD [436]: [2] -> [1] (0) | |
|-> 1. 0x1438a69e0 (0x285da69c0:0) [2x1024x640] 0.121094 -0.053955 -0.106079 .. | |
|-> 2. 0x1438a6430 (0x285da6900:0) [2x1024x640] -0.030579 0.611816 0.292725 .. | |
|<- 1. 0x1438a69e0 (0x285da69c0:0) [2x1024x640] 0.090515 0.557617 0.186646 .. | |
CCV_NNC_LAYER_NORM_FORWARD [437]: [3] -> [3] (0) | |
|-> 1. 0x1438a69e0 (0x285da69c0:0) [2x1024x640] 0.090515 0.557617 0.186646 .. | |
|-> 2. 0x1438c17f0 (0x285d86d00:0) [1x1x640] 0.336426 0.341064 0.359131 .. | |
|-> 3. 0x1438c1860 (0x285d86d40:0) [1x1x640] 0.066956 0.044464 -0.004032 .. | |
|<- 1. 0x1438a6a50 (0x285da6c80:0) [2x1024x640] 0.118164 0.241577 0.082092 .. | |
|<- 2. 0x1438a6ac0 (0x285da6cc0:0) [2x1024x1] -0.076477 .. | |
|<- 3. 0x1438a6b30 (0x285da6d00:0) [2x1024x1] 0.911621 .. | |
Emit: (0, 34) | |
CCV_NNC_GEMM_FORWARD [438]: [3] -> [1] (0) | |
|-> 1. 0x1438a6a50 (0x285da6c80:0) [2x1024x640] 0.118164 0.241577 0.082092 .. | |
|-> 2. 0x1438c18d0 (0x285d86d80:0) [2560x640] 0.056854 0.001586 -0.018921 .. | |
|-> 3. 0x1438c1940 (0x285d86dc0:0) [2560] 0.042633 0.058716 0.007183 .. | |
|<- 1. 0x1438a6ba0 (0x285da6740:0) [2x1024x2560] -0.250000 -0.606934 -0.143677 .. | |
CCV_NNC_GELU_FORWARD [439]: [1] -> [1] (0) | |
|-> 1. 0x1438a6ba0 (0x285da6740:0) [2x1024x2560] -0.250000 -0.606934 -0.143677 .. | |
|<- 1. 0x1438a6ba0 (0x285da6740:0) [2x1024x2560] -0.100342 -0.165039 -0.063660 .. | |
CCV_NNC_GEMM_FORWARD [440]: [3] -> [1] (1) | |
Wait: (1, 34) | |
|-> 1. 0x1438a6a50 (0x285da6c80:0) [2x1024x640] 0.118164 0.241577 0.082092 .. | |
|-> 2. 0x1438c19b0 (0x285d86e00:0) [2560x640] -0.040924 -0.039307 0.095337 .. | |
|-> 3. 0x1438c1a20 (0x285d86e40:0) [2560] -0.001872 0.017807 0.035004 .. | |
|<- 1. 0x1438a6c10 (0x285da6780:0) [2x1024x2560] -0.643555 0.389648 0.595215 .. | |
Emit: (1, 35) | |
CCV_NNC_MUL_FORWARD [441]: [2] -> [1] (0) | |
Wait: (0, 35) | |
|-> 1. 0x1438a6c10 (0x285da6780:0) [2x1024x2560] -0.643555 0.389648 0.595215 .. | |
|-> 2. 0x1438a6ba0 (0x285da6740:0) [2x1024x2560] -0.100342 -0.165039 -0.063660 .. | |
|<- 1. 0x1438a6c10 (0x285da6780:0) [2x1024x2560] 0.064575 -0.064331 -0.037903 .. | |
CCV_NNC_GEMM_FORWARD [442]: [3] -> [1] (0) | |
|-> 1. 0x1438a6c10 (0x285da6780:0) [2x1024x2560] 0.064575 -0.064331 -0.037903 .. | |
|-> 2. 0x1438c1a90 (0x285d86e80:0) [640x2560] 0.041840 0.020172 0.001719 .. | |
|-> 3. 0x1438c1b00 (0x285d86ec0:0) [640] -0.002460 0.025970 0.007858 .. | |
|<- 1. 0x1438a6c80 (0x285da61c0:0) [2x1024x640] 0.011269 -1.174805 -1.065430 .. | |
CCV_NNC_ADD_FORWARD [443]: [2] -> [1] (0) | |
|-> 1. 0x1438a6c80 (0x285da61c0:0) [2x1024x640] 0.011269 -1.174805 -1.065430 .. | |
|-> 2. 0x1438a69e0 (0x285da69c0:0) [2x1024x640] 0.090515 0.557617 0.186646 .. | |
|<- 1. 0x1438a6c80 (0x285da61c0:0) [2x1024x640] 0.101807 -0.617188 -0.878906 .. | |
CCV_NNC_CONVOLUTION_FORWARD [444]: [3] -> [1] (0) | |
|-> 1. 0x1438e0d60 (0x285da61c0:0) [2x32x32x640] 0.101807 -0.617188 -0.878906 .. | |
|-> 2. 0x1438c1b70 (0x285d86f00:0) [640x640x1x1] -0.002705 .. | |
|-> 3. 0x1438c1be0 (0x285d86f40:0) [640] -0.061615 -0.015152 0.004658 .. | |
|<- 1. 0x1438a6cf0 (0x285da69c0:0) [2x32x32x640] 1.405273 0.543457 -0.504883 .. | |
CCV_NNC_ADD_FORWARD [445]: [2] -> [1] (0) | |
|-> 1. 0x1438a6cf0 (0x285da69c0:0) [2x32x32x640] 1.405273 0.543457 -0.504883 .. | |
|-> 2. 0x1438a5630 (0x285da62c0:0) [2x32x32x640] -3.199219 0.046875 1.228516 .. | |
|<- 1. 0x1438f96c0 (0x285d8a540:0) [2x32x32x640] -1.793945 0.590332 0.723633 .. | |
CCV_NNC_CONVOLUTION_FORWARD [446]: [3] -> [1] (0) | |
|-> 1. 0x1438f96c0 (0x285d8a540:0) [2x32x32x640] -1.793945 0.590332 0.723633 .. | |
|-> 2. 0x1438c1c50 (0x285d86f80:0) [640x640x3x3] 0.002350 -0.003546 -0.003578 .. | |
|-> 3. 0x1438c1cc0 (0x285d86fc0:0) [640] 0.015541 -0.005711 0.016861 .. | |
|<- 1. 0x1438f55d0 (0x285d8f6c0:0) [2x16x16x640] 0.511230 1.206055 0.435791 .. | |
Emit: (0, 37) | |
CCV_NNC_GROUP_NORM_FORWARD [447]: [3] -> [3] (0) | |
|-> 1. 0x1438f55d0 (0x285d8f6c0:0) [2x16x16x640] 0.511230 1.206055 0.435791 .. | |
|-> 2. 0x1438c1d30 (0x285d87000:0) [1x1x1x640] 0.273926 0.466309 0.314697 .. | |
|-> 3. 0x1438c1da0 (0x285d87040:0) [1x1x1x640] -0.018585 -0.111938 -0.034729 .. | |
|<- 1. 0x1438a6d60 (0x285da6d40:0) [2x16x16x640] 0.130005 0.520996 0.108154 .. | |
|<- 2. 0x1438a6dd0 (0x285da6800:0) [2x1x1x32] 0.048676 0.003143 0.062347 .. | |
|<- 3. 0x1438a6e40 (0x285da67c0:0) [2x1x1x32] 1.172852 1.277344 1.097656 .. | |
CCV_NNC_SWISH_FORWARD [448]: [1] -> [1] (0) | |
|-> 1. 0x1438a6d60 (0x285da6d40:0) [2x16x16x640] 0.130005 0.520996 0.108154 .. | |
|<- 1. 0x1438a6d60 (0x285da6d40:0) [2x16x16x640] 0.069214 0.326904 0.057007 .. | |
CCV_NNC_CONVOLUTION_FORWARD [449]: [3] -> [1] (0) | |
|-> 1. 0x1438a6d60 (0x285da6d40:0) [2x16x16x640] 0.069214 0.326904 0.057007 .. | |
|-> 2. 0x1438c1ef0 (0x285d87100:0) [1280x640x3x3] -0.047272 0.032166 0.071716 .. | |
|-> 3. 0x1438c1f60 (0x285d87140:0) [1280] 0.016006 0.001427 0.001047 .. | |
|<- 1. 0x1438a6f20 (0x285da6dc0:0) [2x16x16x1280] 0.482910 0.290771 -0.923828 .. | |
CCV_NNC_ADD_FORWARD [450]: [2] -> [1] (0) | |
Wait: (0, 36) | |
|-> 1. 0x1438a6f20 (0x285da6dc0:0) [2x16x16x1280] 0.482910 0.290771 -0.923828 .. | |
|-> 2. 0x1438e0dd0 (0x285da6d80:0) [2x1x1x1280] 0.093994 0.277832 0.315918 .. | |
|<- 1. 0x1438a6f20 (0x285da6dc0:0) [2x16x16x1280] 0.577148 0.568359 -0.607910 .. | |
CCV_NNC_GROUP_NORM_FORWARD [451]: [3] -> [3] (0) | |
|-> 1. 0x1438a6f20 (0x285da6dc0:0) [2x16x16x1280] 0.577148 0.568359 -0.607910 .. | |
|-> 2. 0x1438c1fd0 (0x285d87180:0) [1x1x1x1280] 0.351807 0.352783 0.389404 .. | |
|-> 3. 0x1438c2040 (0x285d871c0:0) [1x1x1x1280] -0.060883 -0.064331 -0.050873 .. | |
|<- 1. 0x1438a6f90 (0x285da6e00:0) [2x16x16x1280] 0.344238 0.337646 -0.254150 .. | |
|<- 2. 0x1438a7000 (0x285da6e40:0) [2x1x1x32] -0.238403 -0.539062 -0.552734 .. | |
|<- 3. 0x1438a7070 (0x285da6e80:0) [2x1x1x32] 1.412109 0.240601 0.430664 .. | |
CCV_NNC_SWISH_FORWARD [452]: [1] -> [1] (0) | |
|-> 1. 0x1438a6f90 (0x285da6e00:0) [2x16x16x1280] 0.344238 0.337646 -0.254150 .. | |
|<- 1. 0x1438a6f90 (0x285da6e00:0) [2x16x16x1280] 0.201416 0.197021 -0.111023 .. | |
CCV_NNC_CONVOLUTION_FORWARD [453]: [3] -> [1] (0) | |
|-> 1. 0x1438a6f90 (0x285da6e00:0) [2x16x16x1280] 0.201416 0.197021 -0.111023 .. | |
|-> 2. 0x1438c20b0 (0x285d87200:0) [1280x1280x3x3] 0.057434 -0.026169 -0.027893 .. | |
|-> 3. 0x1438c2120 (0x285d87240:0) [1280] 0.034912 0.017990 0.040131 .. | |
|<- 1. 0x1438a70e0 (0x285da6dc0:0) [2x16x16x1280] -0.461914 -0.300781 -1.104492 .. | |
CCV_NNC_CONVOLUTION_FORWARD [454]: [3] -> [1] (1) | |
Wait: (1, 37) | |
|-> 1. 0x1438f55d0 (0x285d8f6c0:0) [2x16x16x640] 0.511230 1.206055 0.435791 .. | |
|-> 2. 0x1438c2190 (0x285d87280:0) [1280x640x1x1] 0.004993 .. | |
|-> 3. 0x1438c2200 (0x285d872c0:0) [1280] 0.042450 0.028534 0.049713 .. | |
|<- 1. 0x1438a7150 (0x285da6f00:0) [2x16x16x1280] 0.120300 0.447754 0.978516 .. | |
Emit: (1, 38) | |
CCV_NNC_ADD_FORWARD [455]: [2] -> [1] (0) | |
Wait: (0, 38) | |
|-> 1. 0x1438a7150 (0x285da6f00:0) [2x16x16x1280] 0.120300 0.447754 0.978516 .. | |
|-> 2. 0x1438a70e0 (0x285da6dc0:0) [2x16x16x1280] -0.461914 -0.300781 -1.104492 .. | |
|<- 1. 0x1438a7150 (0x285da6f00:0) [2x16x16x1280] -0.341553 0.146973 -0.125977 .. | |
CCV_NNC_GROUP_NORM_FORWARD [456]: [3] -> [3] (0) | |
|-> 1. 0x1438a7150 (0x285da6f00:0) [2x16x16x1280] -0.341553 0.146973 -0.125977 .. | |
|-> 2. 0x1438c2270 (0x285d87300:0) [1x1x1x1280] 0.224976 0.224609 0.224731 .. | |
|-> 3. 0x1438c22e0 (0x285d87340:0) [1x1x1x1280] -0.013771 0.003616 0.001595 .. | |
|<- 1. 0x1438a71c0 (0x285da6e00:0) [2x16x16x1280] -0.055328 0.083130 0.013512 .. | |
|<- 2. 0x1438a7230 (0x285da6800:0) [2x1x1x32] -0.174072 -0.127808 -0.152222 .. | |
|<- 3. 0x1438a72a0 (0x285da67c0:0) [2x1x1x32] 1.102539 1.019531 0.989746 .. | |
CCV_NNC_CONVOLUTION_FORWARD [457]: [3] -> [1] (0) | |
|-> 1. 0x1438a71c0 (0x285da6e00:0) [2x16x16x1280] -0.055328 0.083130 0.013512 .. | |
|-> 2. 0x1438c2350 (0x285d87380:0) [1280x1280x1x1] -0.000048 .. | |
|-> 3. 0x1438c23c0 (0x285d873c0:0) [1280] -0.010078 -0.024460 0.010605 .. | |
|<- 1. 0x1438a7310 (0x285da6dc0:0) [2x16x16x1280] 0.916016 0.061157 0.760742 .. | |
CCV_NNC_LAYER_NORM_FORWARD [458]: [3] -> [3] (0) | |
|-> 1. 0x1438e0e40 (0x285da6dc0:0) [2x256x1280] 0.916016 0.061157 0.760742 .. | |
|-> 2. 0x1438c2430 (0x285d87400:0) [1x1x1280] 0.296143 0.296631 0.322021 .. | |
|-> 3. 0x1438c24a0 (0x285d87440:0) [1x1x1280] 0.009285 -0.026138 0.003679 .. | |
|<- 1. 0x1438a7380 (0x285da6e00:0) [2x256x1280] 0.315430 -0.002338 0.280762 .. | |
|<- 2. 0x1438a73f0 (0x285da6f40:0) [2x256x1] -0.010788 .. | |
|<- 3. 0x1438a7460 (0x285da6f80:0) [2x256x1] 1.115234 .. | |
Emit: (0, 39) | |
CCV_NNC_GEMM_FORWARD [459]: [2] -> [1] (0) | |
|-> 1. 0x1438a7380 (0x285da6e00:0) [2x256x1280] 0.315430 -0.002338 0.280762 .. | |
|-> 2. 0x1438c2510 (0x285d87480:0) [1280x1280] -0.022614 -0.011375 0.041016 .. | |
|<- 1. 0x1438a74d0 (0x285da6fc0:0) [2x256x1280] 0.355957 -0.752930 -0.484131 .. | |
CCV_NNC_SCALAR_MUL_FORWARD [460]: [1] -> [1] (0) | |
|-> 1. 0x1438a74d0 (0x285da6fc0:0) [2x256x1280] 0.355957 -0.752930 -0.484131 .. | |
|<- 1. 0x1438a74d0 (0x285da6fc0:0) [2x256x1280] 0.028137 -0.059509 -0.038269 .. | |
CCV_NNC_TRANSPOSE_FORWARD [461]: [1] -> [1] (0) | |
|-> 1. 0x1438e0f20 (0x285da6fc0:0) [2x256x8x160] 0.028137 -0.059509 -0.038269 .. | |
|<- 1. 0x1438a7620 (0x285da7080:0) [2x8x256x160] 0.028137 -0.059509 -0.038269 .. | |
CCV_NNC_GEMM_FORWARD [462]: [2] -> [1] (1) | |
Wait: (1, 39) | |
|-> 1. 0x1438a7380 (0x285da6e00:0) [2x256x1280] 0.315430 -0.002338 0.280762 .. | |
|-> 2. 0x1438c2580 (0x285d874c0:0) [1280x1280] 0.106079 -0.006134 -0.057587 .. | |
|<- 1. 0x1438a7540 (0x285da7000:0) [2x256x1280] 0.707031 -0.326416 0.686035 .. | |
CCV_NNC_TRANSPOSE_FORWARD [463]: [1] -> [1] (1) | |
|-> 1. 0x1438e0eb0 (0x285da7000:0) [2x256x8x160] 0.707031 -0.326416 0.686035 .. | |
|<- 1. 0x1438a75b0 (0x285da7040:0) [2x8x256x160] 0.707031 -0.326416 0.686035 .. | |
Emit: (1, 40) | |
CCV_NNC_GEMM_FORWARD [464]: [2] -> [1] (2) | |
Wait: (2, 39) | |
|-> 1. 0x1438a7380 (0x285da6e00:0) [2x256x1280] 0.315430 -0.002338 0.280762 .. | |
|-> 2. 0x1438c25f0 (0x285d87500:0) [1280x1280] 0.055420 0.017975 0.068176 .. | |
|<- 1. 0x1438a7690 (0x285da70c0:0) [2x256x1280] -0.751953 0.787109 0.171875 .. | |
CCV_NNC_TRANSPOSE_FORWARD [465]: [1] -> [1] (2) | |
|-> 1. 0x1438e1070 (0x285da70c0:0) [2x256x8x160] -0.751953 0.787109 0.171875 .. | |
|<- 1. 0x1438a7770 (0x285da7140:0) [2x8x256x160] -0.751953 0.787109 0.171875 .. | |
Emit: (2, 41) | |
CCV_NNC_GEMM_FORWARD [466]: [2] -> [1] (0) | |
Wait: (0, 40) | |
|-> 1. 0x1438e1000 (0x285da7080:0) [1x256x160] 0.028137 -0.059509 -0.038269 .. | |
|-> 2. 0x1438e0f90 (0x285da7040:0) [1x256x160] 0.707031 -0.326416 0.686035 .. | |
|<- 1. 0x1438a7700 (0x285da7100:0) [1x256x256] 4.882812 2.759766 3.513672 .. | |
CCV_NNC_SOFTMAX_FORWARD [467]: [1] -> [1] (0) | |
|-> 1. 0x1438e10e0 (0x285da7100:0) [256x256] 4.882812 2.759766 3.513672 .. | |
|<- 1. 0x1438e10e0 (0x285da7100:0) [256x256] 0.094788 0.011345 0.024109 .. | |
CCV_NNC_GEMM_FORWARD [468]: [2] -> [1] (0) | |
Wait: (0, 41) | |
|-> 1. 0x1438e11c0 (0x285da7100:0) [1x256x256] 0.094788 0.011345 0.024109 .. | |
|-> 2. 0x1438e1150 (0x285da7140:0) [1x256x160] -0.751953 0.787109 0.171875 .. | |
|<- 1. 0x1438e3e40 (0x285da6e00:0) [1x256x160] -0.256104 0.208862 0.047241 .. | |
CCV_NNC_GEMM_FORWARD [469]: [2] -> [1] (0) | |
|-> 1. 0x1438e12e0 (0x285da7080:0) [1x256x160] -0.042328 0.019577 -0.101440 .. | |
|-> 2. 0x1438e1230 (0x285da7040:0) [1x256x160] -0.701172 1.413086 0.542969 .. | |
|<- 1. 0x1438a77e0 (0x285da7100:0) [1x256x256] 6.472656 4.500000 5.277344 .. | |
CCV_NNC_SOFTMAX_FORWARD [470]: [1] -> [1] (0) | |
|-> 1. 0x1438e1390 (0x285da7100:0) [256x256] 6.472656 4.500000 5.277344 .. | |
|<- 1. 0x1438e1390 (0x285da7100:0) [256x256] 0.058502 0.008141 0.017700 .. | |
CCV_NNC_GEMM_FORWARD [471]: [2] -> [1] (0) | |
|-> 1. 0x1438e14b0 (0x285da7100:0) [1x256x256] 0.058502 0.008141 0.017700 .. | |
|-> 2. 0x1438e1400 (0x285da7140:0) [1x256x160] 0.479492 -0.240845 0.208130 .. | |
|<- 1. 0x1438e3eb0 (0x285da6e00:0) [1x256x160] 0.035278 -0.018234 0.306641 .. | |
CCV_NNC_GEMM_FORWARD [472]: [2] -> [1] (0) | |
|-> 1. 0x1438e15d0 (0x285da7080:0) [1x256x160] -0.039490 -0.046509 -0.083435 .. | |
|-> 2. 0x1438e1520 (0x285da7040:0) [1x256x160] 1.148438 -1.852539 -2.455078 .. | |
|<- 1. 0x1438a7850 (0x285da7100:0) [1x256x256] 3.619141 -0.240723 0.866211 .. | |
CCV_NNC_SOFTMAX_FORWARD [473]: [1] -> [1] (0) | |
|-> 1. 0x1438e1680 (0x285da7100:0) [256x256] 3.619141 -0.240723 0.866211 .. | |
|<- 1. 0x1438e1680 (0x285da7100:0) [256x256] 0.013039 0.000275 0.000831 .. | |
CCV_NNC_GEMM_FORWARD [474]: [2] -> [1] (0) | |
|-> 1. 0x1438e17a0 (0x285da7100:0) [1x256x256] 0.013039 0.000275 0.000831 .. | |
|-> 2. 0x1438e16f0 (0x285da7140:0) [1x256x160] 0.175171 0.172974 -0.729004 .. | |
|<- 1. 0x1438e3f60 (0x285da6e00:0) [1x256x160] -0.153076 -0.212891 0.104187 .. | |
CCV_NNC_GEMM_FORWARD [475]: [2] -> [1] (0) | |
|-> 1. 0x1438e18c0 (0x285da7080:0) [1x256x160] -0.005409 -0.000726 0.022507 .. | |
|-> 2. 0x1438e1810 (0x285da7040:0) [1x256x160] 0.128418 -1.059570 -0.328613 .. | |
|<- 1. 0x1438a78c0 (0x285da7100:0) [1x256x256] 1.959961 1.376953 1.509766 .. | |
CCV_NNC_SOFTMAX_FORWARD [476]: [1] -> [1] (0) | |
|-> 1. 0x1438e1970 (0x285da7100:0) [256x256] 1.959961 1.376953 1.509766 .. | |
|<- 1. 0x1438e1970 (0x285da7100:0) [256x256] 0.012146 0.006779 0.007744 .. | |
CCV_NNC_GEMM_FORWARD [477]: [2] -> [1] (0) | |
|-> 1. 0x1438e1a90 (0x285da7100:0) [1x256x256] 0.012146 0.006779 0.007744 .. | |
|-> 2. 0x1438e19e0 (0x285da7140:0) [1x256x160] 0.505371 0.581055 -0.445312 .. | |
|<- 1. 0x1438e4010 (0x285da6e00:0) [1x256x160] 0.362793 0.014778 0.280518 .. | |
CCV_NNC_GEMM_FORWARD [478]: [2] -> [1] (0) | |
|-> 1. 0x1438e1bb0 (0x285da7080:0) [1x256x160] 0.002422 0.013702 0.031921 .. | |
|-> 2. 0x1438e1b00 (0x285da7040:0) [1x256x160] 1.154297 0.705566 -0.611328 .. | |
|<- 1. 0x1438a7930 (0x285da7100:0) [1x256x256] 4.734375 1.331055 1.833008 .. | |
CCV_NNC_SOFTMAX_FORWARD [479]: [1] -> [1] (0) | |
|-> 1. 0x1438e1c60 (0x285da7100:0) [256x256] 4.734375 1.331055 1.833008 .. | |
|<- 1. 0x1438e1c60 (0x285da7100:0) [256x256] 0.128662 0.004276 0.007065 .. | |
CCV_NNC_GEMM_FORWARD [480]: [2] -> [1] (0) | |
|-> 1. 0x1438e1d80 (0x285da7100:0) [1x256x256] 0.128662 0.004276 0.007065 .. | |
|-> 2. 0x1438e1cd0 (0x285da7140:0) [1x256x160] -0.613281 0.469727 0.428467 .. | |
|<- 1. 0x1438e40c0 (0x285da6e00:0) [1x256x160] -0.031250 0.179688 0.014679 .. | |
CCV_NNC_GEMM_FORWARD [481]: [2] -> [1] (0) | |
|-> 1. 0x1438e1ea0 (0x285da7080:0) [1x256x160] 0.100281 -0.066895 -0.050751 .. | |
|-> 2. 0x1438e1df0 (0x285da7040:0) [1x256x160] -0.807617 -0.915527 -0.214478 .. | |
|<- 1. 0x1438a79a0 (0x285da7100:0) [1x256x256] 1.790039 0.644043 0.502441 .. | |
CCV_NNC_SOFTMAX_FORWARD [482]: [1] -> [1] (0) | |
|-> 1. 0x1438e1f50 (0x285da7100:0) [256x256] 1.790039 0.644043 0.502441 .. | |
|<- 1. 0x1438e1f50 (0x285da7100:0) [256x256] 0.008904 0.002831 0.002457 .. | |
CCV_NNC_GEMM_FORWARD [483]: [2] -> [1] (0) | |
|-> 1. 0x1438e2070 (0x285da7100:0) [1x256x256] 0.008904 0.002831 0.002457 .. | |
|-> 2. 0x1438e1fc0 (0x285da7140:0) [1x256x160] 0.596191 -0.624023 0.214111 .. | |
|<- 1. 0x1438e4170 (0x285da6e00:0) [1x256x160] -0.063843 -0.168335 -0.070435 .. | |
CCV_NNC_GEMM_FORWARD [484]: [2] -> [1] (0) | |
|-> 1. 0x1438e2190 (0x285da7080:0) [1x256x160] 0.038116 0.057861 0.024002 .. | |
|-> 2. 0x1438e20e0 (0x285da7040:0) [1x256x160] -2.386719 0.047760 -0.548828 .. | |
|<- 1. 0x1438a7a10 (0x285da7100:0) [1x256x256] 5.691406 4.570312 4.808594 .. | |
CCV_NNC_SOFTMAX_FORWARD [485]: [1] -> [1] (0) | |
|-> 1. 0x1438e2240 (0x285da7100:0) [256x256] 5.691406 4.570312 4.808594 .. | |
|<- 1. 0x1438e2240 (0x285da7100:0) [256x256] 0.016617 0.005417 0.006874 .. | |
CCV_NNC_GEMM_FORWARD [486]: [2] -> [1] (0) | |
|-> 1. 0x1438e2360 (0x285da7100:0) [1x256x256] 0.016617 0.005417 0.006874 .. | |
|-> 2. 0x1438e22b0 (0x285da7140:0) [1x256x160] -0.256592 -0.104736 -0.637695 .. | |
|<- 1. 0x1438e4220 (0x285da6e00:0) [1x256x160] -0.047211 -0.195923 -0.123291 .. | |
CCV_NNC_GEMM_FORWARD [487]: [2] -> [1] (0) | |
|-> 1. 0x1438e2480 (0x285da7080:0) [1x256x160] -0.047668 0.008713 0.019104 .. | |
|-> 2. 0x1438e23d0 (0x285da7040:0) [1x256x160] 0.291992 0.872070 0.010788 .. | |
|<- 1. 0x1438a7a80 (0x285da7100:0) [1x256x256] 0.074707 -0.410156 -0.641113 .. | |
CCV_NNC_SOFTMAX_FORWARD [488]: [1] -> [1] (0) | |
|-> 1. 0x1438e2530 (0x285da7100:0) [256x256] 0.074707 -0.410156 -0.641113 .. | |
|<- 1. 0x1438e2530 (0x285da7100:0) [256x256] 0.006721 0.004139 0.003284 .. | |
CCV_NNC_GEMM_FORWARD [489]: [2] -> [1] (0) | |
|-> 1. 0x1438e2650 (0x285da7100:0) [1x256x256] 0.006721 0.004139 0.003284 .. | |
|-> 2. 0x1438e25a0 (0x285da7140:0) [1x256x160] -0.481689 -0.672852 -0.152954 .. | |
|<- 1. 0x1438e42d0 (0x285da6e00:0) [1x256x160] -0.108215 -0.042847 -0.190308 .. | |
CCV_NNC_GEMM_FORWARD [490]: [2] -> [1] (0) | |
|-> 1. 0x1438e2770 (0x285da7080:0) [1x256x160] 0.032257 -0.060242 -0.044037 .. | |
|-> 2. 0x1438e26c0 (0x285da7040:0) [1x256x160] 0.795410 -0.431152 0.629883 .. | |
|<- 1. 0x1438a7af0 (0x285da7100:0) [1x256x256] 4.914062 2.873047 3.279297 .. | |
CCV_NNC_SOFTMAX_FORWARD [491]: [1] -> [1] (0) | |
|-> 1. 0x1438e2820 (0x285da7100:0) [256x256] 4.914062 2.873047 3.279297 .. | |
|<- 1. 0x1438e2820 (0x285da7100:0) [256x256] 0.107849 0.014008 0.021027 .. | |
CCV_NNC_GEMM_FORWARD [492]: [2] -> [1] (0) | |
|-> 1. 0x1438e2940 (0x285da7100:0) [1x256x256] 0.107849 0.014008 0.021027 .. | |
|-> 2. 0x1438e2890 (0x285da7140:0) [1x256x160] -0.669922 0.712402 0.161255 .. | |
|<- 1. 0x1438e4380 (0x285da6e00:0) [1x256x160] -0.199951 0.126953 0.041595 .. | |
CCV_NNC_GEMM_FORWARD [493]: [2] -> [1] (0) | |
|-> 1. 0x1438e2a60 (0x285da7080:0) [1x256x160] -0.038391 0.020187 -0.100281 .. | |
|-> 2. 0x1438e29b0 (0x285da7040:0) [1x256x160] -0.332275 1.332031 0.343018 .. | |
|<- 1. 0x1438a7b60 (0x285da7100:0) [1x256x256] 6.468750 4.593750 5.273438 .. | |
CCV_NNC_SOFTMAX_FORWARD [494]: [1] -> [1] (0) | |
|-> 1. 0x1438e2b10 (0x285da7100:0) [256x256] 6.468750 4.593750 5.273438 .. | |
|<- 1. 0x1438e2b10 (0x285da7100:0) [256x256] 0.065979 0.010117 0.019958 .. | |
CCV_NNC_GEMM_FORWARD [495]: [2] -> [1] (0) | |
|-> 1. 0x1438e2c30 (0x285da7100:0) [1x256x256] 0.065979 0.010117 0.019958 .. | |
|-> 2. 0x1438e2b80 (0x285da7140:0) [1x256x160] 0.428467 -0.251465 0.082031 .. | |
|<- 1. 0x1438e4430 (0x285da6e00:0) [1x256x160] -0.021912 -0.003967 0.127075 .. | |
CCV_NNC_GEMM_FORWARD [496]: [2] -> [1] (0) | |
|-> 1. 0x1438e2d50 (0x285da7080:0) [1x256x160] -0.041290 -0.048462 -0.083313 .. | |
|-> 2. 0x1438e2ca0 (0x285da7040:0) [1x256x160] 1.102539 -2.031250 -2.511719 .. | |
|<- 1. 0x1438a7bd0 (0x285da7100:0) [1x256x256] 3.585938 -0.072998 0.993164 .. | |
CCV_NNC_SOFTMAX_FORWARD [497]: [1] -> [1] (0) | |
|-> 1. 0x1438e2e00 (0x285da7100:0) [256x256] 3.585938 -0.072998 0.993164 .. | |
|<- 1. 0x1438e2e00 (0x285da7100:0) [256x256] 0.012482 0.000322 0.000934 .. | |
CCV_NNC_GEMM_FORWARD [498]: [2] -> [1] (0) | |
|-> 1. 0x1438e2f20 (0x285da7100:0) [1x256x256] 0.012482 0.000322 0.000934 .. | |
|-> 2. 0x1438e2e70 (0x285da7140:0) [1x256x160] 0.198364 -0.013878 -0.708496 .. | |
|<- 1. 0x1438e44e0 (0x285da6e00:0) [1x256x160] -0.229980 -0.289551 0.093201 .. | |
CCV_NNC_GEMM_FORWARD [499]: [2] -> [1] (0) | |
|-> 1. 0x1438e3040 (0x285da7080:0) [1x256x160] -0.005821 -0.014534 0.018280 .. | |
|-> 2. 0x1438e2f90 (0x285da7040:0) [1x256x160] 0.269775 -1.095703 -0.198120 .. | |
|<- 1. 0x1438a7c40 (0x285da7100:0) [1x256x256] 2.164062 1.581055 1.705078 .. | |
CCV_NNC_SOFTMAX_FORWARD [500]: [1] -> [1] (0) | |
|-> 1. 0x1438e30f0 (0x285da7100:0) [256x256] 2.164062 1.581055 1.705078 .. | |
|<- 1. 0x1438e30f0 (0x285da7100:0) [256x256] 0.015244 0.008514 0.009636 .. | |
CCV_NNC_GEMM_FORWARD [501]: [2] -> [1] (0) | |
|-> 1. 0x1438e3210 (0x285da7100:0) [1x256x256] 0.015244 0.008514 0.009636 .. | |
|-> 2. 0x1438e3160 (0x285da7140:0) [1x256x160] 0.503418 0.542480 -0.369141 .. | |
|<- 1. 0x1438e4590 (0x285da6e00:0) [1x256x160] 0.316406 -0.060425 0.264648 .. | |
CCV_NNC_GEMM_FORWARD [502]: [2] -> [1] (0) | |
|-> 1. 0x1438e3330 (0x285da7080:0) [1x256x160] 0.001838 0.020554 0.028427 .. | |
|-> 2. 0x1438e3280 (0x285da7040:0) [1x256x160] 1.364258 0.760254 -0.581543 .. | |
|<- 1. 0x1438a7cb0 (0x285da7100:0) [1x256x256] 4.667969 1.554688 2.054688 .. | |
CCV_NNC_SOFTMAX_FORWARD [503]: [1] -> [1] (0) | |
|-> 1. 0x1438e33e0 (0x285da7100:0) [256x256] 4.667969 1.554688 2.054688 .. | |
|<- 1. 0x1438e33e0 (0x285da7100:0) [256x256] 0.131592 0.005848 0.009644 .. | |
CCV_NNC_GEMM_FORWARD [504]: [2] -> [1] (0) | |
|-> 1. 0x1438e3500 (0x285da7100:0) [1x256x256] 0.131592 0.005848 0.009644 .. | |
|-> 2. 0x1438e3450 (0x285da7140:0) [1x256x160] -0.534180 0.441162 0.400391 .. | |
|<- 1. 0x1438e4640 (0x285da6e00:0) [1x256x160] -0.003521 0.156860 -0.056000 .. | |
CCV_NNC_GEMM_FORWARD [505]: [2] -> [1] (0) | |
|-> 1. 0x1438e3620 (0x285da7080:0) [1x256x160] 0.087830 -0.050659 -0.052521 .. | |
|-> 2. 0x1438e3570 (0x285da7040:0) [1x256x160] -0.844727 -0.783203 -0.423096 .. | |
|<- 1. 0x1438a7d20 (0x285da7100:0) [1x256x256] 1.906250 1.033203 0.901855 .. | |
CCV_NNC_SOFTMAX_FORWARD [506]: [1] -> [1] (0) | |
|-> 1. 0x1438e36d0 (0x285da7100:0) [256x256] 1.906250 1.033203 0.901855 .. | |
|<- 1. 0x1438e36d0 (0x285da7100:0) [256x256] 0.007812 0.003263 0.002861 .. | |
CCV_NNC_GEMM_FORWARD [507]: [2] -> [1] (0) | |
|-> 1. 0x1438e37f0 (0x285da7100:0) [1x256x256] 0.007812 0.003263 0.002861 .. | |
|-> 2. 0x1438e3740 (0x285da7140:0) [1x256x160] 0.654785 -0.521484 0.268311 .. | |
|<- 1. 0x1438e46f0 (0x285da6e00:0) [1x256x160] -0.063782 -0.092041 0.057983 .. | |
CCV_NNC_GEMM_FORWARD [508]: [2] -> [1] (0) | |
|-> 1. 0x1438e3910 (0x285da7080:0) [1x256x160] 0.038544 0.041870 0.012657 .. | |
|-> 2. 0x1438e3860 (0x285da7040:0) [1x256x160] -2.333984 0.066101 -0.386230 .. | |
|<- 1. 0x1438a7d90 (0x285da7100:0) [1x256x256] 5.812500 4.636719 5.191406 .. | |
CCV_NNC_SOFTMAX_FORWARD [509]: [1] -> [1] (0) | |
|-> 1. 0x1438e39c0 (0x285da7100:0) [256x256] 5.812500 4.636719 5.191406 .. | |
|<- 1. 0x1438e39c0 (0x285da7100:0) [256x256] 0.017822 0.005497 0.009575 .. | |
CCV_NNC_GEMM_FORWARD [510]: [2] -> [1] (0) | |
|-> 1. 0x1438e3ae0 (0x285da7100:0) [1x256x256] 0.017822 0.005497 0.009575 .. | |
|-> 2. 0x1438e3a30 (0x285da7140:0) [1x256x160] -0.254150 -0.162598 -0.588867 .. | |
|<- 1. 0x1438e47a0 (0x285da6e00:0) [1x256x160] -0.045349 -0.212646 -0.063049 .. | |
CCV_NNC_GEMM_FORWARD [511]: [2] -> [1] (0) | |
|-> 1. 0x1438e3c00 (0x285da7080:0) [1x256x160] -0.048370 0.008675 0.014503 .. | |
|-> 2. 0x1438e3b50 (0x285da7040:0) [1x256x160] 0.213135 0.942871 0.182495 .. | |
|<- 1. 0x1438a7e00 (0x285da7100:0) [1x256x256] 0.286133 -0.336914 -0.302002 .. | |
CCV_NNC_SOFTMAX_FORWARD [512]: [1] -> [1] (0) | |
|-> 1. 0x1438e3cb0 (0x285da7100:0) [256x256] 0.286133 -0.336914 -0.302002 .. | |
|<- 1. 0x1438e3cb0 (0x285da7100:0) [256x256] 0.007343 0.003937 0.004078 .. | |
CCV_NNC_GEMM_FORWARD [513]: [2] -> [1] (0) | |
|-> 1. 0x1438e3dd0 (0x285da7100:0) [1x256x256] 0.007343 0.003937 0.004078 .. | |
|-> 2. 0x1438e3d20 (0x285da7140:0) [1x256x160] -0.340088 -0.412598 -0.144287 .. | |
|<- 1. 0x1438e4850 (0x285da6e00:0) [1x256x160] -0.008133 0.087646 -0.112488 .. | |
CCV_NNC_TRANSPOSE_FORWARD [514]: [1] -> [1] (0) | |
|-> 1. 0x1438e4900 (0x285da6e00:0) [2x8x256x160] -0.256104 0.208862 0.047241 .. | |
|<- 1. 0x1438a7ee0 (0x285da7140:0) [2x256x8x160] -0.256104 0.208862 0.047241 .. | |
CCV_NNC_GEMM_FORWARD [515]: [3] -> [1] (0) | |
|-> 1. 0x1438e4970 (0x285da7140:0) [2x256x1280] -0.256104 0.208862 0.047241 .. | |
|-> 2. 0x1438c2660 (0x285d87540:0) [1280x1280] -0.033295 -0.005096 0.008888 .. | |
|-> 3. 0x1438c26d0 (0x285d87580:0) [1280] 0.042267 -0.030930 0.017395 .. | |
|<- 1. 0x1438a7f50 (0x285da6e00:0) [2x256x1280] 0.172607 -0.576660 0.459961 .. | |
CCV_NNC_ADD_FORWARD [516]: [2] -> [1] (0) | |
|-> 1. 0x1438a7f50 (0x285da6e00:0) [2x256x1280] 0.172607 -0.576660 0.459961 .. | |
|-> 2. 0x1438e0e40 (0x285da6dc0:0) [2x256x1280] 0.916016 0.061157 0.760742 .. | |
|<- 1. 0x1438a7f50 (0x285da6e00:0) [2x256x1280] 1.088867 -0.515625 1.220703 .. | |
CCV_NNC_LAYER_NORM_FORWARD [517]: [3] -> [3] (0) | |
|-> 1. 0x1438a7f50 (0x285da6e00:0) [2x256x1280] 1.088867 -0.515625 1.220703 .. | |
|-> 2. 0x1438c2740 (0x285d875c0:0) [1x1x1280] 0.298828 0.334473 0.325195 .. | |
|-> 3. 0x1438c27b0 (0x285d87600:0) [1x1x1280] 0.028320 -0.101685 0.016495 .. | |
|<- 1. 0x1438a7fc0 (0x285da6dc0:0) [2x256x1280] 0.471436 -0.338379 0.557129 .. | |
|<- 2. 0x1438a8030 (0x285da6f40:0) [2x256x1] 0.002930 .. | |
|<- 3. 0x1438a80a0 (0x285da6f80:0) [2x256x1] 1.365234 .. | |
CCV_NNC_GEMM_FORWARD [518]: [2] -> [1] (0) | |
|-> 1. 0x1438a7fc0 (0x285da6dc0:0) [2x256x1280] 0.471436 -0.338379 0.557129 .. | |
|-> 2. 0x1438c2820 (0x285d87640:0) [1280x1280] -0.016846 -0.033051 -0.043243 .. | |
|<- 1. 0x1438a8110 (0x285da7140:0) [2x256x1280] 0.489746 1.373047 0.477539 .. | |
CCV_NNC_SCALAR_MUL_FORWARD [519]: [1] -> [1] (0) | |
|-> 1. 0x1438a8110 (0x285da7140:0) [2x256x1280] 0.489746 1.373047 0.477539 .. | |
|<- 1. 0x1438a8110 (0x285da7140:0) [2x256x1280] 0.038696 0.108521 0.037750 .. | |
CCV_NNC_TRANSPOSE_FORWARD [520]: [1] -> [1] (0) | |
|-> 1. 0x1438e4a50 (0x285da7140:0) [2x256x8x160] 0.038696 0.108521 0.037750 .. | |
|<- 1. 0x1438a8260 (0x285da6dc0:0) [2x8x256x160] 0.038696 0.108521 0.037750 .. | |
CCV_NNC_GEMM_FORWARD [521]: [2] -> [1] (0) | |
Wait: (0, 42) | |
|-> 1. 0x1438a8260 (0x285da6dc0:0) [2x8x256x160] 0.038696 0.108521 0.037750 .. | |
|-> 2. 0x1438a81f0 (0x285da71c0:0) [2x8x133x160] -0.213623 0.277832 -0.094299 .. | |
|<- 1. 0x1438a82d0 (0x285da7200:0) [2x8x256x133] 10.367188 2.091797 0.305908 .. | |
CCV_NNC_SOFTMAX_FORWARD [522]: [1] -> [1] (0) | |
|-> 1. 0x1438e4ac0 (0x285da7200:0) [4096x133] 10.367188 2.091797 0.305908 .. | |
|<- 1. 0x1438e4ac0 (0x285da7200:0) [4096x133] 0.488037 0.000124 0.000021 .. | |
CCV_NNC_GEMM_FORWARD [523]: [2] -> [1] (0) | |
Wait: (0, 43) | |
|-> 1. 0x1438e4ba0 (0x285da7200:0) [2x8x256x133] 0.488037 0.000124 0.000021 .. | |
|-> 2. 0x1438a83b0 (0x285da7280:0) [2x8x133x160] -0.006889 -0.040039 0.008888 .. | |
|<- 1. 0x1438a8420 (0x285da6dc0:0) [2x8x256x160] 0.411377 0.048035 0.267090 .. | |
CCV_NNC_TRANSPOSE_FORWARD [524]: [1] -> [1] (0) | |
|-> 1. 0x1438e4c10 (0x285da6dc0:0) [2x8x256x160] 0.411377 0.048035 0.267090 .. | |
|<- 1. 0x1438a8490 (0x285da7140:0) [2x256x8x160] 0.411377 0.048035 0.267090 .. | |
CCV_NNC_GEMM_FORWARD [525]: [3] -> [1] (0) | |
|-> 1. 0x1438e4c80 (0x285da7140:0) [2x256x1280] 0.411377 0.048035 0.267090 .. | |
|-> 2. 0x1438c2970 (0x285d87700:0) [1280x1280] 0.012047 -0.022003 -0.013741 .. | |
|-> 3. 0x1438c29e0 (0x285d87740:0) [1280] 0.027283 -0.020676 0.019165 .. | |
|<- 1. 0x1438a8500 (0x285da7000:0) [2x256x1280] 0.229858 -0.220703 -0.032501 .. | |
CCV_NNC_ADD_FORWARD [526]: [2] -> [1] (0) | |
|-> 1. 0x1438a8500 (0x285da7000:0) [2x256x1280] 0.229858 -0.220703 -0.032501 .. | |
|-> 2. 0x1438a7f50 (0x285da6e00:0) [2x256x1280] 1.088867 -0.515625 1.220703 .. | |
|<- 1. 0x1438a8500 (0x285da7000:0) [2x256x1280] 1.318359 -0.736328 1.188477 .. | |
CCV_NNC_LAYER_NORM_FORWARD [527]: [3] -> [3] (0) | |
|-> 1. 0x1438a8500 (0x285da7000:0) [2x256x1280] 1.318359 -0.736328 1.188477 .. | |
|-> 2. 0x1438c2a50 (0x285d87780:0) [1x1x1280] 0.214355 0.206787 0.204468 .. | |
|-> 3. 0x1438c2ac0 (0x285d877c0:0) [1x1x1280] -0.040192 0.012550 -0.007683 .. | |
|<- 1. 0x1438a8570 (0x285da72c0:0) [2x256x1280] 0.326904 -0.185669 0.307861 .. | |
|<- 2. 0x1438a85e0 (0x285da7300:0) [2x256x1] 0.000971 .. | |
|<- 3. 0x1438a8650 (0x285da7340:0) [2x256x1] 1.299805 .. | |
Emit: (0, 44) | |
CCV_NNC_GEMM_FORWARD [528]: [3] -> [1] (0) | |
|-> 1. 0x1438a8570 (0x285da72c0:0) [2x256x1280] 0.326904 -0.185669 0.307861 .. | |
|-> 2. 0x1438c2b30 (0x285d87800:0) [5120x1280] 0.086304 -0.005783 0.019226 .. | |
|-> 3. 0x1438c2ba0 (0x285d87840:0) [5120] 0.013763 0.002728 0.104187 .. | |
|<- 1. 0x1438a86c0 (0x285da7380:0) [2x256x5120] -0.285889 0.167847 0.058746 .. | |
CCV_NNC_GELU_FORWARD [529]: [1] -> [1] (0) | |
|-> 1. 0x1438a86c0 (0x285da7380:0) [2x256x5120] -0.285889 0.167847 0.058746 .. | |
|<- 1. 0x1438a86c0 (0x285da7380:0) [2x256x5120] -0.110779 0.095093 0.030746 .. | |
CCV_NNC_GEMM_FORWARD [530]: [3] -> [1] (1) | |
Wait: (1, 44) | |
|-> 1. 0x1438a8570 (0x285da72c0:0) [2x256x1280] 0.326904 -0.185669 0.307861 .. | |
|-> 2. 0x1438c2c10 (0x285d87880:0) [5120x1280] -0.046326 -0.024994 -0.023727 .. | |
|-> 3. 0x1438c2c80 (0x285d878c0:0) [5120] 0.017410 -0.023102 0.002996 .. | |
|<- 1. 0x1438a8730 (0x285da5ac0:0) [2x256x5120] 0.425537 -0.358887 0.792480 .. | |
Emit: (1, 45) | |
CCV_NNC_MUL_FORWARD [531]: [2] -> [1] (0) | |
Wait: (0, 45) | |
|-> 1. 0x1438a8730 (0x285da5ac0:0) [2x256x5120] 0.425537 -0.358887 0.792480 .. | |
|-> 2. 0x1438a86c0 (0x285da7380:0) [2x256x5120] -0.110779 0.095093 0.030746 .. | |
|<- 1. 0x1438a8730 (0x285da5ac0:0) [2x256x5120] -0.047150 -0.034119 0.024368 .. | |
CCV_NNC_GEMM_FORWARD [532]: [3] -> [1] (0) | |
|-> 1. 0x1438a8730 (0x285da5ac0:0) [2x256x5120] -0.047150 -0.034119 0.024368 .. | |
|-> 2. 0x1438c2cf0 (0x285d87900:0) [1280x5120] -0.042450 -0.023239 0.037201 .. | |
|-> 3. 0x1438c2d60 (0x285d87940:0) [1280] -0.003574 -0.007950 0.008675 .. | |
|<- 1. 0x1438a87a0 (0x285da72c0:0) [2x256x1280] -1.554688 -0.173950 -1.076172 .. | |
CCV_NNC_ADD_FORWARD [533]: [2] -> [1] (0) | |
|-> 1. 0x1438a87a0 (0x285da72c0:0) [2x256x1280] -1.554688 -0.173950 -1.076172 .. | |
|-> 2. 0x1438a8500 (0x285da7000:0) [2x256x1280] 1.318359 -0.736328 1.188477 .. | |
|<- 1. 0x1438a87a0 (0x285da72c0:0) [2x256x1280] -0.236328 -0.910156 0.112305 .. | |
CCV_NNC_CONVOLUTION_FORWARD [534]: [3] -> [1] (0) | |
|-> 1. 0x1438e4cf0 (0x285da72c0:0) [2x16x16x1280] -0.236328 -0.910156 0.112305 .. | |
|-> 2. 0x1438c2dd0 (0x285d87980:0) [1280x1280x1x1] 0.000402 .. | |
|-> 3. 0x1438c2e40 (0x285d879c0:0) [1280] 0.016434 0.028961 0.004444 .. | |
|<- 1. 0x1438a8810 (0x285da6e00:0) [2x16x16x1280] 2.337891 1.597656 -1.694336 .. | |
CCV_NNC_ADD_FORWARD [535]: [2] -> [1] (0) | |
|-> 1. 0x1438a8810 (0x285da6e00:0) [2x16x16x1280] 2.337891 1.597656 -1.694336 .. | |
|-> 2. 0x1438a7150 (0x285da6f00:0) [2x16x16x1280] -0.341553 0.146973 -0.125977 .. | |
|<- 1. 0x1438f14e0 (0x285da64c0:0) [2x16x16x1280] 1.996094 1.744141 -1.820312 .. | |
CCV_NNC_GROUP_NORM_FORWARD [536]: [3] -> [3] (0) | |
|-> 1. 0x1438f14e0 (0x285da64c0:0) [2x16x16x1280] 1.996094 1.744141 -1.820312 .. | |
|-> 2. 0x1438c2eb0 (0x285d87a00:0) [1x1x1x1280] 0.333008 0.327637 0.387939 .. | |
|-> 3. 0x1438c2f20 (0x285d87a40:0) [1x1x1x1280] -0.034149 -0.050507 -0.072388 .. | |
|<- 1. 0x1438a8880 (0x285da6e00:0) [2x16x16x1280] 0.492676 0.400391 -0.667969 .. | |
|<- 2. 0x1438a88f0 (0x285da73c0:0) [2x1x1x32] 0.059357 -0.062683 -0.005947 .. | |
|<- 3. 0x1438a8960 (0x285da7400:0) [2x1x1x32] 0.816895 0.872070 0.783691 .. | |
CCV_NNC_SWISH_FORWARD [537]: [1] -> [1] (0) | |
|-> 1. 0x1438a8880 (0x285da6e00:0) [2x16x16x1280] 0.492676 0.400391 -0.667969 .. | |
|<- 1. 0x1438a8880 (0x285da6e00:0) [2x16x16x1280] 0.305908 0.239746 -0.226440 .. | |
CCV_NNC_CONVOLUTION_FORWARD [538]: [3] -> [1] (0) | |
|-> 1. 0x1438a8880 (0x285da6e00:0) [2x16x16x1280] 0.305908 0.239746 -0.226440 .. | |
|-> 2. 0x1438c3070 (0x285d87b00:0) [1280x1280x3x3] -0.036163 0.019897 0.004116 .. | |
|-> 3. 0x1438c30e0 (0x285d87b40:0) [1280] 0.052185 -0.014023 0.033203 .. | |
|<- 1. 0x1438a8a40 (0x285da6f00:0) [2x16x16x1280] -0.425781 -0.730957 -0.226562 .. | |
CCV_NNC_ADD_FORWARD [539]: [2] -> [1] (0) | |
Wait: (0, 46) | |
|-> 1. 0x1438a8a40 (0x285da6f00:0) [2x16x16x1280] -0.425781 -0.730957 -0.226562 .. | |
|-> 2. 0x1438e4d60 (0x285da7440:0) [2x1x1x1280] 0.601562 -0.082703 0.705078 .. | |
|<- 1. 0x1438a8a40 (0x285da6f00:0) [2x16x16x1280] 0.175781 -0.813477 0.478516 .. | |
CCV_NNC_GROUP_NORM_FORWARD [540]: [3] -> [3] (0) | |
|-> 1. 0x1438a8a40 (0x285da6f00:0) [2x16x16x1280] 0.175781 -0.813477 0.478516 .. | |
|-> 2. 0x1438c3150 (0x285d87b80:0) [1x1x1x1280] 0.284668 0.658203 0.624023 .. | |
|-> 3. 0x1438c31c0 (0x285d87bc0:0) [1x1x1x1280] -0.110962 -0.154785 -0.171997 .. | |
|<- 1. 0x1438a8ab0 (0x285da6e00:0) [2x16x16x1280] -0.144409 -0.709473 -0.106750 .. | |
|<- 2. 0x1438a8b20 (0x285da6800:0) [2x1x1x32] 0.335938 0.340576 0.368408 .. | |
|<- 3. 0x1438a8b90 (0x285da67c0:0) [2x1x1x32] 0.733398 0.658691 0.897461 .. | |
CCV_NNC_SWISH_FORWARD [541]: [1] -> [1] (0) | |
|-> 1. 0x1438a8ab0 (0x285da6e00:0) [2x16x16x1280] -0.144409 -0.709473 -0.106750 .. | |
|<- 1. 0x1438a8ab0 (0x285da6e00:0) [2x16x16x1280] -0.067017 -0.233887 -0.050537 .. | |
CCV_NNC_CONVOLUTION_FORWARD [542]: [3] -> [1] (0) | |
|-> 1. 0x1438a8ab0 (0x285da6e00:0) [2x16x16x1280] -0.067017 -0.233887 -0.050537 .. | |
|-> 2. 0x1438c3230 (0x285d87c00:0) [1280x1280x3x3] -0.012634 0.007359 -0.021210 .. | |
|-> 3. 0x1438c32a0 (0x285d87c40:0) [1280] 0.004417 -0.009216 0.003883 .. | |
|<- 1. 0x1438a8c00 (0x285da6dc0:0) [2x16x16x1280] -0.556152 0.048492 -0.749023 .. | |
CCV_NNC_ADD_FORWARD [543]: [2] -> [1] (0) | |
|-> 1. 0x1438f14e0 (0x285da64c0:0) [2x16x16x1280] 1.996094 1.744141 -1.820312 .. | |
|-> 2. 0x1438a8c00 (0x285da6dc0:0) [2x16x16x1280] -0.556152 0.048492 -0.749023 .. | |
|<- 1. 0x1438a8c70 (0x285da6f00:0) [2x16x16x1280] 1.439453 1.792969 -2.570312 .. | |
CCV_NNC_GROUP_NORM_FORWARD [544]: [3] -> [3] (0) | |
|-> 1. 0x1438a8c70 (0x285da6f00:0) [2x16x16x1280] 1.439453 1.792969 -2.570312 .. | |
|-> 2. 0x1438c3310 (0x285d87c80:0) [1x1x1x1280] 0.274902 0.281982 0.277588 .. | |
|-> 3. 0x1438c3380 (0x285d87cc0:0) [1x1x1x1280] -0.027802 0.013046 -0.012108 .. | |
|<- 1. 0x1438a8ce0 (0x285da6dc0:0) [2x16x16x1280] 0.266113 0.388184 -0.538086 .. | |
|<- 2. 0x1438a8d50 (0x285da6100:0) [2x1x1x32] -0.006233 -0.164307 -0.001076 .. | |
|<- 3. 0x1438a8dc0 (0x285da6140:0) [2x1x1x32] 0.739258 0.812500 0.757812 .. | |
CCV_NNC_CONVOLUTION_FORWARD [545]: [3] -> [1] (0) | |
|-> 1. 0x1438a8ce0 (0x285da6dc0:0) [2x16x16x1280] 0.266113 0.388184 -0.538086 .. | |
|-> 2. 0x1438c33f0 (0x285d87d00:0) [1280x1280x1x1] -0.043732 .. | |
|-> 3. 0x1438c3460 (0x285d87d40:0) [1280] -0.055511 0.011642 0.023346 .. | |
|<- 1. 0x1438a8e30 (0x285da6e00:0) [2x16x16x1280] -0.364502 -0.283447 0.436768 .. | |
CCV_NNC_LAYER_NORM_FORWARD [546]: [3] -> [3] (0) | |
|-> 1. 0x1438e4dd0 (0x285da6e00:0) [2x256x1280] -0.364502 -0.283447 0.436768 .. | |
|-> 2. 0x1438c34d0 (0x285d87d80:0) [1x1x1280] 0.291748 0.307373 0.281494 .. | |
|-> 3. 0x1438c3540 (0x285d87dc0:0) [1x1x1280] 0.017899 0.019028 -0.010086 .. | |
|<- 1. 0x1438a8ea0 (0x285da6dc0:0) [2x256x1280] -0.095398 -0.074036 0.118713 .. | |
|<- 2. 0x1438a8f10 (0x285da7480:0) [2x256x1] 0.003412 .. | |
|<- 3. 0x1438a8f80 (0x285da74c0:0) [2x256x1] 1.055664 .. | |
Emit: (0, 47) | |
CCV_NNC_GEMM_FORWARD [547]: [2] -> [1] (0) | |
|-> 1. 0x1438a8ea0 (0x285da6dc0:0) [2x256x1280] -0.095398 -0.074036 0.118713 .. | |
|-> 2. 0x1438c35b0 (0x285d87e00:0) [1280x1280] -0.015358 0.006359 -0.070374 .. | |
|<- 1. 0x1438a8ff0 (0x285da7040:0) [2x256x1280] 0.133667 1.254883 -0.314697 .. | |
CCV_NNC_SCALAR_MUL_FORWARD [548]: [1] -> [1] (0) | |
|-> 1. 0x1438a8ff0 (0x285da7040:0) [2x256x1280] 0.133667 1.254883 -0.314697 .. | |
|<- 1. 0x1438a8ff0 (0x285da7040:0) [2x256x1280] 0.010567 0.099182 -0.024872 .. | |
CCV_NNC_TRANSPOSE_FORWARD [549]: [1] -> [1] (0) | |
|-> 1. 0x1438e4eb0 (0x285da7040:0) [2x256x8x160] 0.010567 0.099182 -0.024872 .. | |
|<- 1. 0x1438a9140 (0x285da70c0:0) [2x8x256x160] 0.010567 0.099182 -0.024872 .. | |
CCV_NNC_GEMM_FORWARD [550]: [2] -> [1] (1) | |
Wait: (1, 47) | |
|-> 1. 0x1438a8ea0 (0x285da6dc0:0) [2x256x1280] -0.095398 -0.074036 0.118713 .. | |
|-> 2. 0x1438c3620 (0x285d87e40:0) [1280x1280] 0.025864 0.021133 0.003876 .. | |
|<- 1. 0x1438a9060 (0x285da7080:0) [2x256x1280] -2.302734 -0.755371 -2.503906 .. | |
CCV_NNC_TRANSPOSE_FORWARD [551]: [1] -> [1] (1) | |
|-> 1. 0x1438e4e40 (0x285da7080:0) [2x256x8x160] -2.302734 -0.755371 -2.503906 .. | |
|<- 1. 0x1438a90d0 (0x285da7500:0) [2x8x256x160] -2.302734 -0.755371 -2.503906 .. | |
Emit: (1, 48) | |
CCV_NNC_GEMM_FORWARD [552]: [2] -> [1] (2) | |
Wait: (2, 47) | |
|-> 1. 0x1438a8ea0 (0x285da6dc0:0) [2x256x1280] -0.095398 -0.074036 0.118713 .. | |
|-> 2. 0x1438c3690 (0x285d87e80:0) [1280x1280] 0.038574 -0.058319 -0.039154 .. | |
|<- 1. 0x1438a91b0 (0x285da7140:0) [2x256x1280] -0.527344 0.304688 -0.289795 .. | |
CCV_NNC_TRANSPOSE_FORWARD [553]: [1] -> [1] (2) | |
|-> 1. 0x1438e5000 (0x285da7140:0) [2x256x8x160] -0.527344 0.304688 -0.289795 .. | |
|<- 1. 0x1438a9290 (0x285da6fc0:0) [2x8x256x160] -0.527344 0.304688 -0.289795 .. | |
Emit: (2, 49) | |
CCV_NNC_GEMM_FORWARD [554]: [2] -> [1] (0) | |
Wait: (0, 48) | |
|-> 1. 0x1438e4f90 (0x285da70c0:0) [1x256x160] 0.010567 0.099182 -0.024872 .. | |
|-> 2. 0x1438e4f20 (0x285da7500:0) [1x256x160] -2.302734 -0.755371 -2.503906 .. | |
|<- 1. 0x1438a9220 (0x285da7540:0) [1x256x256] 4.894531 2.089844 2.791016 .. | |
CCV_NNC_SOFTMAX_FORWARD [555]: [1] -> [1] (0) | |
|-> 1. 0x1438e5070 (0x285da7540:0) [256x256] 4.894531 2.089844 2.791016 .. | |
|<- 1. 0x1438e5070 (0x285da7540:0) [256x256] 0.150513 0.009109 0.018372 .. | |
CCV_NNC_GEMM_FORWARD [556]: [2] -> [1] (0) | |
Wait: (0, 49) | |
|-> 1. 0x1438e5150 (0x285da7540:0) [1x256x256] 0.150513 0.009109 0.018372 .. | |
|-> 2. 0x1438e50e0 (0x285da6fc0:0) [1x256x160] -0.527344 0.304688 -0.289795 .. | |
|<- 1. 0x1438e7dd0 (0x285da6dc0:0) [1x256x160] -0.100159 0.029770 -0.032318 .. | |
CCV_NNC_GEMM_FORWARD [557]: [2] -> [1] (0) | |
|-> 1. 0x1438e5270 (0x285da70c0:0) [1x256x160] 0.060364 -0.017807 -0.125244 .. | |
|-> 2. 0x1438e51c0 (0x285da7500:0) [1x256x160] -0.488770 0.827637 -0.550293 .. | |
|<- 1. 0x1438a9300 (0x285da7580:0) [1x256x256] 3.794922 2.361328 2.544922 .. | |
CCV_NNC_SOFTMAX_FORWARD [558]: [1] -> [1] (0) | |
|-> 1. 0x1438e5320 (0x285da7580:0) [256x256] 3.794922 2.361328 2.544922 .. | |
|<- 1. 0x1438e5320 (0x285da7580:0) [256x256] 0.053955 0.012863 0.015457 .. | |
CCV_NNC_GEMM_FORWARD [559]: [2] -> [1] (0) | |
|-> 1. 0x1438e5440 (0x285da7580:0) [1x256x256] 0.053955 0.012863 0.015457 .. | |
|-> 2. 0x1438e5390 (0x285da6fc0:0) [1x256x160] 1.671875 -0.443359 -0.339600 .. | |
|<- 1. 0x1438e7e40 (0x285da6dc0:0) [1x256x160] 0.442627 -0.208984 0.044159 .. | |
CCV_NNC_GEMM_FORWARD [560]: [2] -> [1] (0) | |
|-> 1. 0x1438e5560 (0x285da70c0:0) [1x256x160] -0.029770 0.065918 -0.002853 .. | |
|-> 2. 0x1438e54b0 (0x285da7500:0) [1x256x160] -0.056305 0.210815 -0.447021 .. | |
|<- 1. 0x1438a9370 (0x285da7580:0) [1x256x256] 0.416992 0.937988 1.477539 .. | |
CCV_NNC_SOFTMAX_FORWARD [561]: [1] -> [1] (0) | |
|-> 1. 0x1438e5610 (0x285da7580:0) [256x256] 0.416992 0.937988 1.477539 .. | |
|<- 1. 0x1438e5610 (0x285da7580:0) [256x256] 0.004230 0.007122 0.012215 .. | |
CCV_NNC_GEMM_FORWARD [562]: [2] -> [1] (0) | |
|-> 1. 0x1438e5730 (0x285da7580:0) [1x256x256] 0.004230 0.007122 0.012215 .. | |
|-> 2. 0x1438e5680 (0x285da6fc0:0) [1x256x160] 0.977051 0.479736 -0.059082 .. | |
|<- 1. 0x1438e7ef0 (0x285da6dc0:0) [1x256x160] 0.174927 0.110413 -0.197388 .. | |
CCV_NNC_GEMM_FORWARD [563]: [2] -> [1] (0) | |
|-> 1. 0x1438e5850 (0x285da70c0:0) [1x256x160] 0.001321 -0.062500 -0.055420 .. | |
|-> 2. 0x1438e57a0 (0x285da7500:0) [1x256x160] -0.796387 1.776367 -1.452148 .. | |
|<- 1. 0x1438a93e0 (0x285da7580:0) [1x256x256] 4.015625 2.263672 1.491211 .. | |
CCV_NNC_SOFTMAX_FORWARD [564]: [1] -> [1] (0) | |
|-> 1. 0x1438e5900 (0x285da7580:0) [256x256] 4.015625 2.263672 1.491211 .. | |
|<- 1. 0x1438e5900 (0x285da7580:0) [256x256] 0.096619 0.016754 0.007740 .. | |
CCV_NNC_GEMM_FORWARD [565]: [2] -> [1] (0) | |
|-> 1. 0x1438e5a20 (0x285da7580:0) [1x256x256] 0.096619 0.016754 0.007740 .. | |
|-> 2. 0x1438e5970 (0x285da6fc0:0) [1x256x160] -0.647949 0.601562 -0.448486 .. | |
|<- 1. 0x1438e7fa0 (0x285da6dc0:0) [1x256x160] -0.178589 0.133667 -0.261475 .. | |
CCV_NNC_GEMM_FORWARD [566]: [2] -> [1] (0) | |
|-> 1. 0x1438e5b40 (0x285da70c0:0) [1x256x160] 0.036041 -0.091003 -0.021805 .. | |
|-> 2. 0x1438e5a90 (0x285da7500:0) [1x256x160] 1.529297 -0.785156 -0.509766 .. | |
|<- 1. 0x1438a9450 (0x285da7580:0) [1x256x256] 1.646484 0.920410 0.490479 .. | |
CCV_NNC_SOFTMAX_FORWARD [567]: [1] -> [1] (0) | |
|-> 1. 0x1438e5bf0 (0x285da7580:0) [256x256] 1.646484 0.920410 0.490479 .. | |
|<- 1. 0x1438e5bf0 (0x285da7580:0) [256x256] 0.013008 0.006290 0.004093 .. | |
CCV_NNC_GEMM_FORWARD [568]: [2] -> [1] (0) | |
|-> 1. 0x1438e5d10 (0x285da7580:0) [1x256x256] 0.013008 0.006290 0.004093 .. | |
|-> 2. 0x1438e5c60 (0x285da6fc0:0) [1x256x160] 0.245117 -0.159668 -0.031799 .. | |
|<- 1. 0x1438e8050 (0x285da6dc0:0) [1x256x160] 0.120544 0.106873 -0.191162 .. | |
CCV_NNC_GEMM_FORWARD [569]: [2] -> [1] (0) | |
|-> 1. 0x1438e5e30 (0x285da70c0:0) [1x256x160] -0.022400 -0.059692 0.108887 .. | |
|-> 2. 0x1438e5d80 (0x285da7500:0) [1x256x160] 2.158203 -0.620117 -0.736328 .. | |
|<- 1. 0x1438a94c0 (0x285da7580:0) [1x256x256] 4.046875 2.863281 2.845703 .. | |
CCV_NNC_SOFTMAX_FORWARD [570]: [1] -> [1] (0) | |
|-> 1. 0x1438e5ee0 (0x285da7580:0) [256x256] 4.046875 2.863281 2.845703 .. | |
|<- 1. 0x1438e5ee0 (0x285da7580:0) [256x256] 0.064026 0.019608 0.019257 .. | |
CCV_NNC_GEMM_FORWARD [571]: [2] -> [1] (0) | |
|-> 1. 0x1438e6000 (0x285da7580:0) [1x256x256] 0.064026 0.019608 0.019257 .. | |
|-> 2. 0x1438e5f50 (0x285da6fc0:0) [1x256x160] -0.402588 0.544922 0.652344 .. | |
|<- 1. 0x1438e8100 (0x285da6dc0:0) [1x256x160] -0.246094 0.122498 0.167969 .. | |
CCV_NNC_GEMM_FORWARD [572]: [2] -> [1] (0) | |
|-> 1. 0x1438e6120 (0x285da70c0:0) [1x256x160] -0.048553 0.041901 -0.054443 .. | |
|-> 2. 0x1438e6070 (0x285da7500:0) [1x256x160] -0.235596 -1.250977 0.411621 .. | |
|<- 1. 0x1438a9530 (0x285da7580:0) [1x256x256] 2.195312 0.461914 1.040039 .. | |
CCV_NNC_SOFTMAX_FORWARD [573]: [1] -> [1] (0) | |
|-> 1. 0x1438e61d0 (0x285da7580:0) [256x256] 2.195312 0.461914 1.040039 .. | |
|<- 1. 0x1438e61d0 (0x285da7580:0) [256x256] 0.025986 0.004593 0.008186 .. | |
CCV_NNC_GEMM_FORWARD [574]: [2] -> [1] (0) | |
|-> 1. 0x1438e62f0 (0x285da7580:0) [1x256x256] 0.025986 0.004593 0.008186 .. | |
|-> 2. 0x1438e6240 (0x285da6fc0:0) [1x256x160] 0.405029 0.111938 -0.727539 .. | |
|<- 1. 0x1438e81b0 (0x285da6dc0:0) [1x256x160] 0.085144 0.086792 -0.215942 .. | |
CCV_NNC_GEMM_FORWARD [575]: [2] -> [1] (0) | |
|-> 1. 0x1438e6410 (0x285da70c0:0) [1x256x160] -0.049408 -0.056091 0.026978 .. | |
|-> 2. 0x1438e6360 (0x285da7500:0) [1x256x160] 0.274902 1.085938 0.201660 .. | |
|<- 1. 0x1438a95a0 (0x285da7580:0) [1x256x256] 0.449463 -0.291992 0.279297 .. | |
CCV_NNC_SOFTMAX_FORWARD [576]: [1] -> [1] (0) | |
|-> 1. 0x1438e64c0 (0x285da7580:0) [256x256] 0.449463 -0.291992 0.279297 .. | |
|<- 1. 0x1438e64c0 (0x285da7580:0) [256x256] 0.007122 0.003393 0.006008 .. | |
CCV_NNC_GEMM_FORWARD [577]: [2] -> [1] (0) | |
|-> 1. 0x1438e65e0 (0x285da7580:0) [1x256x256] 0.007122 0.003393 0.006008 .. | |
|-> 2. 0x1438e6530 (0x285da6fc0:0) [1x256x160] -0.062256 -0.687988 0.006107 .. | |
|<- 1. 0x1438e8260 (0x285da6dc0:0) [1x256x160] 0.142456 0.228638 0.217896 .. | |
CCV_NNC_GEMM_FORWARD [578]: [2] -> [1] (0) | |
|-> 1. 0x1438e6700 (0x285da70c0:0) [1x256x160] 0.006504 0.094727 0.000420 .. | |
|-> 2. 0x1438e6650 (0x285da7500:0) [1x256x160] -1.830078 -0.961914 -2.369141 .. | |
|<- 1. 0x1438a9610 (0x285da7580:0) [1x256x256] 3.703125 1.928711 2.630859 .. | |
CCV_NNC_SOFTMAX_FORWARD [579]: [1] -> [1] (0) | |
|-> 1. 0x1438e67b0 (0x285da7580:0) [256x256] 3.703125 1.928711 2.630859 .. | |
|<- 1. 0x1438e67b0 (0x285da7580:0) [256x256] 0.064453 0.010925 0.022049 .. | |
CCV_NNC_GEMM_FORWARD [580]: [2] -> [1] (0) | |
|-> 1. 0x1438e68d0 (0x285da7580:0) [1x256x256] 0.064453 0.010925 0.022049 .. | |
|-> 2. 0x1438e6820 (0x285da6fc0:0) [1x256x160] 0.068298 0.421387 -0.546875 .. | |
|<- 1. 0x1438e8310 (0x285da6dc0:0) [1x256x160] 0.269287 0.084229 -0.165527 .. | |
CCV_NNC_GEMM_FORWARD [581]: [2] -> [1] (0) | |
|-> 1. 0x1438e69f0 (0x285da70c0:0) [1x256x160] 0.027283 -0.056458 -0.107361 .. | |
|-> 2. 0x1438e6940 (0x285da7500:0) [1x256x160] -0.593750 0.997559 -0.401367 .. | |
|<- 1. 0x1438a9680 (0x285da7580:0) [1x256x256] 3.335938 2.433594 2.679688 .. | |
CCV_NNC_SOFTMAX_FORWARD [582]: [1] -> [1] (0) | |
|-> 1. 0x1438e6aa0 (0x285da7580:0) [256x256] 3.335938 2.433594 2.679688 .. | |
|<- 1. 0x1438e6aa0 (0x285da7580:0) [256x256] 0.029083 0.011795 0.015083 .. | |
CCV_NNC_GEMM_FORWARD [583]: [2] -> [1] (0) | |
|-> 1. 0x1438e6bc0 (0x285da7580:0) [1x256x256] 0.029083 0.011795 0.015083 .. | |
|-> 2. 0x1438e6b10 (0x285da6fc0:0) [1x256x160] 1.571289 -0.274170 -0.147339 .. | |
|<- 1. 0x1438e83c0 (0x285da6dc0:0) [1x256x160] 0.405029 -0.203491 0.009926 .. | |
CCV_NNC_GEMM_FORWARD [584]: [2] -> [1] (0) | |
|-> 1. 0x1438e6ce0 (0x285da70c0:0) [1x256x160] -0.041870 0.017044 0.002636 .. | |
|-> 2. 0x1438e6c30 (0x285da7500:0) [1x256x160] 0.144165 0.397949 -0.394287 .. | |
|<- 1. 0x1438a96f0 (0x285da7580:0) [1x256x256] 0.147827 0.866211 1.292969 .. | |
CCV_NNC_SOFTMAX_FORWARD [585]: [1] -> [1] (0) | |
|-> 1. 0x1438e6d90 (0x285da7580:0) [256x256] 0.147827 0.866211 1.292969 .. | |
|<- 1. 0x1438e6d90 (0x285da7580:0) [256x256] 0.003628 0.007442 0.011406 .. | |
CCV_NNC_GEMM_FORWARD [586]: [2] -> [1] (0) | |
|-> 1. 0x1438e6eb0 (0x285da7580:0) [1x256x256] 0.003628 0.007442 0.011406 .. | |
|-> 2. 0x1438e6e00 (0x285da6fc0:0) [1x256x160] 0.803711 0.322998 0.055878 .. | |
|<- 1. 0x1438e8470 (0x285da6dc0:0) [1x256x160] 0.079590 -0.215210 -0.254395 .. | |
CCV_NNC_GEMM_FORWARD [587]: [2] -> [1] (0) | |
|-> 1. 0x1438e6fd0 (0x285da70c0:0) [1x256x160] -0.017853 -0.044434 -0.070007 .. | |
|-> 2. 0x1438e6f20 (0x285da7500:0) [1x256x160] -0.208130 1.618164 -0.839355 .. | |
|<- 1. 0x1438a9760 (0x285da7580:0) [1x256x256] 3.435547 2.369141 2.031250 .. | |
CCV_NNC_SOFTMAX_FORWARD [588]: [1] -> [1] (0) | |
|-> 1. 0x1438e7080 (0x285da7580:0) [256x256] 3.435547 2.369141 2.031250 .. | |
|<- 1. 0x1438e7080 (0x285da7580:0) [256x256] 0.050537 0.017395 0.012405 .. | |
CCV_NNC_GEMM_FORWARD [589]: [2] -> [1] (0) | |
|-> 1. 0x1438e71a0 (0x285da7580:0) [1x256x256] 0.050537 0.017395 0.012405 .. | |
|-> 2. 0x1438e70f0 (0x285da6fc0:0) [1x256x160] -0.221924 0.450928 -0.369873 .. | |
|<- 1. 0x1438e8520 (0x285da6dc0:0) [1x256x160] -0.151733 -0.010597 -0.077820 .. | |
CCV_NNC_GEMM_FORWARD [590]: [2] -> [1] (0) | |
|-> 1. 0x1438e72c0 (0x285da70c0:0) [1x256x160] 0.013718 -0.084595 -0.019669 .. | |
|-> 2. 0x1438e7210 (0x285da7500:0) [1x256x160] 1.333984 -0.531250 -0.787109 .. | |
|<- 1. 0x1438a97d0 (0x285da7580:0) [1x256x256] 1.380859 0.741211 0.596680 .. | |
CCV_NNC_SOFTMAX_FORWARD [591]: [1] -> [1] (0) | |
|-> 1. 0x1438e7370 (0x285da7580:0) [256x256] 1.380859 0.741211 0.596680 .. | |
|<- 1. 0x1438e7370 (0x285da7580:0) [256x256] 0.011063 0.005833 0.005051 .. | |
CCV_NNC_GEMM_FORWARD [592]: [2] -> [1] (0) | |
|-> 1. 0x1438e7490 (0x285da7580:0) [1x256x256] 0.011063 0.005833 0.005051 .. | |
|-> 2. 0x1438e73e0 (0x285da6fc0:0) [1x256x160] 0.061432 0.197632 0.123413 .. | |
|<- 1. 0x1438e85d0 (0x285da6dc0:0) [1x256x160] -0.003710 0.210205 -0.161499 .. | |
CCV_NNC_GEMM_FORWARD [593]: [2] -> [1] (0) | |
|-> 1. 0x1438e75b0 (0x285da70c0:0) [1x256x160] -0.015137 -0.041901 0.080566 .. | |
|-> 2. 0x1438e7500 (0x285da7500:0) [1x256x160] 1.485352 -0.556152 -0.729004 .. | |
|<- 1. 0x1438a9840 (0x285da7580:0) [1x256x256] 3.076172 2.332031 2.509766 .. | |
CCV_NNC_SOFTMAX_FORWARD [594]: [1] -> [1] (0) | |
|-> 1. 0x1438e7660 (0x285da7580:0) [256x256] 3.076172 2.332031 2.509766 .. | |
|<- 1. 0x1438e7660 (0x285da7580:0) [256x256] 0.037445 0.017792 0.021240 .. | |
CCV_NNC_GEMM_FORWARD [595]: [2] -> [1] (0) | |
|-> 1. 0x1438e7780 (0x285da7580:0) [1x256x256] 0.037445 0.017792 0.021240 .. | |
|-> 2. 0x1438e76d0 (0x285da6fc0:0) [1x256x160] -0.040405 0.395996 0.506348 .. | |
|<- 1. 0x1438e8680 (0x285da6dc0:0) [1x256x160] 0.000468 0.043640 -0.069946 .. | |
CCV_NNC_GEMM_FORWARD [596]: [2] -> [1] (0) | |
|-> 1. 0x1438e78a0 (0x285da70c0:0) [1x256x160] -0.033600 0.044037 -0.009346 .. | |
|-> 2. 0x1438e77f0 (0x285da7500:0) [1x256x160] -0.108948 -1.175781 0.637207 .. | |
|<- 1. 0x1438a98b0 (0x285da7580:0) [1x256x256] 1.259766 0.194092 0.427246 .. | |
CCV_NNC_SOFTMAX_FORWARD [597]: [1] -> [1] (0) | |
|-> 1. 0x1438e7950 (0x285da7580:0) [256x256] 1.259766 0.194092 0.427246 .. | |
|<- 1. 0x1438e7950 (0x285da7580:0) [256x256] 0.014397 0.004959 0.006260 .. | |
CCV_NNC_GEMM_FORWARD [598]: [2] -> [1] (0) | |
|-> 1. 0x1438e7a70 (0x285da7580:0) [1x256x256] 0.014397 0.004959 0.006260 .. | |
|-> 2. 0x1438e79c0 (0x285da6fc0:0) [1x256x160] 0.186890 -0.200806 -0.648438 .. | |
|<- 1. 0x1438e8730 (0x285da6dc0:0) [1x256x160] 0.004116 -0.114197 -0.297119 .. | |
CCV_NNC_GEMM_FORWARD [599]: [2] -> [1] (0) | |
|-> 1. 0x1438e7b90 (0x285da70c0:0) [1x256x160] -0.020721 -0.068787 0.010681 .. | |
|-> 2. 0x1438e7ae0 (0x285da7500:0) [1x256x160] 0.197998 0.843262 0.037109 .. | |
|<- 1. 0x1438a9920 (0x285da7580:0) [1x256x256] 0.241943 -0.459473 0.271729 .. | |
CCV_NNC_SOFTMAX_FORWARD [600]: [1] -> [1] (0) | |
|-> 1. 0x1438e7c40 (0x285da7580:0) [256x256] 0.241943 -0.459473 0.271729 .. | |
|<- 1. 0x1438e7c40 (0x285da7580:0) [256x256] 0.005272 0.002615 0.005432 .. | |
CCV_NNC_GEMM_FORWARD [601]: [2] -> [1] (0) | |
|-> 1. 0x1438e7d60 (0x285da7580:0) [1x256x256] 0.005272 0.002615 0.005432 .. | |
|-> 2. 0x1438e7cb0 (0x285da6fc0:0) [1x256x160] -0.120789 -0.682129 0.342041 .. | |
|<- 1. 0x1438e87e0 (0x285da6dc0:0) [1x256x160] -0.112000 0.312012 0.225830 .. | |
CCV_NNC_TRANSPOSE_FORWARD [602]: [1] -> [1] (0) | |
|-> 1. 0x1438e8890 (0x285da6dc0:0) [2x8x256x160] -0.100159 0.029770 -0.032318 .. | |
|<- 1. 0x1438a9a00 (0x285da6fc0:0) [2x256x8x160] -0.100159 0.029770 -0.032318 .. | |
CCV_NNC_GEMM_FORWARD [603]: [3] -> [1] (0) | |
|-> 1. 0x1438e8900 (0x285da6fc0:0) [2x256x1280] -0.100159 0.029770 -0.032318 .. | |
|-> 2. 0x1438c3700 (0x285d87ec0:0) [1280x1280] -0.012550 0.027084 -0.008194 .. | |
|-> 3. 0x1438c3770 (0x285d87f00:0) [1280] -0.020645 -0.020111 0.022873 .. | |
|<- 1. 0x1438a9a70 (0x285da6dc0:0) [2x256x1280] -0.150757 -0.070435 0.160278 .. | |
CCV_NNC_ADD_FORWARD [604]: [2] -> [1] (0) | |
|-> 1. 0x1438a9a70 (0x285da6dc0:0) [2x256x1280] -0.150757 -0.070435 0.160278 .. | |
|-> 2. 0x1438e4dd0 (0x285da6e00:0) [2x256x1280] -0.364502 -0.283447 0.436768 .. | |
|<- 1. 0x1438a9a70 (0x285da6dc0:0) [2x256x1280] -0.515137 -0.354004 0.597168 .. | |
CCV_NNC_LAYER_NORM_FORWARD [605]: [3] -> [3] (0) | |
|-> 1. 0x1438a9a70 (0x285da6dc0:0) [2x256x1280] -0.515137 -0.354004 0.597168 .. | |
|-> 2. 0x1438c37e0 (0x285d87f40:0) [1x1x1280] 0.366943 0.374268 0.404053 .. | |
|-> 3. 0x1438c3850 (0x285d87f80:0) [1x1x1280] 0.053497 0.086670 0.045715 .. | |
|<- 1. 0x1438a9ae0 (0x285da6e00:0) [2x256x1280] -0.168701 -0.067566 0.340820 .. | |
|<- 2. 0x1438a9b50 (0x285da75c0:0) [2x256x1] -0.010880 .. | |
|<- 3. 0x1438a9bc0 (0x285da7600:0) [2x256x1] 1.201172 .. | |
CCV_NNC_GEMM_FORWARD [606]: [2] -> [1] (0) | |
|-> 1. 0x1438a9ae0 (0x285da6e00:0) [2x256x1280] -0.168701 -0.067566 0.340820 .. | |
|-> 2. 0x1438c38c0 (0x285d87fc0:0) [1280x1280] -0.109070 -0.095642 0.015358 .. | |
|<- 1. 0x1438a9c30 (0x285da6fc0:0) [2x256x1280] -0.723145 0.180664 -1.426758 .. | |
CCV_NNC_SCALAR_MUL_FORWARD [607]: [1] -> [1] (0) | |
|-> 1. 0x1438a9c30 (0x285da6fc0:0) [2x256x1280] -0.723145 0.180664 -1.426758 .. | |
|<- 1. 0x1438a9c30 (0x285da6fc0:0) [2x256x1280] -0.057159 0.014282 -0.112793 .. | |
CCV_NNC_TRANSPOSE_FORWARD [608]: [1] -> [1] (0) | |
|-> 1. 0x1438e89e0 (0x285da6fc0:0) [2x256x8x160] -0.057159 0.014282 -0.112793 .. | |
|<- 1. 0x1438a9d80 (0x285da6e00:0) [2x8x256x160] -0.057159 0.014282 -0.112793 .. | |
CCV_NNC_GEMM_FORWARD [609]: [2] -> [1] (0) | |
Wait: (0, 50) | |
|-> 1. 0x1438a9d80 (0x285da6e00:0) [2x8x256x160] -0.057159 0.014282 -0.112793 .. | |
|-> 2. 0x1438a9d10 (0x285da7680:0) [2x8x133x160] 0.191650 0.108704 -0.219238 .. | |
|<- 1. 0x1438a9df0 (0x285da76c0:0) [2x8x256x133] 5.523438 -2.220703 1.056641 .. | |
CCV_NNC_SOFTMAX_FORWARD [610]: [1] -> [1] (0) | |
|-> 1. 0x1438e8a50 (0x285da76c0:0) [4096x133] 5.523438 -2.220703 1.056641 .. | |
|<- 1. 0x1438e8a50 (0x285da76c0:0) [4096x133] 0.313232 0.000136 0.003597 .. | |
CCV_NNC_GEMM_FORWARD [611]: [2] -> [1] (0) | |
Wait: (0, 51) | |
|-> 1. 0x1438e8b30 (0x285da76c0:0) [2x8x256x133] 0.313232 0.000136 0.003597 .. | |
|-> 2. 0x1438a9ed0 (0x285da7740:0) [2x8x133x160] -0.091675 0.026260 0.035645 .. | |
|<- 1. 0x1438a9f40 (0x285da6e00:0) [2x8x256x160] -0.397217 -0.514160 -0.087708 .. | |
CCV_NNC_TRANSPOSE_FORWARD [612]: [1] -> [1] (0) | |
|-> 1. 0x1438e8ba0 (0x285da6e00:0) [2x8x256x160] -0.397217 -0.514160 -0.087708 .. | |
|<- 1. 0x1438a9fb0 (0x285da6fc0:0) [2x256x8x160] -0.397217 -0.514160 -0.087708 .. | |
CCV_NNC_GEMM_FORWARD [613]: [3] -> [1] (0) | |
|-> 1. 0x1438e8c10 (0x285da6fc0:0) [2x256x1280] -0.397217 -0.514160 -0.087708 .. | |
|-> 2. 0x1438c3a10 (0x285d8e040:0) [1280x1280] 0.031433 -0.050446 -0.028473 .. | |
|-> 3. 0x1438c3a80 (0x285d8ca80:0) [1280] -0.027130 -0.031281 0.020508 .. | |
|<- 1. 0x1438aa020 (0x285da7780:0) [2x256x1280] -0.458984 0.142212 -0.198608 .. | |
CCV_NNC_ADD_FORWARD [614]: [2] -> [1] (0) | |
|-> 1. 0x1438aa020 (0x285da7780:0) [2x256x1280] -0.458984 0.142212 -0.198608 .. | |
|-> 2. 0x1438a9a70 (0x285da6dc0:0) [2x256x1280] -0.515137 -0.354004 0.597168 .. | |
|<- 1. 0x1438aa020 (0x285da7780:0) [2x256x1280] -0.974121 -0.211792 0.398438 .. | |
CCV_NNC_LAYER_NORM_FORWARD [615]: [3] -> [3] (0) | |
|-> 1. 0x1438aa020 (0x285da7780:0) [2x256x1280] -0.974121 -0.211792 0.398438 .. | |
|-> 2. 0x1438c3af0 (0x285d8ca40:0) [1x1x1280] 0.270264 0.272949 0.266113 .. | |
|-> 3. 0x1438c3b60 (0x285d894c0:0) [1x1x1280] 0.040833 0.036346 -0.000885 .. | |
|<- 1. 0x1438aa090 (0x285da77c0:0) [2x256x1280] -0.247681 -0.026260 0.116638 .. | |
|<- 2. 0x1438aa100 (0x285da7800:0) [2x256x1] -0.003222 .. | |
|<- 3. 0x1438aa170 (0x285da7840:0) [2x256x1] 1.099609 .. | |
Emit: (0, 52) | |
CCV_NNC_GEMM_FORWARD [616]: [3] -> [1] (0) | |
|-> 1. 0x1438aa090 (0x285da77c0:0) [2x256x1280] -0.247681 -0.026260 0.116638 .. | |
|-> 2. 0x1438c3bd0 (0x285d8b3c0:0) [5120x1280] 0.022415 0.104980 0.020538 .. | |
|-> 3. 0x1438c3c40 (0x285d8b5c0:0) [5120] -0.012016 -0.047729 -0.024719 .. | |
|<- 1. 0x1438aa1e0 (0x285da7380:0) [2x256x5120] 0.011574 0.051270 -0.283203 .. | |
CCV_NNC_GELU_FORWARD [617]: [1] -> [1] (0) | |
|-> 1. 0x1438aa1e0 (0x285da7380:0) [2x256x5120] 0.011574 0.051270 -0.283203 .. | |
|<- 1. 0x1438aa1e0 (0x285da7380:0) [2x256x5120] 0.005840 0.026688 -0.110046 .. | |
CCV_NNC_GEMM_FORWARD [618]: [3] -> [1] (1) | |
Wait: (1, 52) | |
|-> 1. 0x1438aa090 (0x285da77c0:0) [2x256x1280] -0.247681 -0.026260 0.116638 .. | |
|-> 2. 0x1438c3cb0 (0x285d8aac0:0) [5120x1280] -0.012741 -0.106445 0.001978 .. | |
|-> 3. 0x1438c3d20 (0x285d8b9c0:0) [5120] -0.004272 0.021820 0.003801 .. | |
|<- 1. 0x1438aa250 (0x285da5ac0:0) [2x256x5120] -0.095154 0.661133 0.175903 .. | |
Emit: (1, 53) | |
CCV_NNC_MUL_FORWARD [619]: [2] -> [1] (0) | |
Wait: (0, 53) | |
|-> 1. 0x1438aa250 (0x285da5ac0:0) [2x256x5120] -0.095154 0.661133 0.175903 .. | |
|-> 2. 0x1438aa1e0 (0x285da7380:0) [2x256x5120] 0.005840 0.026688 -0.110046 .. | |
|<- 1. 0x1438aa250 (0x285da5ac0:0) [2x256x5120] -0.000556 0.017639 -0.019363 .. | |
CCV_NNC_GEMM_FORWARD [620]: [3] -> [1] (0) | |
|-> 1. 0x1438aa250 (0x285da5ac0:0) [2x256x5120] -0.000556 0.017639 -0.019363 .. | |
|-> 2. 0x1438c3d90 (0x285d896c0:0) [1280x5120] -0.018845 -0.054626 0.055389 .. | |
|-> 3. 0x1438c3e00 (0x285d8b900:0) [1280] 0.008690 -0.017319 0.016159 .. | |
|<- 1. 0x1438aa2c0 (0x285da6dc0:0) [2x256x1280] 0.151489 0.550293 0.319824 .. | |
CCV_NNC_ADD_FORWARD [621]: [2] -> [1] (0) | |
|-> 1. 0x1438aa2c0 (0x285da6dc0:0) [2x256x1280] 0.151489 0.550293 0.319824 .. | |
|-> 2. 0x1438aa020 (0x285da7780:0) [2x256x1280] -0.974121 -0.211792 0.398438 .. | |
|<- 1. 0x1438aa2c0 (0x285da6dc0:0) [2x256x1280] -0.822754 0.338379 0.718262 .. | |
CCV_NNC_CONVOLUTION_FORWARD [622]: [3] -> [1] (0) | |
|-> 1. 0x1438e8c80 (0x285da6dc0:0) [2x16x16x1280] -0.822754 0.338379 0.718262 .. | |
|-> 2. 0x1438c3e70 (0x285d8a880:0) [1280x1280x1x1] 0.033752 .. | |
|-> 3. 0x1438c3ee0 (0x285d8a7c0:0) [1280] -0.081055 0.000585 0.003956 .. | |
|<- 1. 0x1438aa330 (0x285da6fc0:0) [2x16x16x1280] -2.039062 -2.007812 2.421875 .. | |
CCV_NNC_ADD_FORWARD [623]: [2] -> [1] (0) | |
|-> 1. 0x1438aa330 (0x285da6fc0:0) [2x16x16x1280] -2.039062 -2.007812 2.421875 .. | |
|-> 2. 0x1438a8c70 (0x285da6f00:0) [2x16x16x1280] 1.439453 1.792969 -2.570312 .. | |
|<- 1. 0x1438ed3f0 (0x285da61c0:0) [2x16x16x1280] -0.599609 -0.214844 -0.148438 .. | |
CCV_NNC_CONVOLUTION_FORWARD [624]: [3] -> [1] (0) | |
|-> 1. 0x1438ed3f0 (0x285da61c0:0) [2x16x16x1280] -0.599609 -0.214844 -0.148438 .. | |
|-> 2. 0x1438c3f50 (0x285d89d00:0) [1280x1280x3x3] -0.013542 -0.019775 -0.012993 .. | |
|-> 3. 0x1438c3fc0 (0x285d8a6c0:0) [1280] -0.010803 -0.018738 -0.024414 .. | |
|<- 1. 0x1438ed220 (0x285d83dc0:0) [2x8x8x1280] -0.415771 -0.962891 1.918945 .. | |
CCV_NNC_GROUP_NORM_FORWARD [625]: [3] -> [3] (0) | |
|-> 1. 0x1438ed220 (0x285d83dc0:0) [2x8x8x1280] -0.415771 -0.962891 1.918945 .. | |
|-> 2. 0x1438c4030 (0x285d89dc0:0) [1x1x1x1280] 0.356445 0.575195 0.341064 .. | |
|-> 3. 0x1438c40a0 (0x285d89b40:0) [1x1x1x1280] -0.049286 -0.172241 -0.042419 .. | |
|<- 1. 0x1438aa3a0 (0x285da7880:0) [2x8x8x1280] -0.102966 -0.444580 0.375977 .. | |
|<- 2. 0x1438aa410 (0x285da78c0:0) [2x1x1x32] -0.160400 -0.602539 -0.460938 .. | |
|<- 3. 0x1438aa480 (0x285da7900:0) [2x1x1x32] 0.589844 0.599121 0.614746 .. | |
CCV_NNC_SWISH_FORWARD [626]: [1] -> [1] (0) | |
|-> 1. 0x1438aa3a0 (0x285da7880:0) [2x8x8x1280] -0.102966 -0.444580 0.375977 .. | |
|<- 1. 0x1438aa3a0 (0x285da7880:0) [2x8x8x1280] -0.048828 -0.173706 0.222900 .. | |
CCV_NNC_CONVOLUTION_FORWARD [627]: [3] -> [1] (0) | |
|-> 1. 0x1438aa3a0 (0x285da7880:0) [2x8x8x1280] -0.048828 -0.173706 0.222900 .. | |
|-> 2. 0x1438c41f0 (0x285d8adc0:0) [1280x1280x3x3] -0.041321 -0.024048 -0.009758 .. | |
|-> 3. 0x1438c4260 (0x285d8ad00:0) [1280] 0.068237 -0.042267 -0.026306 .. | |
|<- 1. 0x1438aa560 (0x285da7980:0) [2x8x8x1280] 0.378662 -0.772949 1.360352 .. | |
CCV_NNC_ADD_FORWARD [628]: [2] -> [1] (0) | |
Wait: (0, 54) | |
|-> 1. 0x1438aa560 (0x285da7980:0) [2x8x8x1280] 0.378662 -0.772949 1.360352 .. | |
|-> 2. 0x1438e8cf0 (0x285da7940:0) [2x1x1x1280] 0.770020 0.276611 0.438477 .. | |
|<- 1. 0x1438aa560 (0x285da7980:0) [2x8x8x1280] 1.148438 -0.496338 1.798828 .. | |
CCV_NNC_GROUP_NORM_FORWARD [629]: [3] -> [3] (0) | |
|-> 1. 0x1438aa560 (0x285da7980:0) [2x8x8x1280] 1.148438 -0.496338 1.798828 .. | |
|-> 2. 0x1438c42d0 (0x285d8b040:0) [1x1x1x1280] 0.588379 0.901367 0.817383 .. | |
|-> 3. 0x1438c4340 (0x285d8af80:0) [1x1x1x1280] -0.204224 -0.406982 -0.299072 .. | |
|<- 1. 0x1438aa5d0 (0x285da7880:0) [2x8x8x1280] 0.072388 -1.202148 0.522461 .. | |
|<- 2. 0x1438aa640 (0x285da79c0:0) [2x1x1x32] 0.576660 0.451416 0.241577 .. | |
|<- 3. 0x1438aa6b0 (0x285da7a00:0) [2x1x1x32] 0.822266 1.111328 0.558105 .. | |
CCV_NNC_SWISH_FORWARD [630]: [1] -> [1] (0) | |
|-> 1. 0x1438aa5d0 (0x285da7880:0) [2x8x8x1280] 0.072388 -1.202148 0.522461 .. | |
|<- 1. 0x1438aa5d0 (0x285da7880:0) [2x8x8x1280] 0.037506 -0.277832 0.327881 .. | |
CCV_NNC_CONVOLUTION_FORWARD [631]: [3] -> [1] (0) | |
|-> 1. 0x1438aa5d0 (0x285da7880:0) [2x8x8x1280] 0.037506 -0.277832 0.327881 .. | |
|-> 2. 0x1438c43b0 (0x285d8a740:0) [1280x1280x3x3] -0.007942 -0.025864 -0.020462 .. | |
|-> 3. 0x1438c4420 (0x285df7900:0) [1280] 0.032349 0.049072 0.003355 .. | |
|<- 1. 0x1438aa720 (0x285da7a40:0) [2x8x8x1280] -0.593750 0.087769 -0.660156 .. | |
CCV_NNC_ADD_FORWARD [632]: [2] -> [1] (0) | |
|-> 1. 0x1438ed220 (0x285d83dc0:0) [2x8x8x1280] -0.415771 -0.962891 1.918945 .. | |
|-> 2. 0x1438aa720 (0x285da7a40:0) [2x8x8x1280] -0.593750 0.087769 -0.660156 .. | |
|<- 1. 0x1438ed050 (0x285d81340:0) [2x8x8x1280] -1.009766 -0.875000 1.258789 .. | |
CCV_NNC_GROUP_NORM_FORWARD [633]: [3] -> [3] (0) | |
|-> 1. 0x1438ed050 (0x285d81340:0) [2x8x8x1280] -1.009766 -0.875000 1.258789 .. | |
|-> 2. 0x1438c4490 (0x285df6980:0) [1x1x1x1280] 0.375000 0.524902 0.364502 .. | |
|-> 3. 0x1438c4500 (0x285df5540:0) [1x1x1x1280] -0.052826 -0.081726 -0.053253 .. | |
|<- 1. 0x1438aa790 (0x285da7a40:0) [2x8x8x1280] -0.244141 -0.308594 0.238037 .. | |
|<- 2. 0x1438aa800 (0x285da67c0:0) [2x1x1x32] -0.125854 -0.469971 -0.328613 .. | |
|<- 3. 0x1438aa870 (0x285da6800:0) [2x1x1x32] 0.577148 0.594727 0.626953 .. | |
CCV_NNC_SWISH_FORWARD [634]: [1] -> [1] (0) | |
|-> 1. 0x1438aa790 (0x285da7a40:0) [2x8x8x1280] -0.244141 -0.308594 0.238037 .. | |
|<- 1. 0x1438aa790 (0x285da7a40:0) [2x8x8x1280] -0.107239 -0.130737 0.133057 .. | |
CCV_NNC_CONVOLUTION_FORWARD [635]: [3] -> [1] (0) | |
|-> 1. 0x1438aa790 (0x285da7a40:0) [2x8x8x1280] -0.107239 -0.130737 0.133057 .. | |
|-> 2. 0x1438c4650 (0x285df5440:0) [1280x1280x3x3] -0.037018 -0.017319 -0.041565 .. | |
|-> 3. 0x1438c46c0 (0x285df6d40:0) [1280] -0.069641 0.033020 0.103821 .. | |
|<- 1. 0x1438aa950 (0x285da7ac0:0) [2x8x8x1280] -0.646973 0.340088 0.199463 .. | |
CCV_NNC_ADD_FORWARD [636]: [2] -> [1] (0) | |
Wait: (0, 55) | |
|-> 1. 0x1438aa950 (0x285da7ac0:0) [2x8x8x1280] -0.646973 0.340088 0.199463 .. | |
|-> 2. 0x1438e8d60 (0x285da7a80:0) [2x1x1x1280] -0.554199 0.637207 0.615234 .. | |
|<- 1. 0x1438aa950 (0x285da7ac0:0) [2x8x8x1280] -1.201172 0.977539 0.814453 .. | |
CCV_NNC_GROUP_NORM_FORWARD [637]: [3] -> [3] (0) | |
|-> 1. 0x1438aa950 (0x285da7ac0:0) [2x8x8x1280] -1.201172 0.977539 0.814453 .. | |
|-> 2. 0x1438c4730 (0x285df68c0:0) [1x1x1x1280] 1.188477 0.872559 0.577637 .. | |
|-> 3. 0x1438c47a0 (0x285df5640:0) [1x1x1x1280] -0.458496 -0.503418 -0.258057 .. | |
|<- 1. 0x1438aa9c0 (0x285da7a40:0) [2x8x8x1280] -2.001953 -0.152344 -0.099182 .. | |
|<- 2. 0x1438aaa30 (0x285da7400:0) [2x1x1x32] 0.462158 0.926270 0.564453 .. | |
|<- 3. 0x1438aaaa0 (0x285da73c0:0) [2x1x1x32] 0.780762 0.915039 0.851074 .. | |
CCV_NNC_SWISH_FORWARD [638]: [1] -> [1] (0) | |
|-> 1. 0x1438aa9c0 (0x285da7a40:0) [2x8x8x1280] -2.001953 -0.152344 -0.099182 .. | |
|<- 1. 0x1438aa9c0 (0x285da7a40:0) [2x8x8x1280] -0.238281 -0.070374 -0.047119 .. | |
CCV_NNC_CONVOLUTION_FORWARD [639]: [3] -> [1] (0) | |
|-> 1. 0x1438aa9c0 (0x285da7a40:0) [2x8x8x1280] -0.238281 -0.070374 -0.047119 .. | |
|-> 2. 0x1438c4810 (0x285dfcc40:0) [1280x1280x3x3] -0.015480 0.022446 0.044220 .. | |
|-> 3. 0x1438c4880 (0x285dfe440:0) [1280] 0.082153 -0.000108 0.050964 .. | |
|<- 1. 0x1438aab10 (0x285da7b00:0) [2x8x8x1280] 0.281006 -0.273682 0.623047 .. | |
CCV_NNC_ADD_FORWARD [640]: [2] -> [1] (0) | |
|-> 1. 0x1438ed050 (0x285d81340:0) [2x8x8x1280] -1.009766 -0.875000 1.258789 .. | |
|-> 2. 0x1438aab10 (0x285da7b00:0) [2x8x8x1280] 0.281006 -0.273682 0.623047 .. | |
|<- 1. 0x1438ece80 (0x285d81380:0) [2x8x8x1280] -0.728516 -1.148438 1.881836 .. | |
CCV_NNC_GROUP_NORM_FORWARD [641]: [3] -> [3] (0) | |
|-> 1. 0x1438ece80 (0x285d81380:0) [2x8x8x1280] -0.728516 -1.148438 1.881836 .. | |
|-> 2. 0x1438c48f0 (0x285dfef40:0) [1x1x1x1280] 0.395996 0.522461 0.387939 .. | |
|-> 3. 0x1438c4960 (0x285dfe480:0) [1x1x1x1280] -0.032867 -0.152466 -0.053741 .. | |
|<- 1. 0x1438aab80 (0x285da7b00:0) [2x8x8x1280] -0.187622 -0.470459 0.320312 .. | |
|<- 2. 0x1438aabf0 (0x285da7b40:0) [2x1x1x32] 0.024628 -0.541504 -0.468750 .. | |
|<- 3. 0x1438aac60 (0x285da7b80:0) [2x1x1x32] 0.519043 0.539062 0.569824 .. | |
CCV_NNC_SWISH_FORWARD [642]: [1] -> [1] (0) | |
|-> 1. 0x1438aab80 (0x285da7b00:0) [2x8x8x1280] -0.187622 -0.470459 0.320312 .. | |
|<- 1. 0x1438aab80 (0x285da7b00:0) [2x8x8x1280] -0.085022 -0.180908 0.185547 .. | |
CCV_NNC_CONVOLUTION_FORWARD [643]: [3] -> [1] (0) | |
|-> 1. 0x1438aab80 (0x285da7b00:0) [2x8x8x1280] -0.085022 -0.180908 0.185547 .. | |
|-> 2. 0x1438c4ab0 (0x285e6d8c0:0) [1280x1280x3x3] 0.019470 0.036560 0.024933 .. | |
|-> 3. 0x1438c4b20 (0x285e6da00:0) [1280] 0.072510 0.083374 -0.002544 .. | |
|<- 1. 0x1438aad40 (0x285da7c00:0) [2x8x8x1280] 1.964844 1.085938 1.739258 .. | |
CCV_NNC_ADD_FORWARD [644]: [2] -> [1] (0) | |
Wait: (0, 56) | |
|-> 1. 0x1438aad40 (0x285da7c00:0) [2x8x8x1280] 1.964844 1.085938 1.739258 .. | |
|-> 2. 0x1438e8dd0 (0x285da7bc0:0) [2x1x1x1280] 0.581543 1.150391 0.077393 .. | |
|<- 1. 0x1438aad40 (0x285da7c00:0) [2x8x8x1280] 2.546875 2.236328 1.816406 .. | |
CCV_NNC_GROUP_NORM_FORWARD [645]: [3] -> [3] (0) | |
|-> 1. 0x1438aad40 (0x285da7c00:0) [2x8x8x1280] 2.546875 2.236328 1.816406 .. | |
|-> 2. 0x1438c4b90 (0x285e6d980:0) [1x1x1x1280] 0.350830 0.572266 0.883789 .. | |
|-> 3. 0x1438c4c00 (0x285e6d740:0) [1x1x1x1280] -0.258301 -0.269287 -0.452881 .. | |
|<- 1. 0x1438aadb0 (0x285da7b00:0) [2x8x8x1280] 0.063660 0.144531 -0.046509 .. | |
|<- 2. 0x1438aae20 (0x285da6880:0) [2x1x1x32] 1.083008 0.687988 0.489258 .. | |
|<- 3. 0x1438aae90 (0x285da68c0:0) [2x1x1x32] 0.626953 0.719238 0.718750 .. | |
CCV_NNC_SWISH_FORWARD [646]: [1] -> [1] (0) | |
|-> 1. 0x1438aadb0 (0x285da7b00:0) [2x8x8x1280] 0.063660 0.144531 -0.046509 .. | |
|<- 1. 0x1438aadb0 (0x285da7b00:0) [2x8x8x1280] 0.032837 0.077454 -0.022720 .. | |
CCV_NNC_CONVOLUTION_FORWARD [647]: [3] -> [1] (0) | |
|-> 1. 0x1438aadb0 (0x285da7b00:0) [2x8x8x1280] 0.032837 0.077454 -0.022720 .. | |
|-> 2. 0x1438c4c70 (0x285e6a4c0:0) [1280x1280x3x3] 0.009064 -0.005798 0.006561 .. | |
|-> 3. 0x1438c4ce0 (0x285e69a40:0) [1280] 0.033661 0.001286 0.012787 .. | |
|<- 1. 0x1438aaf00 (0x285da7c40:0) [2x8x8x1280] -0.475586 1.485352 0.928711 .. | |
CCV_NNC_ADD_FORWARD [648]: [2] -> [1] (0) | |
|-> 1. 0x1438ece80 (0x285d81380:0) [2x8x8x1280] -0.728516 -1.148438 1.881836 .. | |
|-> 2. 0x1438aaf00 (0x285da7c40:0) [2x8x8x1280] -0.475586 1.485352 0.928711 .. | |
|<- 1. 0x1438aaf70 (0x285da7c00:0) [2x8x8x1280] -1.204102 0.336914 2.810547 .. | |
CCV_NNC_GROUP_NORM_FORWARD [649]: [3] -> [3] (0) | |
|-> 1. 0x1438aaf70 (0x285da7c00:0) [2x8x8x1280] -1.204102 0.336914 2.810547 .. | |
|-> 2. 0x1438c4d50 (0x285e69f40:0) [1x1x1x1280] 0.379883 0.236816 0.363037 .. | |
|-> 3. 0x1438c4dc0 (0x285e6a200:0) [1x1x1x1280] -0.019196 -0.055298 -0.023285 .. | |
|<- 1. 0x1438aafe0 (0x285da7c40:0) [2x8x8x1280] -0.208252 -0.025070 0.387451 .. | |
|<- 2. 0x1438ab050 (0x285da73c0:0) [2x1x1x32] 0.022263 -0.726074 -0.319092 .. | |
|<- 3. 0x1438ab0c0 (0x285da7400:0) [2x1x1x32] 0.405762 0.396484 0.438232 .. | |
CCV_NNC_CONVOLUTION_FORWARD [650]: [3] -> [1] (0) | |
|-> 1. 0x1438aafe0 (0x285da7c40:0) [2x8x8x1280] -0.208252 -0.025070 0.387451 .. | |
|-> 2. 0x1438c4e30 (0x285e69980:0) [1280x1280x1x1] 0.035675 .. | |
|-> 3. 0x1438c4ea0 (0x285e69b40:0) [1280] 0.062561 -0.012909 0.075867 .. | |
|<- 1. 0x1438ab130 (0x285da7b00:0) [2x8x8x1280] 0.255371 -2.494141 0.954590 .. | |
CCV_NNC_LAYER_NORM_FORWARD [651]: [3] -> [3] (0) | |
|-> 1. 0x1438e8e40 (0x285da7b00:0) [2x64x1280] 0.255371 -2.494141 0.954590 .. | |
|-> 2. 0x1438c4f10 (0x285e69900:0) [1x1x1280] 0.276611 0.290771 0.278564 .. | |
|-> 3. 0x1438c4f80 (0x285e69c40:0) [1x1x1280] 0.014793 -0.018753 0.015091 .. | |
|<- 1. 0x1438ab1a0 (0x285da7c40:0) [2x64x1280] 0.080811 -0.657227 0.253906 .. | |
|<- 2. 0x1438ab210 (0x285da7c80:0) [2x64x1] -0.014259 .. | |
|<- 3. 0x1438ab280 (0x285da7cc0:0) [2x64x1] 0.885254 .. | |
Emit: (0, 57) | |
CCV_NNC_GEMM_FORWARD [652]: [2] -> [1] (0) | |
|-> 1. 0x1438ab1a0 (0x285da7c40:0) [2x64x1280] 0.080811 -0.657227 0.253906 .. | |
|-> 2. 0x1438c4ff0 (0x285e69b80:0) [1280x1280] 0.006420 0.047607 -0.014336 .. | |
|<- 1. 0x1438ab2f0 (0x285da7d00:0) [2x64x1280] -1.171875 -0.037689 0.780762 .. | |
CCV_NNC_SCALAR_MUL_FORWARD [653]: [1] -> [1] (0) | |
|-> 1. 0x1438ab2f0 (0x285da7d00:0) [2x64x1280] -1.171875 -0.037689 0.780762 .. | |
|<- 1. 0x1438ab2f0 (0x285da7d00:0) [2x64x1280] -0.092651 -0.002979 0.061707 .. | |
CCV_NNC_TRANSPOSE_FORWARD [654]: [1] -> [1] (0) | |
|-> 1. 0x1438e8f20 (0x285da7d00:0) [2x64x8x160] -0.092651 -0.002979 0.061707 .. | |
|<- 1. 0x1438ab440 (0x285da7dc0:0) [2x8x64x160] -0.092651 -0.002979 0.061707 .. | |
CCV_NNC_GEMM_FORWARD [655]: [2] -> [1] (1) | |
Wait: (1, 57) | |
|-> 1. 0x1438ab1a0 (0x285da7c40:0) [2x64x1280] 0.080811 -0.657227 0.253906 .. | |
|-> 2. 0x1438c5060 (0x285e69880:0) [1280x1280] -0.001306 -0.038757 -0.076477 .. | |
|<- 1. 0x1438ab360 (0x285da7d40:0) [2x64x1280] -1.183594 0.456299 1.410156 .. | |
CCV_NNC_TRANSPOSE_FORWARD [656]: [1] -> [1] (1) | |
|-> 1. 0x1438e8eb0 (0x285da7d40:0) [2x64x8x160] -1.183594 0.456299 1.410156 .. | |
|<- 1. 0x1438ab3d0 (0x285da7d80:0) [2x8x64x160] -1.183594 0.456299 1.410156 .. | |
Emit: (1, 58) | |
CCV_NNC_GEMM_FORWARD [657]: [2] -> [1] (2) | |
Wait: (2, 57) | |
|-> 1. 0x1438ab1a0 (0x285da7c40:0) [2x64x1280] 0.080811 -0.657227 0.253906 .. | |
|-> 2. 0x1438c50d0 (0x285e6a340:0) [1280x1280] 0.044281 -0.023407 0.047577 .. | |
|<- 1. 0x1438ab4b0 (0x285da7e00:0) [2x64x1280] 1.144531 -0.024384 -0.335205 .. | |
CCV_NNC_TRANSPOSE_FORWARD [658]: [1] -> [1] (2) | |
|-> 1. 0x1438e9070 (0x285da7e00:0) [2x64x8x160] 1.144531 -0.024384 -0.335205 .. | |
|<- 1. 0x1438ab590 (0x285da7e80:0) [2x8x64x160] 1.144531 -0.024384 -0.335205 .. | |
Emit: (2, 59) | |
CCV_NNC_GEMM_FORWARD [659]: [2] -> [1] (0) | |
Wait: (0, 58) | |
|-> 1. 0x1438e9000 (0x285da7dc0:0) [1x64x160] -0.092651 -0.002979 0.061707 .. | |
|-> 2. 0x1438e8f90 (0x285da7d80:0) [1x64x160] -1.183594 0.456299 1.410156 .. | |
|<- 1. 0x1438ab520 (0x285da7e40:0) [1x64x64] 4.921875 0.821289 0.454834 .. | |
CCV_NNC_SOFTMAX_FORWARD [660]: [1] -> [1] (0) | |
|-> 1. 0x1438e90e0 (0x285da7e40:0) [64x64] 4.921875 0.821289 0.454834 .. | |
|<- 1. 0x1438e90e0 (0x285da7e40:0) [64x64] 0.506836 0.008400 0.005821 .. | |
CCV_NNC_GEMM_FORWARD [661]: [2] -> [1] (0) | |
Wait: (0, 59) | |
|-> 1. 0x1438e91c0 (0x285da7e40:0) [1x64x64] 0.506836 0.008400 0.005821 .. | |
|-> 2. 0x1438e9150 (0x285da7e80:0) [1x64x160] 1.144531 -0.024384 -0.335205 .. | |
|<- 1. 0x1438ebe40 (0x285da7c40:0) [1x64x160] 0.771484 -0.089233 -0.232788 .. | |
CCV_NNC_GEMM_FORWARD [662]: [2] -> [1] (0) | |
|-> 1. 0x1438e92e0 (0x285da7dc0:0) [1x64x160] 0.081360 0.004601 -0.015053 .. | |
|-> 2. 0x1438e9230 (0x285da7d80:0) [1x64x160] 1.039062 0.099976 -0.261475 .. | |
|<- 1. 0x1438ab600 (0x285da7ec0:0) [1x64x64] 3.675781 0.514160 0.521484 .. | |
CCV_NNC_SOFTMAX_FORWARD [663]: [1] -> [1] (0) | |
|-> 1. 0x1438e9390 (0x285da7ec0:0) [64x64] 3.675781 0.514160 0.521484 .. | |
|<- 1. 0x1438e9390 (0x285da7ec0:0) [64x64] 0.338379 0.014336 0.014435 .. | |
CCV_NNC_GEMM_FORWARD [664]: [2] -> [1] (0) | |
|-> 1. 0x1438e94b0 (0x285da7ec0:0) [1x64x64] 0.338379 0.014336 0.014435 .. | |
|-> 2. 0x1438e9400 (0x285da7e80:0) [1x64x160] -0.206665 -0.201904 -0.258545 .. | |
|<- 1. 0x1438ebeb0 (0x285da7c40:0) [1x64x160] 0.018921 -0.016174 -0.269775 .. | |
CCV_NNC_GEMM_FORWARD [665]: [2] -> [1] (0) | |
|-> 1. 0x1438e95d0 (0x285da7dc0:0) [1x64x160] 0.072449 -0.079407 0.030930 .. | |
|-> 2. 0x1438e9520 (0x285da7d80:0) [1x64x160] 1.650391 -0.655762 -0.003675 .. | |
|<- 1. 0x1438ab670 (0x285da7ec0:0) [1x64x64] 4.578125 1.877930 1.080078 .. | |
CCV_NNC_SOFTMAX_FORWARD [666]: [1] -> [1] (0) | |
|-> 1. 0x1438e9680 (0x285da7ec0:0) [64x64] 4.578125 1.877930 1.080078 .. | |
|<- 1. 0x1438e9680 (0x285da7ec0:0) [64x64] 0.360840 0.024246 0.010918 .. | |
CCV_NNC_GEMM_FORWARD [667]: [2] -> [1] (0) | |
|-> 1. 0x1438e97a0 (0x285da7ec0:0) [1x64x64] 0.360840 0.024246 0.010918 .. | |
|-> |