Created
August 26, 2024 16:03
Assembly output from the mat3d vs. mat4d comparison
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
.file "tmp.cpp" | |
.text | |
#APP | |
.globl _ZSt21ios_base_library_initv | |
#NO_APP | |
# std::ctype<char>::do_widen(char) const -- weak COMDAT copy.
# SysV AMD64: the character argument arrives in %esi and is returned unchanged in %eax.
.section .text._ZNKSt5ctypeIcE8do_widenEc,"axG",@progbits,_ZNKSt5ctypeIcE8do_widenEc,comdat | |
.align 2 | |
.p2align 4 | |
.weak _ZNKSt5ctypeIcE8do_widenEc | |
.type _ZNKSt5ctypeIcE8do_widenEc, @function | |
_ZNKSt5ctypeIcE8do_widenEc: | |
.LFB2397: | |
.cfi_startproc | |
endbr64 | |
# Identity: hand the incoming character straight back.
movl %esi, %eax | |
ret | |
.cfi_endproc | |
.LFE2397: | |
.size _ZNKSt5ctypeIcE8do_widenEc, .-_ZNKSt5ctypeIcE8do_widenEc | |
# Eigen::IOFormat::~IOFormat() -- base-object destructor (D2), weak, in COMDAT group D5.
# The complete-object destructor (D1) is defined as an alias of D2 at the end of this block.
# In: %rdi = this (held in callee-saved %rbx across the calls).
# Walks seven 32-byte slots from offset 192 down to 0. For each slot it loads the
# pointer stored at slot+0 and compares it with the address of slot+16; when they
# differ it calls operator delete(ptr, [slot+16] + 1).
# NOTE(review): this matches the libstdc++ std::string layout (heap pointer vs. inline
# buffer, capacity at +16) -- presumably these are IOFormat's string members; confirm
# against the Eigen header.
.section .text._ZN5Eigen8IOFormatD2Ev,"axG",@progbits,_ZN5Eigen8IOFormatD5Ev,comdat | |
.align 2 | |
.p2align 4 | |
.weak _ZN5Eigen8IOFormatD2Ev | |
.type _ZN5Eigen8IOFormatD2Ev, @function | |
_ZN5Eigen8IOFormatD2Ev: | |
.LFB9798: | |
.cfi_startproc | |
endbr64 | |
pushq %rbx | |
.cfi_def_cfa_offset 16 | |
.cfi_offset 3, -16 | |
movq %rdi, %rbx | |
# Slot at offset 192.
movq 192(%rdi), %rdi | |
leaq 208(%rbx), %rax | |
cmpq %rax, %rdi | |
je .L4 | |
movq 208(%rbx), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L4: | |
# Slot at offset 160.
movq 160(%rbx), %rdi | |
leaq 176(%rbx), %rax | |
cmpq %rax, %rdi | |
je .L5 | |
movq 176(%rbx), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L5: | |
# Slot at offset 128.
movq 128(%rbx), %rdi | |
leaq 144(%rbx), %rax | |
cmpq %rax, %rdi | |
je .L6 | |
movq 144(%rbx), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L6: | |
# Slot at offset 96.
movq 96(%rbx), %rdi | |
leaq 112(%rbx), %rax | |
cmpq %rax, %rdi | |
je .L7 | |
movq 112(%rbx), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L7: | |
# Slot at offset 64.
movq 64(%rbx), %rdi | |
leaq 80(%rbx), %rax | |
cmpq %rax, %rdi | |
je .L8 | |
movq 80(%rbx), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L8: | |
# Slot at offset 32.
movq 32(%rbx), %rdi | |
leaq 48(%rbx), %rax | |
cmpq %rax, %rdi | |
je .L9 | |
movq 48(%rbx), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L9: | |
# Slot at offset 0. %rbx is restored first so the final operator delete can be a
# tail call (jmp) instead of call + ret.
movq (%rbx), %rdi | |
leaq 16(%rbx), %rax | |
cmpq %rax, %rdi | |
je .L3 | |
movq 16(%rbx), %rsi | |
popq %rbx | |
.cfi_remember_state | |
.cfi_def_cfa_offset 8 | |
addq $1, %rsi | |
jmp _ZdlPvm@PLT | |
.p2align 4,,10 | |
.p2align 3 | |
.L3: | |
# Nothing to free for the last slot: plain return.
.cfi_restore_state | |
popq %rbx | |
.cfi_def_cfa_offset 8 | |
ret | |
.cfi_endproc | |
.LFE9798: | |
.size _ZN5Eigen8IOFormatD2Ev, .-_ZN5Eigen8IOFormatD2Ev | |
# D1 (complete-object destructor) shares the D2 body.
.weak _ZN5Eigen8IOFormatD1Ev | |
.set _ZN5Eigen8IOFormatD1Ev,_ZN5Eigen8IOFormatD2Ev | |
# Read-only strings passed to __assert_fail by the alignment check in UnitRandom below:
# .LC4 = function signature, .LC5 = source file, .LC6 = assertion expression text.
.section .rodata._ZN5Eigen10QuaternionIdLi0EE10UnitRandomEv.str1.8,"aMS",@progbits,1 | |
.align 8 | |
.LC4: | |
.string "Eigen::internal::plain_array<T, Size, MatrixOrArrayOptions, 16>::plain_array() [with T = double; int Size = 4; int MatrixOrArrayOptions = 0]" | |
.align 8 | |
.LC5: | |
.string "/usr/include/eigen3/Eigen/src/Core/DenseStorage.h" | |
.align 8 | |
.LC6: | |
.string "(internal::UIntPtr(eigen_unaligned_array_assert_workaround_gcc47(array)) & (15)) == 0 && \"this assertion is explained here: \" \"http://eigen.tuxfamily.org/dox-devel/group__TopicUnalignedArrayAssert.html\" \" **** READ THIS WEB PAGE !!! ****\"" | |
# Eigen::Quaternion<double, 0>::UnitRandom() -- weak COMDAT copy.
# In:  %rdi = address that receives the four result doubles (kept in %rbx).
# Out: %rax = that same address.
# Draws three rand() values, combines two square roots with two sincos() results,
# and stores the four products as two packed pairs at (%rbx) and 16(%rbx).
# Callee-saved registers used: %rbx, %rbp, %r12, %r14, %r15. Stack locals: 48 bytes.
# NOTE(review): .LC0, .LC2 and .LC3 are defined outside this chunk; presumably
# RAND_MAX as a double, 2*pi and 1.0 respectively -- confirm against the constant pool.
.section .text._ZN5Eigen10QuaternionIdLi0EE10UnitRandomEv,"axG",@progbits,_ZN5Eigen10QuaternionIdLi0EE10UnitRandomEv,comdat | |
.align 2 | |
.p2align 4 | |
.weak _ZN5Eigen10QuaternionIdLi0EE10UnitRandomEv | |
.type _ZN5Eigen10QuaternionIdLi0EE10UnitRandomEv, @function | |
_ZN5Eigen10QuaternionIdLi0EE10UnitRandomEv: | |
.LFB9821: | |
.cfi_startproc | |
endbr64 | |
pushq %r15 | |
.cfi_def_cfa_offset 16 | |
.cfi_offset 15, -16 | |
pushq %r14 | |
.cfi_def_cfa_offset 24 | |
.cfi_offset 14, -24 | |
pushq %r12 | |
.cfi_def_cfa_offset 32 | |
.cfi_offset 12, -32 | |
pushq %rbp | |
.cfi_def_cfa_offset 40 | |
.cfi_offset 6, -40 | |
pushq %rbx | |
.cfi_def_cfa_offset 48 | |
.cfi_offset 3, -48 | |
movq %rdi, %rbx | |
subq $48, %rsp | |
.cfi_def_cfa_offset 96 | |
# u1 = (double)rand() / .LC0 + 0.0, spilled to (%rsp) across the next calls.
call rand@PLT | |
pxor %xmm3, %xmm3 | |
pxor %xmm1, %xmm1 | |
cvtsi2sdl %eax, %xmm1 | |
divsd .LC0(%rip), %xmm1 | |
addsd %xmm3, %xmm1 | |
movsd %xmm1, (%rsp) | |
# u2 = (double)rand() * .LC2 / .LC0 + 0.0, kept as raw bits in %r15.
call rand@PLT | |
pxor %xmm0, %xmm0 | |
pxor %xmm3, %xmm3 | |
cvtsi2sdl %eax, %xmm0 | |
mulsd .LC2(%rip), %xmm0 | |
divsd .LC0(%rip), %xmm0 | |
addsd %xmm3, %xmm0 | |
movq %xmm0, %r15 | |
# u3 computed the same way as u2, kept in %r14; %xmm2 = .LC3 - u1.
call rand@PLT | |
movsd (%rsp), %xmm1 | |
pxor %xmm0, %xmm0 | |
movsd .LC3(%rip), %xmm2 | |
pxor %xmm3, %xmm3 | |
cvtsi2sdl %eax, %xmm0 | |
subsd %xmm1, %xmm2 | |
mulsd .LC2(%rip), %xmm0 | |
divsd .LC0(%rip), %xmm0 | |
addsd %xmm3, %xmm0 | |
# Square roots: inline sqrtsd on the fast path; when an operand compares below 0.0
# the code branches to the out-of-line libm sqrt() call instead (.L20 / .L23).
ucomisd %xmm2, %xmm3 | |
movq %xmm0, %r14 | |
ja .L20 | |
ucomisd %xmm1, %xmm3 | |
sqrtsd %xmm2, %xmm2 | |
ja .L23 | |
.L15: | |
sqrtsd %xmm1, %xmm1 | |
.L17: | |
# Here %xmm2 = sqrt(.LC3 - u1) and %xmm1 = sqrt(u1); both are spilled across sincos().
# Both sincos calls receive %rdi = &40(%rsp) and %rsi = &32(%rsp) as output pointers
# (glibc prototype: sincos(x, double *sin, double *cos)).
leaq 40(%rsp), %rbp | |
leaq 32(%rsp), %r12 | |
movq %r15, %xmm0 | |
movsd %xmm1, 24(%rsp) | |
movq %r12, %rsi | |
movq %rbp, %rdi | |
movsd %xmm2, 16(%rsp) | |
call sincos@PLT | |
# Save the u2 results (32(%rsp) -> 8(%rsp), 40(%rsp) -> (%rsp)) before the second
# call overwrites the output slots with the u3 results.
movq %r14, %xmm0 | |
movq %r12, %rsi | |
movq %rbp, %rdi | |
movsd 32(%rsp), %xmm3 | |
movsd 40(%rsp), %xmm4 | |
movsd %xmm3, 8(%rsp) | |
movsd %xmm4, (%rsp) | |
call sincos@PLT | |
# Form the four products and pack them:
#   %xmm3 = { sqrt(.LC3-u1) * [32-slot result for u2], sqrt(u1) * [40-slot result for u3] }
#   %xmm1 = { sqrt(u1) * [32-slot result for u3], sqrt(.LC3-u1) * [40-slot result for u2] }
movsd 16(%rsp), %xmm2 | |
movsd 24(%rsp), %xmm1 | |
movsd 8(%rsp), %xmm3 | |
movsd 40(%rsp), %xmm0 | |
mulsd %xmm2, %xmm3 | |
mulsd %xmm1, %xmm0 | |
mulsd (%rsp), %xmm2 | |
mulsd 32(%rsp), %xmm1 | |
unpcklpd %xmm0, %xmm3 | |
unpcklpd %xmm2, %xmm1 | |
# Assert that the destination is 16-byte aligned; otherwise go to the __assert_fail path.
testb $15, %bl | |
jne .L24 | |
movups %xmm3, (%rbx) | |
movq %rbx, %rax | |
movups %xmm1, 16(%rbx) | |
addq $48, %rsp | |
.cfi_remember_state | |
.cfi_def_cfa_offset 48 | |
popq %rbx | |
.cfi_def_cfa_offset 40 | |
popq %rbp | |
.cfi_def_cfa_offset 32 | |
popq %r12 | |
.cfi_def_cfa_offset 24 | |
popq %r14 | |
.cfi_def_cfa_offset 16 | |
popq %r15 | |
.cfi_def_cfa_offset 8 | |
ret | |
.L20: | |
# Out-of-line sqrt() for the (.LC3 - u1) operand; u1 is preserved in (%rsp).
# Rejoins at .L15, i.e. the second root then always uses the inline sqrtsd.
.cfi_restore_state | |
movapd %xmm2, %xmm0 | |
movsd %xmm1, (%rsp) | |
call sqrt@PLT | |
movsd (%rsp), %xmm1 | |
movapd %xmm0, %xmm2 | |
jmp .L15 | |
.L23: | |
# Out-of-line sqrt() for the u1 operand; the first root is preserved in (%rsp).
movapd %xmm1, %xmm0 | |
movsd %xmm2, (%rsp) | |
call sqrt@PLT | |
movsd (%rsp), %xmm2 | |
movapd %xmm0, %xmm1 | |
jmp .L17 | |
.L24: | |
# Alignment assertion failed: __assert_fail(.LC6 expr, .LC5 file, line 109, .LC4 function).
# No code follows the call, so it is treated as non-returning.
leaq .LC4(%rip), %rcx | |
movl $109, %edx | |
leaq .LC5(%rip), %rsi | |
leaq .LC6(%rip), %rdi | |
call __assert_fail@PLT | |
.cfi_endproc | |
.LFE9821: | |
.size _ZN5Eigen10QuaternionIdLi0EE10UnitRandomEv, .-_ZN5Eigen10QuaternionIdLi0EE10UnitRandomEv | |
# Eigen::internal::print_matrix<Eigen::Matrix<double,3,3,0,3,3>>(
#     std::ostream&, const Matrix&, const Eigen::IOFormat&) -- weak COMDAT copy.
# In:  %rdi = output stream (kept in %rbx)
#      %rsi = matrix data, nine doubles (pointer saved at 104(%rsp))
#      %rdx = IOFormat object (kept in %rbp)
# Out: %rax = the output stream.
# Frame: 568 bytes of locals; stack-protector canary at 552(%rsp).
# Key locals: 112(%rsp) = precision to apply (0 = leave alone), 120(%rsp) = saved old
# value, 16(%rsp) = column width, 160(%rsp).. = scratch std::stringstream,
# 128(%rsp).. = scratch std::string.
# Structure: (1) optional precision override, (2) optional width measurement over all
# nine coefficients, (3) row-by-row output, (4) restore precision, (5) EH landing pads.
# NOTE(review): the meaning of the IOFormat offsets used below (0, 32, 64, 96, 128,
# 160, 192 = strings; 224 = int; 228 = flag byte) is inferred from usage here -- confirm
# against the Eigen header.
.section .text._ZN5Eigen8internal12print_matrixINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS4_RKT_RKNS_8IOFormatE,"axG",@progbits,_ZN5Eigen8internal12print_matrixINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS4_RKT_RKNS_8IOFormatE,comdat | |
.p2align 4 | |
.weak _ZN5Eigen8internal12print_matrixINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS4_RKT_RKNS_8IOFormatE | |
.type _ZN5Eigen8internal12print_matrixINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS4_RKT_RKNS_8IOFormatE, @function | |
_ZN5Eigen8internal12print_matrixINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS4_RKT_RKNS_8IOFormatE: | |
.LFB10067: | |
.cfi_startproc | |
.cfi_personality 0x9b,DW.ref.__gxx_personality_v0 | |
.cfi_lsda 0x1b,.LLSDA10067 | |
endbr64 | |
pushq %r15 | |
.cfi_def_cfa_offset 16 | |
.cfi_offset 15, -16 | |
pushq %r14 | |
.cfi_def_cfa_offset 24 | |
.cfi_offset 14, -24 | |
pushq %r13 | |
.cfi_def_cfa_offset 32 | |
.cfi_offset 13, -32 | |
pushq %r12 | |
.cfi_def_cfa_offset 40 | |
.cfi_offset 12, -40 | |
pushq %rbp | |
.cfi_def_cfa_offset 48 | |
.cfi_offset 6, -48 | |
movq %rdx, %rbp | |
pushq %rbx | |
.cfi_def_cfa_offset 56 | |
.cfi_offset 3, -56 | |
movq %rdi, %rbx | |
subq $568, %rsp | |
.cfi_def_cfa_offset 624 | |
movq %rsi, 104(%rsp) | |
movq %fs:40, %rax | |
movq %rax, 552(%rsp) | |
xorl %eax, %eax | |
# --- (1) Precision selection from the 32-bit field at 224(fmt) ---
#   -1 -> .L55: no override (112/120(%rsp) zeroed)
#   -2 -> .L56: override with 15
#   otherwise: override with the field's value, unless it is 0.
movslq 224(%rdx), %rax | |
cmpl $-1, %eax | |
je .L55 | |
cmpl $-2, %eax | |
je .L56 | |
movq %rax, 112(%rsp) | |
movq $0, 120(%rsp) | |
testq %rax, %rax | |
je .L26 | |
.L27: | |
# Locate the stream's virtual base through the vbase offset at vtable[-24], then swap
# the quadword at +8 of it with 112(%rsp), keeping the previous value in 120(%rsp).
# NOTE(review): +8 is presumably ios_base's precision field -- confirm.
movq (%rbx), %rax | |
movq -24(%rax), %rdx | |
addq %rbx, %rdx | |
movq %rdx, %rax | |
movq 8(%rdx), %rdx | |
movq %rdx, 120(%rsp) | |
movq 112(%rsp), %rdx | |
movq %rdx, 8(%rax) | |
.L26: | |
# Bit 0 of the flag byte at 228(fmt) set -> skip width measurement (width = 0).
testb $1, 228(%rbp) | |
jne .L58 | |
.L82: | |
# --- (2) Width measurement: set-up ---
#   96(%rsp) = outer counter (steps of 3 up to 9), 16(%rsp) = running maximum width,
#   40(%rsp) = cursor into the matrix data, 56(%rsp) = &stringstream (160(%rsp)),
#   8(%rsp) = &ios part of it (288(%rsp)), 64/80(%rsp) = cached vtable-pointer pairs,
#   %r12 / %r15 = VTT entries used for in-place construction and destruction.
leaq 64+_ZTVNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movq 16+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %r12 | |
movq $0, 96(%rsp) | |
movq %rax, %xmm0 | |
movq 104(%rsp), %rax | |
movq $0, 16(%rsp) | |
movdqa %xmm0, %xmm3 | |
movdqa %xmm0, %xmm4 | |
movq 32+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %r15 | |
movq %rax, 40(%rsp) | |
leaq 160(%rsp), %rax | |
movhps .LC7(%rip), %xmm3 | |
movhps .LC8(%rip), %xmm4 | |
movq %rax, 56(%rsp) | |
leaq 288(%rsp), %rax | |
movq %rax, 8(%rsp) | |
movaps %xmm3, 64(%rsp) | |
movaps %xmm4, 80(%rsp) | |
.L29: | |
# Outer loop body: %r13 = inner index 0..2.
xorl %r13d, %r13d | |
.L43: | |
# Inner loop: construct a std::stringstream in place at 160(%rsp) (inlined constructor:
# ios_base ctor, vtable pointers, three basic_ios::init calls, locale, stringbuf).
movq 8(%rsp), %rdi | |
call _ZNSt8ios_baseC2Ev@PLT | |
leaq 16+_ZTVSt9basic_iosIcSt11char_traitsIcEE(%rip), %rax | |
xorl %edx, %edx | |
xorl %esi, %esi | |
pxor %xmm0, %xmm0 | |
movw %dx, 512(%rsp) | |
movq 24+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rcx | |
movups %xmm0, 520(%rsp) | |
movups %xmm0, 536(%rsp) | |
movq %rax, 288(%rsp) | |
movq -24(%r12), %rax | |
movq $0, 504(%rsp) | |
movq %r12, 160(%rsp) | |
movq %rcx, 160(%rsp,%rax) | |
movq 56(%rsp), %rax | |
movq $0, 168(%rsp) | |
addq -24(%r12), %rax | |
movq %rax, %rdi | |
.LEHB0: | |
call _ZNSt9basic_iosIcSt11char_traitsIcEE4initEPSt15basic_streambufIcS1_E@PLT | |
.LEHE0: | |
movq -24(%r15), %rax | |
leaq 176(%rsp), %r14 | |
movq %r15, 176(%rsp) | |
xorl %esi, %esi | |
addq %r14, %rax | |
movq %rax, %rdi | |
movq 40+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movq %rax, (%rdi) | |
.LEHB1: | |
call _ZNSt9basic_iosIcSt11char_traitsIcEE4initEPSt15basic_streambufIcS1_E@PLT | |
.LEHE1: | |
movq 8+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movq 48+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rcx | |
pxor %xmm0, %xmm0 | |
movdqa 80(%rsp), %xmm1 | |
movq -24(%rax), %rax | |
movq %rcx, 160(%rsp,%rax) | |
leaq 24+_ZTVNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movq %rax, 160(%rsp) | |
addq $80, %rax | |
movq %rax, 288(%rsp) | |
leaq 240(%rsp), %rax | |
movq %rax, %rdi | |
movq %rax, 24(%rsp) | |
movaps %xmm1, 176(%rsp) | |
movaps %xmm0, 192(%rsp) | |
movaps %xmm0, 208(%rsp) | |
movaps %xmm0, 224(%rsp) | |
call _ZNSt6localeC1Ev@PLT | |
leaq 16+_ZTVNSt7__cxx1115basic_stringbufIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movq 8(%rsp), %rdi | |
leaq 184(%rsp), %rsi | |
movq %rax, 184(%rsp) | |
leaq 272(%rsp), %rax | |
movl $24, 248(%rsp) | |
movq %rax, 32(%rsp) | |
movq %rax, 256(%rsp) | |
movq $0, 264(%rsp) | |
movb $0, 272(%rsp) | |
.LEHB2: | |
call _ZNSt9basic_iosIcSt11char_traitsIcEE4initEPSt15basic_streambufIcS1_E@PLT | |
.LEHE2: | |
# Copy the output stream's formatting state into the scratch stream, then insert the
# double at cursor + 8 * %r13.
movq (%rbx), %rax | |
movq 8(%rsp), %rdi | |
movq -24(%rax), %rsi | |
addq %rbx, %rsi | |
.LEHB3: | |
call _ZNSt9basic_iosIcSt11char_traitsIcEE7copyfmtERKS2_@PLT | |
movq 40(%rsp), %rax | |
movq %r14, %rdi | |
movsd (%rax,%r13,8), %xmm0 | |
call _ZNSo9_M_insertIdEERSoT_@PLT | |
.LEHE3: | |
# Extract the formatted text into the scratch string at 128(%rsp) (initialised empty,
# data pointer -> inline buffer at 144(%rsp)). If the buffer pointer at 224(%rsp) is
# null, copy the string stored at 256(%rsp) (.L35); otherwise replace with the range
# starting at 216(%rsp) and ending at the larger of 224(%rsp) / 208(%rsp)
# (224(%rsp) alone when 208(%rsp) is null).
movq 224(%rsp), %r8 | |
leaq 128(%rsp), %rdi | |
leaq 144(%rsp), %r14 | |
movq $0, 136(%rsp) | |
movq %rdi, 48(%rsp) | |
movq %r14, 128(%rsp) | |
movb $0, 144(%rsp) | |
testq %r8, %r8 | |
je .L35 | |
movq 208(%rsp), %rax | |
movq %r8, %rdx | |
movq 216(%rsp), %rcx | |
cmpq %r8, %rax | |
cmovnb %rax, %r8 | |
testq %rax, %rax | |
cmove %rdx, %r8 | |
xorl %edx, %edx | |
xorl %esi, %esi | |
subq %rcx, %r8 | |
.LEHB4: | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_replaceEmmPKcm@PLT | |
.LEHE4: | |
.L37: | |
# width = max(width, scratch string length) using a signed compare; then free the
# scratch string's heap buffer if it is not using its inline buffer.
movq 16(%rsp), %rcx | |
movq 136(%rsp), %rax | |
movq 128(%rsp), %rdi | |
cmpq %rax, %rcx | |
cmovge %rcx, %rax | |
movq %rax, 16(%rsp) | |
cmpq %r14, %rdi | |
je .L38 | |
movq 144(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L38: | |
# Inlined stringstream destructor: reset vtable pointers, free the stringbuf's string
# if heap-allocated, destroy the locale, then the ios_base.
leaq 24+_ZTVNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movdqa 64(%rsp), %xmm2 | |
movq 256(%rsp), %rdi | |
movq %rax, 160(%rsp) | |
addq $80, %rax | |
movq %rax, 288(%rsp) | |
movq 32(%rsp), %rax | |
movaps %xmm2, 176(%rsp) | |
cmpq %rax, %rdi | |
je .L42 | |
movq 272(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L42: | |
movq 24(%rsp), %rdi | |
leaq 16+_ZTVSt15basic_streambufIcSt11char_traitsIcEE(%rip), %rax | |
addq $1, %r13 | |
movq %rax, 184(%rsp) | |
call _ZNSt6localeD1Ev@PLT | |
movq 8+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movq 8(%rsp), %rdi | |
movq 48+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rdx | |
movq 40+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rcx | |
movq -24(%rax), %rax | |
movq %rdx, 160(%rsp,%rax) | |
movq -24(%r15), %rax | |
movq %r15, 176(%rsp) | |
movq 24+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rdx | |
movq %rcx, 176(%rsp,%rax) | |
movq -24(%r12), %rax | |
movq %r12, 160(%rsp) | |
movq %rdx, 160(%rsp,%rax) | |
leaq 16+_ZTVSt9basic_iosIcSt11char_traitsIcEE(%rip), %rax | |
movq $0, 168(%rsp) | |
movq %rax, 288(%rsp) | |
call _ZNSt8ios_baseD2Ev@PLT | |
# Inner loop runs 3 times; outer loop advances the counter by 3 and the data cursor by
# 24 bytes until the counter reaches 9 (nine coefficients measured in total).
cmpq $3, %r13 | |
jne .L43 | |
addq $3, 96(%rsp) | |
movq 96(%rsp), %rax | |
addq $24, 40(%rsp) | |
cmpq $9, %rax | |
jne .L29 | |
.L28: | |
# --- (3) Output ---
# Write the string at fmt+0, then loop over three rows.
#   %r13 = row index, %r15 = width, %r12 = data pointer + 48 + 8 * row.
movq 8(%rbp), %rdx | |
movq 0(%rbp), %rsi | |
movq %rbx, %rdi | |
xorl %r13d, %r13d | |
.LEHB5: | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
movq 104(%rsp), %r12 | |
movq 16(%rsp), %r15 | |
addq $48, %r12 | |
.L52: | |
# Row start: write the string at fmt+64; if width != 0 store it at +16 of the stream's
# virtual base (NOTE(review): presumably the ios_base width field); then insert the
# row's first coefficient, at -48(%r12).
movq 72(%rbp), %rdx | |
movq 64(%rbp), %rsi | |
movq %rbx, %rdi | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
testq %r15, %r15 | |
je .L44 | |
movq (%rbx), %rax | |
movq -24(%rax), %rax | |
movq %r15, 16(%rbx,%rax) | |
.L44: | |
movsd -48(%r12), %xmm0 | |
movq %rbx, %rdi | |
leaq -48(%r12), %r14 | |
call _ZNSo9_M_insertIdEERSoT_@PLT | |
# Remaining coefficients of the row: each is preceded by the string at fmt+192 and read
# at a 24-byte stride until %r14 reaches %r12. .L48 is the variant that re-applies the
# width before every coefficient; .L45 is the width == 0 variant.
movq 200(%rbp), %rdx | |
movq 192(%rbp), %rsi | |
movq %rbx, %rdi | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
testq %r15, %r15 | |
je .L45 | |
.L48: | |
movq (%rbx), %rax | |
movsd 24(%r14), %xmm0 | |
movq %rbx, %rdi | |
addq $24, %r14 | |
movq -24(%rax), %rax | |
movq %r15, 16(%rbx,%rax) | |
call _ZNSo9_M_insertIdEERSoT_@PLT | |
cmpq %r14, %r12 | |
je .L47 | |
movq 200(%rbp), %rdx | |
movq 192(%rbp), %rsi | |
movq %rbx, %rdi | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
jmp .L48 | |
.p2align 4,,10 | |
.p2align 3 | |
.L45: | |
movsd 24(%r14), %xmm0 | |
movq %rbx, %rdi | |
addq $24, %r14 | |
call _ZNSo9_M_insertIdEERSoT_@PLT | |
cmpq %r14, %r12 | |
je .L47 | |
movq 200(%rbp), %rdx | |
movq 192(%rbp), %rsi | |
movq %rbx, %rdi | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
jmp .L45 | |
.p2align 4,,10 | |
.p2align 3 | |
.L56: | |
# Precision field was -2: override with 15 and rejoin the common path.
movq $15, 112(%rsp) | |
jmp .L27 | |
.p2align 4,,10 | |
.p2align 3 | |
.L47: | |
# Row end: write the string at fmt+96. After the third row (index 2) go to .L81;
# otherwise write the strings at fmt+128 and fmt+160 and advance to the next row.
movq 104(%rbp), %rdx | |
movq 96(%rbp), %rsi | |
movq %rbx, %rdi | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
cmpq $2, %r13 | |
je .L81 | |
movq 136(%rbp), %rdx | |
movq %rbx, %rdi | |
addq $8, %r12 | |
addq $1, %r13 | |
movq 128(%rbp), %rsi | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
movq 168(%rbp), %rdx | |
movq 160(%rbp), %rsi | |
movq %rbx, %rdi | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
.LEHE5: | |
jmp .L52 | |
.p2align 4,,10 | |
.p2align 3 | |
.L35: | |
# Width-measurement fallback: copy the string at 256(%rsp) into the scratch string
# (%rdi still holds &128(%rsp)).
leaq 256(%rsp), %rsi | |
.LEHB6: | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE9_M_assignERKS4_@PLT | |
.LEHE6: | |
jmp .L37 | |
.p2align 4,,10 | |
.p2align 3 | |
.L81: | |
# --- (4) Finish: write the string at fmt+32; if a precision override was applied,
# put the saved value (120(%rsp)) back at +8 of the stream's virtual base.
movq 40(%rbp), %rdx | |
movq 32(%rbp), %rsi | |
movq %rbx, %rdi | |
.LEHB7: | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
cmpq $0, 112(%rsp) | |
je .L51 | |
movq (%rbx), %rax | |
movq 120(%rsp), %rdx | |
movq -24(%rax), %rax | |
movq %rdx, 8(%rbx,%rax) | |
.L51: | |
# Canary check, then normal epilogue returning the stream in %rax.
movq 552(%rsp), %rax | |
subq %fs:40, %rax | |
jne .L77 | |
addq $568, %rsp | |
.cfi_remember_state | |
.cfi_def_cfa_offset 56 | |
movq %rbx, %rax | |
popq %rbx | |
.cfi_def_cfa_offset 48 | |
popq %rbp | |
.cfi_def_cfa_offset 40 | |
popq %r12 | |
.cfi_def_cfa_offset 32 | |
popq %r13 | |
.cfi_def_cfa_offset 24 | |
popq %r14 | |
.cfi_def_cfa_offset 16 | |
popq %r15 | |
.cfi_def_cfa_offset 8 | |
ret | |
.p2align 4,,10 | |
.p2align 3 | |
.L55: | |
# Precision field was -1: no override. Repeats the flag test from .L26.
.cfi_restore_state | |
movq $0, 112(%rsp) | |
movq $0, 120(%rsp) | |
testb $1, 228(%rbp) | |
je .L82 | |
.L58: | |
# Width measurement skipped: width = 0.
movq $0, 16(%rsp) | |
jmp .L28 | |
# --- (5) Exception clean-up paths. Each landing pad (.L59-.L63) moves the exception
# object from %rax into %rbx and jumps to the clean-up matching how far construction
# of the scratch stringstream / string had progressed; all end in _Unwind_Resume
# (.L53) after the canary check.
.L40: | |
# Dispose the scratch string, then fall through to destroy the whole stringstream.
movq 48(%rsp), %rdi | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
.L41: | |
movq 56(%rsp), %rdi | |
call _ZNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEED1Ev@PLT | |
movq 552(%rsp), %rax | |
subq %fs:40, %rax | |
je .L53 | |
.L77: | |
# Shared stack-protector failure target.
call __stack_chk_fail@PLT | |
.L60: | |
endbr64 | |
movq %rax, %rbx | |
jmp .L32 | |
.L62: | |
endbr64 | |
movq %rax, %rbx | |
jmp .L31 | |
.L59: | |
endbr64 | |
movq %rax, %rbx | |
jmp .L41 | |
.L61: | |
endbr64 | |
movq %rax, %rbx | |
jmp .L33 | |
.L63: | |
endbr64 | |
movq %rax, %rbx | |
jmp .L40 | |
.L33: | |
# Partial teardown when the third basic_ios::init threw: dispose the stringbuf's
# string, destroy the locale, reset the vtable pointers.
leaq 16+_ZTVNSt7__cxx1115basic_stringbufIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
leaq 256(%rsp), %rdi | |
movq %rax, 184(%rsp) | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
movq 24(%rsp), %rdi | |
leaq 16+_ZTVSt15basic_streambufIcSt11char_traitsIcEE(%rip), %rax | |
movq %rax, 184(%rsp) | |
call _ZNSt6localeD1Ev@PLT | |
movq 8+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movq 48+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rdx | |
movq -24(%rax), %rax | |
movq %rdx, 160(%rsp,%rax) | |
movq -24(%r15), %rax | |
movq 40+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rdx | |
movq %r15, 176(%rsp) | |
movq %rdx, 176(%rsp,%rax) | |
.L79: | |
movq -24(%r12), %rax | |
movq 24+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rdx | |
movq %r12, 160(%rsp) | |
movq %rdx, 160(%rsp,%rax) | |
xorl %eax, %eax | |
movq %rax, 168(%rsp) | |
.L32: | |
# Destroy the ios_base part, check the canary, resume unwinding.
movq 8(%rsp), %rdi | |
leaq 16+_ZTVSt9basic_iosIcSt11char_traitsIcEE(%rip), %rax | |
movq %rax, 288(%rsp) | |
call _ZNSt8ios_baseD2Ev@PLT | |
movq 552(%rsp), %rax | |
subq %fs:40, %rax | |
jne .L77 | |
.L53: | |
movq %rbx, %rdi | |
call _Unwind_Resume@PLT | |
.LEHE7: | |
.L31: | |
jmp .L79 | |
.cfi_endproc | |
.LFE10067: | |
.globl __gxx_personality_v0 | |
# LSDA call-site table: one entry per .LEHBn/.LEHEn region giving
# (start, length, landing pad, action). A landing pad of 0 means the region has no
# local clean-up (regions 5 and 7, where no scratch objects are alive).
.section .gcc_except_table._ZN5Eigen8internal12print_matrixINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS4_RKT_RKNS_8IOFormatE,"aG",@progbits,_ZN5Eigen8internal12print_matrixINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS4_RKT_RKNS_8IOFormatE,comdat | |
.LLSDA10067: | |
.byte 0xff | |
.byte 0xff | |
.byte 0x1 | |
.uleb128 .LLSDACSE10067-.LLSDACSB10067 | |
.LLSDACSB10067: | |
.uleb128 .LEHB0-.LFB10067 | |
.uleb128 .LEHE0-.LEHB0 | |
.uleb128 .L60-.LFB10067 | |
.uleb128 0 | |
.uleb128 .LEHB1-.LFB10067 | |
.uleb128 .LEHE1-.LEHB1 | |
.uleb128 .L62-.LFB10067 | |
.uleb128 0 | |
.uleb128 .LEHB2-.LFB10067 | |
.uleb128 .LEHE2-.LEHB2 | |
.uleb128 .L61-.LFB10067 | |
.uleb128 0 | |
.uleb128 .LEHB3-.LFB10067 | |
.uleb128 .LEHE3-.LEHB3 | |
.uleb128 .L59-.LFB10067 | |
.uleb128 0 | |
.uleb128 .LEHB4-.LFB10067 | |
.uleb128 .LEHE4-.LEHB4 | |
.uleb128 .L63-.LFB10067 | |
.uleb128 0 | |
.uleb128 .LEHB5-.LFB10067 | |
.uleb128 .LEHE5-.LEHB5 | |
.uleb128 0 | |
.uleb128 0 | |
.uleb128 .LEHB6-.LFB10067 | |
.uleb128 .LEHE6-.LEHB6 | |
.uleb128 .L63-.LFB10067 | |
.uleb128 0 | |
.uleb128 .LEHB7-.LFB10067 | |
.uleb128 .LEHE7-.LEHB7 | |
.uleb128 0 | |
.uleb128 0 | |
.LLSDACSE10067: | |
.section .text._ZN5Eigen8internal12print_matrixINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS4_RKT_RKNS_8IOFormatE,"axG",@progbits,_ZN5Eigen8internal12print_matrixINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS4_RKT_RKNS_8IOFormatE,comdat | |
.size _ZN5Eigen8internal12print_matrixINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS4_RKT_RKNS_8IOFormatE, .-_ZN5Eigen8internal12print_matrixINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS4_RKT_RKNS_8IOFormatE | |
# Eigen::operator<< <Eigen::Matrix<double,3,3,0,3,3>>(std::ostream&, const DenseBase<...>&)
# -- weak COMDAT copy.
# In:  %rdi = output stream, %rsi = matrix; both are passed through untouched to
#      print_matrix.
# Out: %rax = the stream returned by print_matrix.
# Frame: 504 bytes of locals; stack-protector canary at 488(%rsp).
# Builds thirteen string slots on the stack (pointer, length, inline buffer):
#   six temporaries at 64, 96, 128, 160, 192, 224(%rsp), and
#   seven inside a 232-byte format object at 256(%rsp) (slots at +0 .. +192, plus an
#   8-byte value at +224 loaded from .LC11).
# It then calls print_matrix(stream, matrix, &object at 256(%rsp)) and frees any slot
# whose data pointer no longer points at its own inline buffer.
# NOTE(review): .LC9, .LC10 and .LC11 are defined outside this chunk. .LC9/.LC10 are
# two-byte values used as the contents of the length-1 strings; .LC11 fills the fields
# that print_matrix reads at +224 (32-bit) and +228 (flag byte).
.section .text._ZN5EigenlsINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS3_RKNS_9DenseBaseIT_EE,"axG",@progbits,_ZN5EigenlsINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS3_RKNS_9DenseBaseIT_EE,comdat | |
.p2align 4 | |
.weak _ZN5EigenlsINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS3_RKNS_9DenseBaseIT_EE | |
.type _ZN5EigenlsINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS3_RKNS_9DenseBaseIT_EE, @function | |
_ZN5EigenlsINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS3_RKNS_9DenseBaseIT_EE: | |
.LFB9796: | |
.cfi_startproc | |
.cfi_personality 0x9b,DW.ref.__gxx_personality_v0 | |
.cfi_lsda 0x1b,.LLSDA9796 | |
endbr64 | |
pushq %r15 | |
.cfi_def_cfa_offset 16 | |
.cfi_offset 15, -16 | |
pushq %r14 | |
.cfi_def_cfa_offset 24 | |
.cfi_offset 14, -24 | |
pushq %r13 | |
.cfi_def_cfa_offset 32 | |
.cfi_offset 13, -32 | |
pushq %r12 | |
.cfi_def_cfa_offset 40 | |
.cfi_offset 12, -40 | |
pushq %rbp | |
.cfi_def_cfa_offset 48 | |
.cfi_offset 6, -48 | |
pushq %rbx | |
.cfi_def_cfa_offset 56 | |
.cfi_offset 3, -56 | |
subq $504, %rsp | |
.cfi_def_cfa_offset 560 | |
movzwl .LC9(%rip), %edx | |
movq %fs:40, %rax | |
movq %rax, 488(%rsp) | |
xorl %eax, %eax | |
# Initialise the six temporary strings. The address of each inline buffer is kept
# (in a stack slot at 0..56(%rsp)) so the clean-up code can tell whether a string
# still uses its inline storage. Lengths: 0 for the slots at 128..224, 1 for 64 and 96.
leaq 240(%rsp), %rax | |
movq $0, 232(%rsp) | |
leaq 272(%rsp), %rcx | |
movq %rax, 24(%rsp) | |
leaq 256(%rsp), %rbx | |
leaq 336(%rsp), %rbp | |
movq %rax, 224(%rsp) | |
leaq 208(%rsp), %rax | |
leaq 368(%rsp), %r12 | |
movq %rax, (%rsp) | |
leaq 400(%rsp), %r13 | |
leaq 432(%rsp), %r14 | |
movq %rax, 192(%rsp) | |
leaq 176(%rsp), %rax | |
leaq 464(%rsp), %r15 | |
movq %rax, 40(%rsp) | |
movq %rax, 160(%rsp) | |
leaq 144(%rsp), %rax | |
movq %rax, 16(%rsp) | |
movq %rax, 128(%rsp) | |
leaq 112(%rsp), %rax | |
movq %rax, 56(%rsp) | |
movq %rax, 96(%rsp) | |
leaq 80(%rsp), %rax | |
movw %dx, 112(%rsp) | |
movq %rax, 32(%rsp) | |
movq %rax, 64(%rsp) | |
movb $0, 240(%rsp) | |
movq $0, 200(%rsp) | |
movb $0, 208(%rsp) | |
movq $0, 168(%rsp) | |
movb $0, 176(%rsp) | |
movq $0, 136(%rsp) | |
movb $0, 144(%rsp) | |
movq $1, 104(%rsp) | |
movq $1, 72(%rsp) | |
movzwl .LC10(%rip), %eax | |
movq %rcx, 48(%rsp) | |
movw %ax, 80(%rsp) | |
# Initialise the format object at 256(%rsp) (address in %rbx, passed as 3rd argument):
#   +0, +32, +64, +96, +160 : empty strings
#   +128 : length-1 string with the .LC9 bytes
#   +192 : length-1 string with the .LC10 bytes
#   +224 : 8 bytes from .LC11
# Inline-buffer addresses for +64..+192 stay in %rbp, %r12, %r13, %r14, %r15.
movw %ax, 464(%rsp) | |
movq .LC11(%rip), %rax | |
movq %rcx, 256(%rsp) | |
leaq 304(%rsp), %rcx | |
movw %dx, 400(%rsp) | |
movq %rbx, %rdx | |
movq $0, 264(%rsp) | |
movb $0, 272(%rsp) | |
movq %rcx, 8(%rsp) | |
movq %rcx, 288(%rsp) | |
movq $0, 296(%rsp) | |
movb $0, 304(%rsp) | |
movq %rbp, 320(%rsp) | |
movq $0, 328(%rsp) | |
movb $0, 336(%rsp) | |
movq %r12, 352(%rsp) | |
movq $0, 360(%rsp) | |
movb $0, 368(%rsp) | |
movq %r13, 384(%rsp) | |
movq $1, 392(%rsp) | |
movq %r14, 416(%rsp) | |
movq $0, 424(%rsp) | |
movb $0, 432(%rsp) | |
movq %r15, 448(%rsp) | |
movq $1, 456(%rsp) | |
movq %rax, 480(%rsp) | |
.LEHB8: | |
call _ZN5Eigen8internal12print_matrixINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS4_RKT_RKNS_8IOFormatE | |
.LEHE8: | |
# Normal path: keep the returned stream in %rbx, then release the format object's
# seven strings (offsets 448 down to 256) followed by the six temporaries
# (64 up to 224). Each is freed with operator delete(ptr, capacity + 1) only when its
# data pointer differs from its inline-buffer address.
movq 448(%rsp), %rdi | |
movq %rax, %rbx | |
cmpq %r15, %rdi | |
je .L84 | |
movq 464(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L84: | |
movq 416(%rsp), %rdi | |
cmpq %r14, %rdi | |
je .L85 | |
movq 432(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L85: | |
movq 384(%rsp), %rdi | |
cmpq %r13, %rdi | |
je .L86 | |
movq 400(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L86: | |
movq 352(%rsp), %rdi | |
cmpq %r12, %rdi | |
je .L87 | |
movq 368(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L87: | |
movq 320(%rsp), %rdi | |
cmpq %rbp, %rdi | |
je .L88 | |
movq 336(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L88: | |
movq 288(%rsp), %rdi | |
movq 8(%rsp), %rax | |
cmpq %rax, %rdi | |
je .L89 | |
movq 304(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L89: | |
movq 256(%rsp), %rdi | |
movq 48(%rsp), %rax | |
cmpq %rax, %rdi | |
je .L90 | |
movq 272(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L90: | |
# Temporaries.
movq 64(%rsp), %rdi | |
movq 32(%rsp), %rax | |
cmpq %rax, %rdi | |
je .L91 | |
movq 80(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L91: | |
movq 96(%rsp), %rdi | |
movq 56(%rsp), %rax | |
cmpq %rax, %rdi | |
je .L92 | |
movq 112(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L92: | |
movq 128(%rsp), %rdi | |
movq 16(%rsp), %rax | |
cmpq %rax, %rdi | |
je .L93 | |
movq 144(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L93: | |
movq 160(%rsp), %rdi | |
movq 40(%rsp), %rax | |
cmpq %rax, %rdi | |
je .L94 | |
movq 176(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L94: | |
movq 192(%rsp), %rdi | |
movq (%rsp), %rax | |
cmpq %rax, %rdi | |
je .L95 | |
movq 208(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L95: | |
movq 224(%rsp), %rdi | |
movq 24(%rsp), %rax | |
cmpq %rax, %rdi | |
je .L83 | |
movq 240(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L83: | |
# Canary check, then return the stream.
movq 488(%rsp), %rax | |
subq %fs:40, %rax | |
jne .L102 | |
addq $504, %rsp | |
.cfi_remember_state | |
.cfi_def_cfa_offset 56 | |
movq %rbx, %rax | |
popq %rbx | |
.cfi_def_cfa_offset 48 | |
popq %rbp | |
.cfi_def_cfa_offset 40 | |
popq %r12 | |
.cfi_def_cfa_offset 32 | |
popq %r13 | |
.cfi_def_cfa_offset 24 | |
popq %r14 | |
.cfi_def_cfa_offset 16 | |
popq %r15 | |
.cfi_def_cfa_offset 8 | |
ret | |
.L97: | |
# Exception clean-up (reached from landing pad .L100). %rbx still holds the address of
# the format object here because the "movq %rax, %rbx" after the call is skipped when
# print_matrix throws. Destroy the format object, dispose the six temporaries, check
# the canary, then resume unwinding with the exception saved in %rbp.
.cfi_restore_state | |
movq %rbx, %rdi | |
call _ZN5Eigen8IOFormatD1Ev | |
leaq 64(%rsp), %rdi | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
leaq 96(%rsp), %rdi | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
leaq 128(%rsp), %rdi | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
leaq 160(%rsp), %rdi | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
leaq 192(%rsp), %rdi | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
leaq 224(%rsp), %rdi | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
movq 488(%rsp), %rax | |
subq %fs:40, %rax | |
je .L98 | |
.L102: | |
# Shared stack-protector failure target.
call __stack_chk_fail@PLT | |
.L100: | |
# Landing pad for the print_matrix call: stash the exception object in %rbp.
endbr64 | |
movq %rax, %rbp | |
jmp .L97 | |
.L98: | |
movq %rbp, %rdi | |
.LEHB9: | |
call _Unwind_Resume@PLT | |
.LEHE9: | |
.cfi_endproc | |
.LFE9796: | |
# LSDA call-site table: region 8 (the print_matrix call) unwinds through .L100;
# region 9 (_Unwind_Resume) has no landing pad.
.section .gcc_except_table._ZN5EigenlsINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS3_RKNS_9DenseBaseIT_EE,"aG",@progbits,_ZN5EigenlsINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS3_RKNS_9DenseBaseIT_EE,comdat | |
.LLSDA9796: | |
.byte 0xff | |
.byte 0xff | |
.byte 0x1 | |
.uleb128 .LLSDACSE9796-.LLSDACSB9796 | |
.LLSDACSB9796: | |
.uleb128 .LEHB8-.LFB9796 | |
.uleb128 .LEHE8-.LEHB8 | |
.uleb128 .L100-.LFB9796 | |
.uleb128 0 | |
.uleb128 .LEHB9-.LFB9796 | |
.uleb128 .LEHE9-.LEHB9 | |
.uleb128 0 | |
.uleb128 0 | |
.LLSDACSE9796: | |
.section .text._ZN5EigenlsINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS3_RKNS_9DenseBaseIT_EE,"axG",@progbits,_ZN5EigenlsINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS3_RKNS_9DenseBaseIT_EE,comdat | |
.size _ZN5EigenlsINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS3_RKNS_9DenseBaseIT_EE, .-_ZN5EigenlsINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS3_RKNS_9DenseBaseIT_EE | |
.section .rodata.str1.1,"aMS",@progbits,1 | |
.LC13: | |
.string "Matrix3d: " | |
.LC14: | |
.string " microseconds" | |
.text | |
.p2align 4 | |
.globl _Z33benchmark_matrix3d_multiplicationRKSt6vectorIN5Eigen6MatrixIdLi3ELi3ELi0ELi3ELi3EEESaIS2_EE | |
.type _Z33benchmark_matrix3d_multiplicationRKSt6vectorIN5Eigen6MatrixIdLi3ELi3ELi0ELi3ELi3EEESaIS2_EE, @function | |
_Z33benchmark_matrix3d_multiplicationRKSt6vectorIN5Eigen6MatrixIdLi3ELi3ELi0ELi3ELi3EEESaIS2_EE: | |
.LFB9384: | |
.cfi_startproc | |
endbr64 | |
pushq %r12 | |
.cfi_def_cfa_offset 16 | |
.cfi_offset 12, -16 | |
pushq %rbp | |
.cfi_def_cfa_offset 24 | |
.cfi_offset 6, -24 | |
pushq %rbx | |
.cfi_def_cfa_offset 32 | |
.cfi_offset 3, -32 | |
movq %rdi, %rbx | |
subq $160, %rsp | |
.cfi_def_cfa_offset 192 | |
movq %fs:40, %rax | |
movq %rax, 152(%rsp) | |
xorl %eax, %eax | |
call _ZNSt6chrono3_V212system_clock3nowEv@PLT | |
pxor %xmm0, %xmm0 | |
xorl %ecx, %ecx | |
xorl %edx, %edx | |
movq .LC12(%rip), %xmm1 | |
movq %rax, %rbp | |
movaps %xmm0, 16(%rsp) | |
movq .LC3(%rip), %rax | |
movabsq $-8198552921648689607, %rsi | |
movaps %xmm0, 48(%rsp) | |
movq %rax, 64(%rsp) | |
movq (%rbx), %rax | |
movaps %xmm1, (%rsp) | |
movaps %xmm1, 32(%rsp) | |
cmpq %rax, 8(%rbx) | |
je .L107 | |
.p2align 4,,10 | |
.p2align 3 | |
.L104: | |
#APP | |
# 13 "tmp.cpp" 1 | |
# 3dmat mult start | |
# 0 "" 2 | |
#NO_APP | |
movq (%rbx), %rax | |
movsd 64(%rsp), %xmm1 | |
movsd 40(%rsp), %xmm5 | |
movsd 16(%rsp), %xmm4 | |
addq %rcx, %rax | |
movupd 24(%rsp), %xmm7 | |
movapd (%rsp), %xmm8 | |
movsd 8(%rax), %xmm0 | |
movsd 16(%rax), %xmm3 | |
movsd (%rax), %xmm9 | |
movsd 24(%rax), %xmm11 | |
movapd %xmm3, %xmm2 | |
movapd %xmm0, %xmm10 | |
movsd 32(%rax), %xmm12 | |
unpcklpd %xmm0, %xmm0 | |
mulsd %xmm5, %xmm10 | |
movapd 48(%rsp), %xmm6 | |
unpcklpd %xmm3, %xmm3 | |
mulsd %xmm1, %xmm2 | |
movapd %xmm12, %xmm13 | |
mulpd %xmm7, %xmm0 | |
unpcklpd %xmm13, %xmm13 | |
mulpd %xmm7, %xmm13 | |
mulsd %xmm5, %xmm12 | |
mulpd %xmm6, %xmm3 | |
addsd %xmm10, %xmm2 | |
movapd %xmm9, %xmm10 | |
unpcklpd %xmm9, %xmm9 | |
mulsd %xmm4, %xmm10 | |
mulpd %xmm8, %xmm9 | |
addsd %xmm10, %xmm2 | |
movapd %xmm11, %xmm10 | |
mulsd %xmm4, %xmm11 | |
unpcklpd %xmm10, %xmm10 | |
addpd %xmm9, %xmm0 | |
mulpd %xmm8, %xmm10 | |
movsd %xmm2, 96(%rsp) | |
movsd 40(%rax), %xmm2 | |
addpd %xmm3, %xmm0 | |
addpd %xmm13, %xmm10 | |
movapd %xmm2, %xmm13 | |
movaps %xmm0, (%rsp) | |
mulsd %xmm1, %xmm2 | |
unpcklpd %xmm13, %xmm13 | |
mulpd %xmm6, %xmm13 | |
addsd %xmm12, %xmm2 | |
addpd %xmm13, %xmm10 | |
addsd %xmm11, %xmm2 | |
movsd 64(%rax), %xmm11 | |
movups %xmm10, 104(%rsp) | |
movsd 56(%rax), %xmm10 | |
movapd 96(%rsp), %xmm0 | |
mulsd %xmm11, %xmm1 | |
movsd %xmm2, 120(%rsp) | |
movsd 48(%rax), %xmm2 | |
movapd 112(%rsp), %xmm3 | |
mulsd %xmm10, %xmm5 | |
movaps %xmm0, 16(%rsp) | |
movaps %xmm3, 32(%rsp) | |
movapd %xmm2, %xmm0 | |
movapd %xmm10, %xmm3 | |
mulsd %xmm2, %xmm4 | |
unpcklpd %xmm0, %xmm0 | |
unpcklpd %xmm3, %xmm3 | |
mulpd %xmm7, %xmm3 | |
mulpd %xmm8, %xmm0 | |
addsd %xmm5, %xmm1 | |
addsd %xmm4, %xmm1 | |
addpd %xmm3, %xmm0 | |
movapd %xmm11, %xmm3 | |
unpcklpd %xmm3, %xmm3 | |
movsd %xmm1, 64(%rsp) | |
mulpd %xmm6, %xmm3 | |
addpd %xmm3, %xmm0 | |
movaps %xmm0, 48(%rsp) | |
#APP | |
# 15 "tmp.cpp" 1 | |
# 3dmat mult end | |
# 0 "" 2 | |
#NO_APP | |
movq 8(%rbx), %rax | |
subq (%rbx), %rax | |
addq $1, %rdx | |
addq $72, %rcx | |
sarq $3, %rax | |
imulq %rsi, %rax | |
cmpq %rax, %rdx | |
jb .L104 | |
.L107: | |
call _ZNSt6chrono3_V212system_clock3nowEv@PLT | |
leaq _ZSt4cout(%rip), %r12 | |
movabsq $2361183241434822607, %rdx | |
leaq .LC13(%rip), %rsi | |
subq %rbp, %rax | |
movq %r12, %rdi | |
movq %rax, %rcx | |
imulq %rdx | |
sarq $63, %rcx | |
sarq $7, %rdx | |
subq %rcx, %rdx | |
movq %rdx, %rbx | |
movl $10, %edx | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
movq %rbx, %rsi | |
movq %r12, %rdi | |
call _ZNSo9_M_insertIlEERSoT_@PLT | |
movl $13, %edx | |
leaq .LC14(%rip), %rsi | |
movq %rax, %rbx | |
movq %rax, %rdi | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
movq (%rbx), %rax | |
movq -24(%rax), %rax | |
movq 240(%rbx,%rax), %rbp | |
testq %rbp, %rbp | |
je .L105 | |
cmpb $0, 56(%rbp) | |
je .L109 | |
movsbl 67(%rbp), %esi | |
.L110: | |
movq %rbx, %rdi | |
call _ZNSo3putEc@PLT | |
movq %rax, %rdi | |
call _ZNSo5flushEv@PLT | |
movq %rsp, %rsi | |
movq %r12, %rdi | |
call _ZN5EigenlsINS_6MatrixIdLi3ELi3ELi0ELi3ELi3EEEEERSoS3_RKNS_9DenseBaseIT_EE | |
movq %rax, %rbx | |
movq (%rax), %rax | |
movq -24(%rax), %rax | |
movq 240(%rbx,%rax), %rbp | |
testq %rbp, %rbp | |
je .L105 | |
cmpb $0, 56(%rbp) | |
je .L111 | |
movsbl 67(%rbp), %esi | |
.L112: | |
movq %rbx, %rdi | |
call _ZNSo3putEc@PLT | |
movq %rax, %rdi | |
movq 152(%rsp), %rax | |
subq %fs:40, %rax | |
jne .L129 | |
addq $160, %rsp | |
.cfi_remember_state | |
.cfi_def_cfa_offset 32 | |
popq %rbx | |
.cfi_def_cfa_offset 24 | |
popq %rbp | |
.cfi_def_cfa_offset 16 | |
popq %r12 | |
.cfi_def_cfa_offset 8 | |
jmp _ZNSo5flushEv@PLT | |
.p2align 4,,10 | |
.p2align 3 | |
.L109: | |
.cfi_restore_state | |
movq %rbp, %rdi | |
call _ZNKSt5ctypeIcE13_M_widen_initEv@PLT | |
movq 0(%rbp), %rax | |
movl $10, %esi | |
leaq _ZNKSt5ctypeIcE8do_widenEc(%rip), %rdx | |
movq 48(%rax), %rax | |
cmpq %rdx, %rax | |
je .L110 | |
movq %rbp, %rdi | |
call *%rax | |
movsbl %al, %esi | |
jmp .L110 | |
.p2align 4,,10 | |
.p2align 3 | |
.L111: | |
movq %rbp, %rdi | |
call _ZNKSt5ctypeIcE13_M_widen_initEv@PLT | |
movq 0(%rbp), %rax | |
movl $10, %esi | |
leaq _ZNKSt5ctypeIcE8do_widenEc(%rip), %rdx | |
movq 48(%rax), %rax | |
cmpq %rdx, %rax | |
je .L112 | |
movq %rbp, %rdi | |
call *%rax | |
movsbl %al, %esi | |
jmp .L112 | |
.L129: | |
call __stack_chk_fail@PLT | |
.L105: | |
movq 152(%rsp), %rax | |
subq %fs:40, %rax | |
jne .L129 | |
call _ZSt16__throw_bad_castv@PLT | |
.cfi_endproc | |
.LFE9384: | |
.size _Z33benchmark_matrix3d_multiplicationRKSt6vectorIN5Eigen6MatrixIdLi3ELi3ELi0ELi3ELi3EEESaIS2_EE, .-_Z33benchmark_matrix3d_multiplicationRKSt6vectorIN5Eigen6MatrixIdLi3ELi3ELi0ELi3ELi3EEESaIS2_EE | |
# ---------------------------------------------------------------------------
# Eigen::internal::print_matrix<Eigen::Matrix<double,4,4,0,4,4>>
#   Demangled signature:
#     std::ostream& print_matrix(std::ostream&,
#                                const Eigen::Matrix<double,4,4,0,4,4>&,
#                                const Eigen::IOFormat&)
#   Compiler-generated code, AT&T syntax, x86-64 System V ABI, weak COMDAT.
#
# In:    rdi = output stream, rsi = matrix (16 doubles), rdx = IOFormat
# Out:   rax = the stream that was passed in rdi
# Regs:  rbx = stream and rbp = IOFormat for the whole function body.
#
# Flow:
#   (a) Read the signed 32-bit field at IOFormat+224. The value -1 means
#       "leave the stream alone", -2 is replaced by 15, any other non-zero
#       value is used as is. A non-zero result is swapped into the 8-byte
#       field at offset 8 of the stream's virtual-base state and the old
#       value is remembered for the restore in .L181.
#   (b) Unless bit 0 of the byte at IOFormat+228 is set, every one of the
#       16 coefficients is formatted into a temporary std::stringstream and
#       the longest resulting text length is kept in 16(%rsp).
#   (c) The matrix is written row by row, interleaved with the strings
#       stored inside the IOFormat object.
#
# Frame slots (offsets from rsp after the 568-byte allocation):
#   Slot   8  (b) address of 288(%rsp), handed to the ios_base ctor/dtor
#             (c) row counter, 0..3
#   Slot  16  longest coefficient text seen in (b); used as width in (c)
#   Slot  24  address of 240(%rsp), handed to the std::locale ctor/dtor
#   Slot  32  address of 272(%rsp), compared with 256(%rsp) before freeing
#   Slot  40  pointer to the group of four doubles currently being measured
#   Slot  48  address of 128(%rsp), the temporary std::string
#   Slot  56  address of 160(%rsp), the temporary std::stringstream
#   Slot  64 / 80  two 16-byte constants built in .L182
#   Slot  96  outer loop counter of (b), stepped by 4 up to 16
#   Slot 104  value chosen in (a); 0 means nothing has to be restored
#   Slot 112  matrix pointer (incoming rsi)
#   Slot 120  previous value of the stream field replaced in (a)
#   Slot 552  stack-protector canary
#
# NOTE(review): the IOFormat member names mentioned below (precision, flags,
# matPrefix, rowPrefix, ...) and the libstdc++ member names (precision,
# width, pptr, ...) are inferred from the Eigen / libstdc++ headers, not from
# anything visible in this listing -- confirm against the versions in use.
# ---------------------------------------------------------------------------
.section .text._ZN5Eigen8internal12print_matrixINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS4_RKT_RKNS_8IOFormatE,"axG",@progbits,_ZN5Eigen8internal12print_matrixINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS4_RKT_RKNS_8IOFormatE,comdat | |
.p2align 4 | |
.weak _ZN5Eigen8internal12print_matrixINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS4_RKT_RKNS_8IOFormatE | |
.type _ZN5Eigen8internal12print_matrixINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS4_RKT_RKNS_8IOFormatE, @function | |
_ZN5Eigen8internal12print_matrixINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS4_RKT_RKNS_8IOFormatE: | |
.LFB10091: | |
.cfi_startproc | |
.cfi_personality 0x9b,DW.ref.__gxx_personality_v0 | |
.cfi_lsda 0x1b,.LLSDA10091 | |
endbr64 | |
# Prologue: save all six callee-saved registers, then reserve 568 bytes.
pushq %r15 | |
.cfi_def_cfa_offset 16 | |
.cfi_offset 15, -16 | |
pushq %r14 | |
.cfi_def_cfa_offset 24 | |
.cfi_offset 14, -24 | |
pushq %r13 | |
.cfi_def_cfa_offset 32 | |
.cfi_offset 13, -32 | |
pushq %r12 | |
.cfi_def_cfa_offset 40 | |
.cfi_offset 12, -40 | |
pushq %rbp | |
.cfi_def_cfa_offset 48 | |
.cfi_offset 6, -48 | |
# rbp = IOFormat (third argument)
movq %rdx, %rbp | |
pushq %rbx | |
.cfi_def_cfa_offset 56 | |
.cfi_offset 3, -56 | |
# rbx = output stream (first argument)
movq %rdi, %rbx | |
subq $568, %rsp | |
.cfi_def_cfa_offset 624 | |
# Slot 112 = matrix pointer (second argument)
movq %rsi, 112(%rsp) | |
# Install the stack-protector canary in slot 552.
movq %fs:40, %rax | |
movq %rax, 552(%rsp) | |
xorl %eax, %eax | |
# Phase (a): sign-extended 32-bit field at IOFormat+224
# (presumably IOFormat::precision; -1 / -2 would then be Eigen's
# StreamPrecision / FullPrecision -- confirm).
movslq 224(%rdx), %rax | |
cmpl $-1, %eax | |
je .L159 | |
cmpl $-2, %eax | |
je .L160 | |
movq %rax, 104(%rsp) | |
movq $0, 120(%rsp) | |
# A value of 0 skips the swap below.
testq %rax, %rax | |
je .L131 | |
.L132: | |
# rax = rbx + (offset stored 24 bytes before the stream's vtable); this is
# how the virtual-base part of the stream is located. The 8-byte field at
# offset 8 of that part (presumably ios_base precision) is saved in slot 120
# and overwritten with slot 104.
movq (%rbx), %rax | |
movq -24(%rax), %rdx | |
addq %rbx, %rdx | |
movq %rdx, %rax | |
movq 8(%rdx), %rdx | |
movq %rdx, 120(%rsp) | |
movq 104(%rsp), %rdx | |
movq %rdx, 8(%rax) | |
.L131: | |
# Bit 0 of IOFormat+228 set (presumably the DontAlignCols flag): skip the
# measuring pass and print with width 0 (see .L162).
testb $1, 228(%rbp) | |
jne .L162 | |
.L182: | |
# Phase (b) setup. r12 and r13 cache two entries of the stringstream VTT for
# the whole loop. Slots 64 and 80 receive 16-byte constants whose low half
# is the stringstream vtable address + 64 and whose high half comes from
# .LC7 / .LC8 (contents not visible in this chunk).
leaq 64+_ZTVNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movq 16+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %r12 | |
movq $0, 96(%rsp) | |
movq %rax, %xmm0 | |
movq 112(%rsp), %rax | |
movq $0, 16(%rsp) | |
movdqa %xmm0, %xmm3 | |
movdqa %xmm0, %xmm4 | |
movq 32+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %r13 | |
movq %rax, 40(%rsp) | |
leaq 160(%rsp), %rax | |
movhps .LC7(%rip), %xmm3 | |
movhps .LC8(%rip), %xmm4 | |
movq %rax, 56(%rsp) | |
leaq 288(%rsp), %rax | |
movq %rax, 8(%rsp) | |
movaps %xmm3, 64(%rsp) | |
movaps %xmm4, 80(%rsp) | |
.L134: | |
# Outer loop: one pass per group of four consecutive doubles.
# r15 = index inside the current group.
xorl %r15d, %r15d | |
.L148: | |
# Inner loop body. A std::stringstream is constructed in place at
# 160(%rsp); the constructor is expanded inline, so the vtable pointers are
# stored by hand around the three basic_ios::init calls.
movq 8(%rsp), %rdi | |
call _ZNSt8ios_baseC2Ev@PLT | |
leaq 16+_ZTVSt9basic_iosIcSt11char_traitsIcEE(%rip), %rax | |
xorl %edx, %edx | |
xorl %esi, %esi | |
pxor %xmm0, %xmm0 | |
movw %dx, 512(%rsp) | |
movq 24+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rcx | |
movups %xmm0, 520(%rsp) | |
movups %xmm0, 536(%rsp) | |
movq %rax, 288(%rsp) | |
movq -24(%r12), %rax | |
movq $0, 504(%rsp) | |
movq %r12, 160(%rsp) | |
movq %rcx, 160(%rsp,%rax) | |
movq 56(%rsp), %rax | |
movq $0, 168(%rsp) | |
addq -24(%r12), %rax | |
movq %rax, %rdi | |
# .LEHBnn / .LEHEnn bracket the calls that may throw; each pair is one entry
# of the call-site table in .LLSDA10091 further down.
.LEHB10: | |
call _ZNSt9basic_iosIcSt11char_traitsIcEE4initEPSt15basic_streambufIcS1_E@PLT | |
.LEHE10: | |
movq -24(%r13), %rax | |
# r14 = address of 176(%rsp); it is the stream object handed to the double
# inserter below.
leaq 176(%rsp), %r14 | |
movq %r13, 176(%rsp) | |
xorl %esi, %esi | |
addq %r14, %rax | |
movq %rax, %rdi | |
movq 40+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movq %rax, (%rdi) | |
.LEHB11: | |
call _ZNSt9basic_iosIcSt11char_traitsIcEE4initEPSt15basic_streambufIcS1_E@PLT | |
.LEHE11: | |
movq 8+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movq 48+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rdx | |
pxor %xmm0, %xmm0 | |
movdqa 80(%rsp), %xmm1 | |
movq -24(%rax), %rax | |
movq %rdx, 160(%rsp,%rax) | |
leaq 24+_ZTVNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movq %rax, 160(%rsp) | |
addq $80, %rax | |
movq %rax, 288(%rsp) | |
leaq 240(%rsp), %rax | |
movq %rax, %rdi | |
movq %rax, 24(%rsp) | |
# The constant from slot 80 goes to 176(%rsp); 192..239(%rsp) are zeroed.
movaps %xmm1, 176(%rsp) | |
movaps %xmm0, 192(%rsp) | |
movaps %xmm0, 208(%rsp) | |
movaps %xmm0, 224(%rsp) | |
call _ZNSt6localeC1Ev@PLT | |
# The buffer object at 184(%rsp) becomes a basic_stringbuf; its embedded
# string at 256(%rsp) starts empty and points at its own storage at 272(%rsp).
leaq 16+_ZTVNSt7__cxx1115basic_stringbufIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movq 8(%rsp), %rdi | |
leaq 184(%rsp), %rsi | |
movq %rax, 184(%rsp) | |
leaq 272(%rsp), %rax | |
# Constant 24 is presumably ios_base::in | ios_base::out -- confirm.
movl $24, 248(%rsp) | |
movq %rax, 32(%rsp) | |
movq %rax, 256(%rsp) | |
movq $0, 264(%rsp) | |
movb $0, 272(%rsp) | |
.LEHB12: | |
call _ZNSt9basic_iosIcSt11char_traitsIcEE4initEPSt15basic_streambufIcS1_E@PLT | |
.LEHE12: | |
# Copy the formatting state of the output stream (rbx) into the temporary
# stream, so the measured text matches what phase (c) will print.
movq (%rbx), %rax | |
movq 8(%rsp), %rdi | |
movq -24(%rax), %rsi | |
addq %rbx, %rsi | |
.LEHB13: | |
call _ZNSt9basic_iosIcSt11char_traitsIcEE7copyfmtERKS2_@PLT | |
# Insert the double at (slot 40)[r15] into the temporary stream.
movq 40(%rsp), %rax | |
movq %r14, %rdi | |
movsd (%rax,%r15,8), %xmm0 | |
call _ZNSo9_M_insertIdEERSoT_@PLT | |
.LEHE13: | |
# Build an empty std::string at 128(%rsp) (data pointer -> 144(%rsp),
# length 0) and fill it with the text just produced. r8 / rax / rcx are
# three pointers read from the buffer object (presumably pptr, egptr and
# pbase of the stringbuf); when r8 is null the buffer's own string at
# 256(%rsp) is copied instead (.L140).
movq 224(%rsp), %r8 | |
leaq 128(%rsp), %rdi | |
leaq 144(%rsp), %r14 | |
movq $0, 136(%rsp) | |
movq %rdi, 48(%rsp) | |
movq %r14, 128(%rsp) | |
movb $0, 144(%rsp) | |
testq %r8, %r8 | |
je .L140 | |
movq 208(%rsp), %rax | |
movq %r8, %rdx | |
movq 216(%rsp), %rcx | |
# r8 = the larger of the two end pointers (or r8 itself when rax is null),
# then r8 -= rcx gives the number of characters to copy.
cmpq %r8, %rax | |
cmovnb %rax, %r8 | |
testq %rax, %rax | |
cmove %rdx, %r8 | |
xorl %edx, %edx | |
xorl %esi, %esi | |
subq %rcx, %r8 | |
.LEHB14: | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_replaceEmmPKcm@PLT | |
.LEHE14: | |
.L142: | |
# Slot 16 = max(slot 16, length of the temporary string), signed compare.
movq 16(%rsp), %rcx | |
movq 136(%rsp), %rax | |
movq 128(%rsp), %rdi | |
cmpq %rax, %rcx | |
cmovge %rcx, %rax | |
movq %rax, 16(%rsp) | |
# Free the temporary string only if it left its in-object buffer.
cmpq %r14, %rdi | |
je .L143 | |
movq 144(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L143: | |
# Inline-expanded destruction of the temporary stringstream: restore the
# vtable pointers step by step, free the buffer's string if it was heap
# allocated, destroy the locale and finally the ios_base part.
leaq 24+_ZTVNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movdqa 64(%rsp), %xmm2 | |
movq 256(%rsp), %rdi | |
movq %rax, 160(%rsp) | |
addq $80, %rax | |
movq %rax, 288(%rsp) | |
movq 32(%rsp), %rax | |
movaps %xmm2, 176(%rsp) | |
cmpq %rax, %rdi | |
je .L147 | |
movq 272(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L147: | |
movq 24(%rsp), %rdi | |
leaq 16+_ZTVSt15basic_streambufIcSt11char_traitsIcEE(%rip), %rax | |
# Advance the inner index; the compiler scheduled it into the teardown.
addq $1, %r15 | |
movq %rax, 184(%rsp) | |
call _ZNSt6localeD1Ev@PLT | |
movq 8+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movq 8(%rsp), %rdi | |
movq 48+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rcx | |
movq 40+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rdx | |
movq -24(%rax), %rax | |
movq %rcx, 160(%rsp,%rax) | |
movq -24(%r13), %rax | |
movq %r13, 176(%rsp) | |
movq 24+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rcx | |
movq %rdx, 176(%rsp,%rax) | |
movq -24(%r12), %rax | |
movq %r12, 160(%rsp) | |
movq %rcx, 160(%rsp,%rax) | |
leaq 16+_ZTVSt9basic_iosIcSt11char_traitsIcEE(%rip), %rax | |
movq $0, 168(%rsp) | |
movq %rax, 288(%rsp) | |
call _ZNSt8ios_baseD2Ev@PLT | |
# Inner loop: four doubles per group.
cmpq $4, %r15 | |
jne .L148 | |
# Outer loop: counter += 4, data pointer += 32 bytes, stop after 16
# coefficients in total.
addq $4, 96(%rsp) | |
movq 96(%rsp), %rax | |
addq $32, 40(%rsp) | |
cmpq $16, %rax | |
jne .L134 | |
.L133: | |
# Phase (c). Each "string" below is a (pointer, length) pair read from the
# IOFormat object and passed to __ostream_insert(stream, ptr, len).
# First the string at IOFormat+0 (presumably matPrefix).
movq 8(%rbp), %rdx | |
movq 0(%rbp), %rsi | |
movq %rbx, %rdi | |
xorl %r14d, %r14d | |
.LEHB15: | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
# Slot 8 = row counter (0), r12 = pointer to the first element of the
# current row, r15 = width measured in phase (b).
movq %r14, 8(%rsp) | |
movq 112(%rsp), %r12 | |
movq 16(%rsp), %r15 | |
.L156: | |
# Row start: string at IOFormat+64 (presumably rowPrefix).
movq 72(%rbp), %rdx | |
movq 64(%rbp), %rsi | |
movq %rbx, %rdi | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
# A non-zero width takes the variant at .L149 that sets the stream width
# before every number.
testq %r15, %r15 | |
jne .L149 | |
# Width 0: print the first element of the row. r14 walks the row with a
# 32-byte stride and r13 = r12 + 96 marks its last element.
movsd (%r12), %xmm0 | |
movq %rbx, %rdi | |
movq %r12, %r14 | |
leaq 96(%r12), %r13 | |
call _ZNSo9_M_insertIdEERSoT_@PLT | |
.L150: | |
# Remaining three elements, each preceded by the string at IOFormat+192
# (presumably coeffSeparator).
movq 200(%rbp), %rdx | |
movq 192(%rbp), %rsi | |
movq %rbx, %rdi | |
addq $32, %r14 | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
movsd (%r14), %xmm0 | |
movq %rbx, %rdi | |
call _ZNSo9_M_insertIdEERSoT_@PLT | |
cmpq %r13, %r14 | |
jne .L150 | |
.L152: | |
# Row end: string at IOFormat+96 (presumably rowSuffix).
movq 104(%rbp), %rdx | |
movq 96(%rbp), %rsi | |
movq %rbx, %rdi | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
# After the fourth row (counter == 3) leave the loop.
cmpq $3, 8(%rsp) | |
je .L181 | |
# Between rows: strings at IOFormat+128 and IOFormat+160 (presumably
# rowSeparator and rowSpacer); next row starts 8 bytes further.
movq 136(%rbp), %rdx | |
movq 128(%rbp), %rsi | |
movq %rbx, %rdi | |
addq $8, %r12 | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
movq 168(%rbp), %rdx | |
movq %rbx, %rdi | |
movq 160(%rbp), %rsi | |
addq $1, 8(%rsp) | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
.LEHE15: | |
jmp .L156 | |
.p2align 4,,10 | |
.p2align 3 | |
.L160: | |
# IOFormat+224 was -2: use 15 and go through the normal swap at .L132.
movq $15, 104(%rsp) | |
jmp .L132 | |
.p2align 4,,10 | |
.p2align 3 | |
.L140: | |
# Phase (b), alternative copy: assign the buffer's string at 256(%rsp) to
# the temporary string (rdi still holds the address of 128(%rsp)).
leaq 256(%rsp), %rsi | |
.LEHB16: | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE9_M_assignERKS4_@PLT | |
.LEHE16: | |
jmp .L142 | |
.p2align 4,,10 | |
.p2align 3 | |
.L149: | |
# Same row printing as above, but r15 is stored into the 8-byte field at
# offset 16 of the stream's virtual-base state (presumably ios_base width)
# before every number.
movq (%rbx), %rax | |
movsd (%r12), %xmm0 | |
movq %rbx, %rdi | |
movq %r12, %r14 | |
leaq 96(%r12), %r13 | |
movq -24(%rax), %rax | |
movq %r15, 16(%rbx,%rax) | |
.LEHB17: | |
call _ZNSo9_M_insertIdEERSoT_@PLT | |
.L151: | |
movq 200(%rbp), %rdx | |
movq 192(%rbp), %rsi | |
movq %rbx, %rdi | |
addq $32, %r14 | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
movq (%rbx), %rax | |
movsd (%r14), %xmm0 | |
movq %rbx, %rdi | |
movq -24(%rax), %rax | |
movq %r15, 16(%rbx,%rax) | |
call _ZNSo9_M_insertIdEERSoT_@PLT | |
cmpq %r13, %r14 | |
jne .L151 | |
jmp .L152 | |
.p2align 4,,10 | |
.p2align 3 | |
.L181: | |
# Matrix end: string at IOFormat+32 (presumably matSuffix).
movq 40(%rbp), %rdx | |
movq 32(%rbp), %rsi | |
movq %rbx, %rdi | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
# Undo phase (a): put the saved value (slot 120) back if one was replaced.
cmpq $0, 104(%rsp) | |
je .L155 | |
movq (%rbx), %rax | |
movq 120(%rsp), %rdx | |
movq -24(%rax), %rax | |
movq %rdx, 8(%rbx,%rax) | |
.L155: | |
# Canary check, then the normal epilogue; the stream is the return value.
movq 552(%rsp), %rax | |
subq %fs:40, %rax | |
jne .L177 | |
addq $568, %rsp | |
.cfi_remember_state | |
.cfi_def_cfa_offset 56 | |
movq %rbx, %rax | |
popq %rbx | |
.cfi_def_cfa_offset 48 | |
popq %rbp | |
.cfi_def_cfa_offset 40 | |
popq %r12 | |
.cfi_def_cfa_offset 32 | |
popq %r13 | |
.cfi_def_cfa_offset 24 | |
popq %r14 | |
.cfi_def_cfa_offset 16 | |
popq %r15 | |
.cfi_def_cfa_offset 8 | |
ret | |
.p2align 4,,10 | |
.p2align 3 | |
.L159: | |
.cfi_restore_state | |
# IOFormat+224 was -1: nothing is changed on the stream and nothing has to
# be restored later. The bit-0 test of .L131 is duplicated here.
movq $0, 104(%rsp) | |
movq $0, 120(%rsp) | |
testb $1, 228(%rbp) | |
je .L182 | |
.L162: | |
# Measuring pass skipped: width 0.
movq $0, 16(%rsp) | |
jmp .L133 | |
# ---- Exception cleanup paths ------------------------------------------------
# The landing pads (.L163 .. .L167) are entered with the exception object in
# rax; they park it in rbx and jump to the cleanup that matches how far the
# temporary stringstream had been constructed. All of them end in
# _Unwind_Resume at .L157.
.L145: | |
# Dispose the temporary string, then fall into the full stream destructor.
movq 48(%rsp), %rdi | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
.L146: | |
# Fully constructed temporary stringstream: run its complete destructor.
movq 56(%rsp), %rdi | |
call _ZNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEED1Ev@PLT | |
movq 552(%rsp), %rax | |
subq %fs:40, %rax | |
je .L157 | |
.L177: | |
# Shared canary-mismatch exit.
call __stack_chk_fail@PLT | |
.L164: | |
# Landing pad for the .LEHB10 region.
endbr64 | |
movq %rax, %rbx | |
jmp .L137 | |
.L166: | |
# Landing pad for the .LEHB11 region.
endbr64 | |
movq %rax, %rbx | |
jmp .L136 | |
.L163: | |
# Landing pad for the .LEHB13 region.
endbr64 | |
movq %rax, %rbx | |
jmp .L146 | |
.L165: | |
# Landing pad for the .LEHB12 region.
endbr64 | |
movq %rax, %rbx | |
jmp .L138 | |
.L167: | |
# Landing pad for the .LEHB14 and .LEHB16 regions.
endbr64 | |
movq %rax, %rbx | |
jmp .L145 | |
.L138: | |
# Partial teardown: the buffer's string and the locale exist, so dispose
# them and reset the vtable pointers before dropping to .L179 / .L137.
leaq 16+_ZTVNSt7__cxx1115basic_stringbufIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
leaq 256(%rsp), %rdi | |
movq %rax, 184(%rsp) | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
movq 24(%rsp), %rdi | |
leaq 16+_ZTVSt15basic_streambufIcSt11char_traitsIcEE(%rip), %rax | |
movq %rax, 184(%rsp) | |
call _ZNSt6localeD1Ev@PLT | |
movq 8+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rax | |
movq 48+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rdx | |
movq -24(%rax), %rax | |
movq %rdx, 160(%rsp,%rax) | |
movq -24(%r13), %rax | |
movq 40+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rdx | |
movq %r13, 176(%rsp) | |
movq %rdx, 176(%rsp,%rax) | |
.L179: | |
movq -24(%r12), %rax | |
movq 24+_ZTTNSt7__cxx1118basic_stringstreamIcSt11char_traitsIcESaIcEEE(%rip), %rdx | |
movq %r12, 160(%rsp) | |
movq %rdx, 160(%rsp,%rax) | |
xorl %eax, %eax | |
movq %rax, 168(%rsp) | |
.L137: | |
# Minimal teardown: only the ios_base part at 288(%rsp) is destroyed.
movq 8(%rsp), %rdi | |
leaq 16+_ZTVSt9basic_iosIcSt11char_traitsIcEE(%rip), %rax | |
movq %rax, 288(%rsp) | |
call _ZNSt8ios_baseD2Ev@PLT | |
movq 552(%rsp), %rax | |
subq %fs:40, %rax | |
jne .L177 | |
.L157: | |
# Continue unwinding with the exception object saved in rbx.
movq %rbx, %rdi | |
call _Unwind_Resume@PLT | |
.LEHE17: | |
.L136: | |
jmp .L179 | |
.cfi_endproc | |
.LFE10091: | |
# Exception table (LSDA) for the function above. The three header bytes
# are, in the GCC LSDA layout, the landing-pad base encoding (0xff =
# omitted), the type-table encoding (0xff = omitted) and the call-site
# encoding (0x1 = uleb128). Each call-site record is four uleb128 values:
# region start, region length, landing pad (0 = none) and action (0 here
# for every record).
.section .gcc_except_table._ZN5Eigen8internal12print_matrixINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS4_RKT_RKNS_8IOFormatE,"aG",@progbits,_ZN5Eigen8internal12print_matrixINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS4_RKT_RKNS_8IOFormatE,comdat | |
.LLSDA10091: | |
.byte 0xff | |
.byte 0xff | |
.byte 0x1 | |
.uleb128 .LLSDACSE10091-.LLSDACSB10091 | |
.LLSDACSB10091: | |
.uleb128 .LEHB10-.LFB10091 | |
.uleb128 .LEHE10-.LEHB10 | |
.uleb128 .L164-.LFB10091 | |
.uleb128 0 | |
.uleb128 .LEHB11-.LFB10091 | |
.uleb128 .LEHE11-.LEHB11 | |
.uleb128 .L166-.LFB10091 | |
.uleb128 0 | |
.uleb128 .LEHB12-.LFB10091 | |
.uleb128 .LEHE12-.LEHB12 | |
.uleb128 .L165-.LFB10091 | |
.uleb128 0 | |
.uleb128 .LEHB13-.LFB10091 | |
.uleb128 .LEHE13-.LEHB13 | |
.uleb128 .L163-.LFB10091 | |
.uleb128 0 | |
.uleb128 .LEHB14-.LFB10091 | |
.uleb128 .LEHE14-.LEHB14 | |
.uleb128 .L167-.LFB10091 | |
.uleb128 0 | |
# Region 15 (phase (c) output) has no landing pad: nothing to clean up.
.uleb128 .LEHB15-.LFB10091 | |
.uleb128 .LEHE15-.LEHB15 | |
.uleb128 0 | |
.uleb128 0 | |
.uleb128 .LEHB16-.LFB10091 | |
.uleb128 .LEHE16-.LEHB16 | |
.uleb128 .L167-.LFB10091 | |
.uleb128 0 | |
# Region 17 (width-setting output variant and the cleanup code itself) has
# no landing pad either.
.uleb128 .LEHB17-.LFB10091 | |
.uleb128 .LEHE17-.LEHB17 | |
.uleb128 0 | |
.uleb128 0 | |
.LLSDACSE10091: | |
.section .text._ZN5Eigen8internal12print_matrixINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS4_RKT_RKNS_8IOFormatE,"axG",@progbits,_ZN5Eigen8internal12print_matrixINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS4_RKT_RKNS_8IOFormatE,comdat | |
.size _ZN5Eigen8internal12print_matrixINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS4_RKT_RKNS_8IOFormatE, .-_ZN5Eigen8internal12print_matrixINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS4_RKT_RKNS_8IOFormatE | |
# ---------------------------------------------------------------------------
# Eigen::operator<< <Eigen::Matrix<double,4,4,0,4,4>>
#   Demangled signature:
#     std::ostream& operator<<(std::ostream&,
#              const Eigen::DenseBase<Eigen::Matrix<double,4,4,0,4,4>>&)
#   Compiler-generated code, AT&T syntax, x86-64 System V ABI, weak COMDAT.
#
# In:    rdi = output stream, rsi = matrix. Neither register is written
#        before the call, so both reach print_matrix unchanged.
# Out:   rax = whatever print_matrix returned.
#
# The function builds two groups of objects on the stack, calls
# print_matrix(stream, matrix, &IOFormat) and destroys everything again:
#   * six std::string objects at 64, 96, 128, 160, 192 and 224(%rsp);
#   * an Eigen::IOFormat at 256(%rsp): seven std::string objects at 256, 288,
#     320, 352, 384, 416 and 448(%rsp) followed by 8 bytes at 480(%rsp)
#     copied from .LC11.
# Each std::string is 32 bytes: data pointer, length, then a 16-byte
# in-object buffer that the data pointer initially refers to.
#
# NOTE(review): the six loose strings are presumably the temporaries for
# the default arguments of the IOFormat constructor, and .LC9 / .LC10 /
# .LC11 presumably hold "\n", " " and the default precision/flags pair;
# their definitions are outside this chunk -- confirm.
#
# Register roles while the objects are alive:
#   rbx = address of the IOFormat (256(%rsp)) until the call returns, then
#         the stream reference returned by print_matrix
#   rbp, r12, r13, r14, r15 = in-object buffers of the IOFormat strings at
#         320, 352, 384, 416 and 448(%rsp)
# The remaining in-object buffer addresses are kept in the slots 0, 8, 16,
# 24, 32, 40, 48 and 56(%rsp) and are used by the destruction code to tell
# whether a string ever left its in-object buffer.
# ---------------------------------------------------------------------------
.section .text._ZN5EigenlsINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS3_RKNS_9DenseBaseIT_EE,"axG",@progbits,_ZN5EigenlsINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS3_RKNS_9DenseBaseIT_EE,comdat | |
.p2align 4 | |
.weak _ZN5EigenlsINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS3_RKNS_9DenseBaseIT_EE | |
.type _ZN5EigenlsINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS3_RKNS_9DenseBaseIT_EE, @function | |
_ZN5EigenlsINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS3_RKNS_9DenseBaseIT_EE: | |
.LFB9808: | |
.cfi_startproc | |
.cfi_personality 0x9b,DW.ref.__gxx_personality_v0 | |
.cfi_lsda 0x1b,.LLSDA9808 | |
endbr64 | |
# Prologue: save all six callee-saved registers, then reserve 504 bytes.
pushq %r15 | |
.cfi_def_cfa_offset 16 | |
.cfi_offset 15, -16 | |
pushq %r14 | |
.cfi_def_cfa_offset 24 | |
.cfi_offset 14, -24 | |
pushq %r13 | |
.cfi_def_cfa_offset 32 | |
.cfi_offset 13, -32 | |
pushq %r12 | |
.cfi_def_cfa_offset 40 | |
.cfi_offset 12, -40 | |
pushq %rbp | |
.cfi_def_cfa_offset 48 | |
.cfi_offset 6, -48 | |
pushq %rbx | |
.cfi_def_cfa_offset 56 | |
.cfi_offset 3, -56 | |
subq $504, %rsp | |
.cfi_def_cfa_offset 560 | |
# edx = 16-bit constant from .LC9, used twice below.
movzwl .LC9(%rip), %edx | |
# Install the stack-protector canary at 488(%rsp).
movq %fs:40, %rax | |
movq %rax, 488(%rsp) | |
xorl %eax, %eax | |
# Construction of the six loose strings, interleaved by the scheduler with
# the address computations for the IOFormat strings. Every string gets its
# data pointer aimed at its own in-object buffer; the same address is also
# parked in a low stack slot for the destruction code.
leaq 240(%rsp), %rax | |
movq $0, 232(%rsp) | |
leaq 272(%rsp), %rcx | |
movq %rax, 24(%rsp) | |
# rbx = address of the IOFormat object.
leaq 256(%rsp), %rbx | |
leaq 336(%rsp), %rbp | |
movq %rax, 224(%rsp) | |
leaq 208(%rsp), %rax | |
leaq 368(%rsp), %r12 | |
movq %rax, (%rsp) | |
leaq 400(%rsp), %r13 | |
leaq 432(%rsp), %r14 | |
movq %rax, 192(%rsp) | |
leaq 176(%rsp), %rax | |
leaq 464(%rsp), %r15 | |
movq %rax, 40(%rsp) | |
movq %rax, 160(%rsp) | |
leaq 144(%rsp), %rax | |
movq %rax, 16(%rsp) | |
movq %rax, 128(%rsp) | |
leaq 112(%rsp), %rax | |
movq %rax, 56(%rsp) | |
movq %rax, 96(%rsp) | |
leaq 80(%rsp), %rax | |
# String at 96(%rsp): two bytes from .LC9, length set to 1 further down.
movw %dx, 112(%rsp) | |
movq %rax, 32(%rsp) | |
movq %rax, 64(%rsp) | |
# Strings at 224, 192, 160 and 128(%rsp) are empty (length 0, first byte 0).
movb $0, 240(%rsp) | |
movq $0, 200(%rsp) | |
movb $0, 208(%rsp) | |
movq $0, 168(%rsp) | |
movb $0, 176(%rsp) | |
movq $0, 136(%rsp) | |
movb $0, 144(%rsp) | |
# Strings at 96 and 64(%rsp) have length 1.
movq $1, 104(%rsp) | |
movq $1, 72(%rsp) | |
# String at 64(%rsp): two bytes from .LC10; the same two bytes also fill
# the IOFormat string at 448(%rsp).
movzwl .LC10(%rip), %eax | |
movq %rcx, 48(%rsp) | |
movw %ax, 80(%rsp) | |
movw %ax, 464(%rsp) | |
# rax = 8 bytes from .LC11, stored behind the seven strings at 480(%rsp).
movq .LC11(%rip), %rax | |
# IOFormat strings: those at 256, 288, 320, 352 and 416(%rsp) are empty;
# the one at 384(%rsp) holds the .LC9 bytes and the one at 448(%rsp) the
# .LC10 bytes, both with length 1.
movq %rcx, 256(%rsp) | |
leaq 304(%rsp), %rcx | |
movw %dx, 400(%rsp) | |
# Third argument for print_matrix: address of the IOFormat.
movq %rbx, %rdx | |
movq $0, 264(%rsp) | |
movb $0, 272(%rsp) | |
movq %rcx, 8(%rsp) | |
movq %rcx, 288(%rsp) | |
movq $0, 296(%rsp) | |
movb $0, 304(%rsp) | |
movq %rbp, 320(%rsp) | |
movq $0, 328(%rsp) | |
movb $0, 336(%rsp) | |
movq %r12, 352(%rsp) | |
movq $0, 360(%rsp) | |
movb $0, 368(%rsp) | |
movq %r13, 384(%rsp) | |
movq $1, 392(%rsp) | |
movq %r14, 416(%rsp) | |
movq $0, 424(%rsp) | |
movb $0, 432(%rsp) | |
movq %r15, 448(%rsp) | |
movq $1, 456(%rsp) | |
movq %rax, 480(%rsp) | |
# The only call that may throw with live objects; its region is the first
# entry of the call-site table in .LLSDA9808.
.LEHB18: | |
call _ZN5Eigen8internal12print_matrixINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS4_RKT_RKNS_8IOFormatE | |
.LEHE18: | |
# Normal path. rbx now carries the return value. The thirteen strings are
# destroyed with the same pattern each time: if the data pointer differs
# from the in-object buffer address, call operator delete(ptr, capacity + 1).
# First the seven IOFormat strings, last one first.
movq 448(%rsp), %rdi | |
movq %rax, %rbx | |
cmpq %r15, %rdi | |
je .L184 | |
movq 464(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L184: | |
movq 416(%rsp), %rdi | |
cmpq %r14, %rdi | |
je .L185 | |
movq 432(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L185: | |
movq 384(%rsp), %rdi | |
cmpq %r13, %rdi | |
je .L186 | |
movq 400(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L186: | |
movq 352(%rsp), %rdi | |
cmpq %r12, %rdi | |
je .L187 | |
movq 368(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L187: | |
movq 320(%rsp), %rdi | |
cmpq %rbp, %rdi | |
je .L188 | |
movq 336(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L188: | |
movq 288(%rsp), %rdi | |
movq 8(%rsp), %rax | |
cmpq %rax, %rdi | |
je .L189 | |
movq 304(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L189: | |
movq 256(%rsp), %rdi | |
movq 48(%rsp), %rax | |
cmpq %rax, %rdi | |
je .L190 | |
movq 272(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L190: | |
# Then the six loose strings, lowest address first.
movq 64(%rsp), %rdi | |
movq 32(%rsp), %rax | |
cmpq %rax, %rdi | |
je .L191 | |
movq 80(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L191: | |
movq 96(%rsp), %rdi | |
movq 56(%rsp), %rax | |
cmpq %rax, %rdi | |
je .L192 | |
movq 112(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L192: | |
movq 128(%rsp), %rdi | |
movq 16(%rsp), %rax | |
cmpq %rax, %rdi | |
je .L193 | |
movq 144(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L193: | |
movq 160(%rsp), %rdi | |
movq 40(%rsp), %rax | |
cmpq %rax, %rdi | |
je .L194 | |
movq 176(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L194: | |
movq 192(%rsp), %rdi | |
movq (%rsp), %rax | |
cmpq %rax, %rdi | |
je .L195 | |
movq 208(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L195: | |
movq 224(%rsp), %rdi | |
movq 24(%rsp), %rax | |
cmpq %rax, %rdi | |
je .L183 | |
movq 240(%rsp), %rax | |
leaq 1(%rax), %rsi | |
call _ZdlPvm@PLT | |
.L183: | |
# Canary check, then the normal epilogue; rax = stream from print_matrix.
movq 488(%rsp), %rax | |
subq %fs:40, %rax | |
jne .L202 | |
addq $504, %rsp | |
.cfi_remember_state | |
.cfi_def_cfa_offset 56 | |
movq %rbx, %rax | |
popq %rbx | |
.cfi_def_cfa_offset 48 | |
popq %rbp | |
.cfi_def_cfa_offset 40 | |
popq %r12 | |
.cfi_def_cfa_offset 32 | |
popq %r13 | |
.cfi_def_cfa_offset 24 | |
popq %r14 | |
.cfi_def_cfa_offset 16 | |
popq %r15 | |
.cfi_def_cfa_offset 8 | |
ret | |
.L197: | |
.cfi_restore_state | |
# Exception cleanup (reached from the landing pad .L200). rbx was not
# overwritten on this path, so it still holds the IOFormat address; the
# IOFormat destructor is called out of line, followed by the six loose
# strings.
movq %rbx, %rdi | |
call _ZN5Eigen8IOFormatD1Ev | |
leaq 64(%rsp), %rdi | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
leaq 96(%rsp), %rdi | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
leaq 128(%rsp), %rdi | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
leaq 160(%rsp), %rdi | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
leaq 192(%rsp), %rdi | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
leaq 224(%rsp), %rdi | |
call _ZNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE10_M_disposeEv@PLT | |
movq 488(%rsp), %rax | |
subq %fs:40, %rax | |
je .L198 | |
.L202: | |
# Shared canary-mismatch exit.
call __stack_chk_fail@PLT | |
.L200: | |
# Landing pad for the .LEHB18 region: park the exception object in rbp.
endbr64 | |
movq %rax, %rbp | |
jmp .L197 | |
.L198: | |
# Continue unwinding with the exception object saved in rbp.
movq %rbp, %rdi | |
.LEHB19: | |
call _Unwind_Resume@PLT | |
.LEHE19: | |
.cfi_endproc | |
.LFE9808: | |
# Exception table (LSDA) for the function above. The three header bytes
# are, in the GCC LSDA layout, the landing-pad base encoding (0xff =
# omitted), the type-table encoding (0xff = omitted) and the call-site
# encoding (0x1 = uleb128). Each call-site record is four uleb128 values:
# region start, region length, landing pad (0 = none) and action.
.section .gcc_except_table._ZN5EigenlsINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS3_RKNS_9DenseBaseIT_EE,"aG",@progbits,_ZN5EigenlsINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS3_RKNS_9DenseBaseIT_EE,comdat | |
.LLSDA9808: | |
.byte 0xff | |
.byte 0xff | |
.byte 0x1 | |
.uleb128 .LLSDACSE9808-.LLSDACSB9808 | |
.LLSDACSB9808: | |
# The print_matrix call unwinds through .L200.
.uleb128 .LEHB18-.LFB9808 | |
.uleb128 .LEHE18-.LEHB18 | |
.uleb128 .L200-.LFB9808 | |
.uleb128 0 | |
# The _Unwind_Resume call has no landing pad.
.uleb128 .LEHB19-.LFB9808 | |
.uleb128 .LEHE19-.LEHB19 | |
.uleb128 0 | |
.uleb128 0 | |
.LLSDACSE9808: | |
.section .text._ZN5EigenlsINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS3_RKNS_9DenseBaseIT_EE,"axG",@progbits,_ZN5EigenlsINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS3_RKNS_9DenseBaseIT_EE,comdat | |
.size _ZN5EigenlsINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS3_RKNS_9DenseBaseIT_EE, .-_ZN5EigenlsINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS3_RKNS_9DenseBaseIT_EE | |
.section .rodata.str1.1 | |
.LC17: | |
.string "Matrix4d: " | |
.text | |
.p2align 4 | |
.globl _Z33benchmark_matrix4d_multiplicationRKSt6vectorIN5Eigen6MatrixIdLi4ELi4ELi0ELi4ELi4EEESaIS2_EE | |
.type _Z33benchmark_matrix4d_multiplicationRKSt6vectorIN5Eigen6MatrixIdLi4ELi4ELi0ELi4ELi4EEESaIS2_EE, @function | |
_Z33benchmark_matrix4d_multiplicationRKSt6vectorIN5Eigen6MatrixIdLi4ELi4ELi0ELi4ELi4EEESaIS2_EE: | |
.LFB9388: | |
.cfi_startproc | |
endbr64 | |
pushq %r12 | |
.cfi_def_cfa_offset 16 | |
.cfi_offset 12, -16 | |
pushq %rbp | |
.cfi_def_cfa_offset 24 | |
.cfi_offset 6, -24 | |
pushq %rbx | |
.cfi_def_cfa_offset 32 | |
.cfi_offset 3, -32 | |
movq %rdi, %rbx | |
subq $272, %rsp | |
.cfi_def_cfa_offset 304 | |
movq %fs:40, %rax | |
movq %rax, 264(%rsp) | |
xorl %eax, %eax | |
call _ZNSt6chrono3_V212system_clock3nowEv@PLT | |
movq .LC12(%rip), %xmm2 | |
pxor %xmm0, %xmm0 | |
xorl %edx, %edx | |
movapd .LC16(%rip), %xmm1 | |
movq %rax, %rbp | |
movaps %xmm0, 144(%rsp) | |
movq (%rbx), %rax | |
movaps %xmm2, 128(%rsp) | |
movaps %xmm1, 160(%rsp) | |
movaps %xmm0, 176(%rsp) | |
movaps %xmm0, 192(%rsp) | |
movaps %xmm2, 208(%rsp) | |
movaps %xmm0, 224(%rsp) | |
movaps %xmm1, 240(%rsp) | |
cmpq %rax, 8(%rbx) | |
je .L207 | |
.p2align 4,,10 | |
.p2align 3 | |
.L204: | |
#APP | |
# 27 "tmp.cpp" 1 | |
# 4dmat mult start | |
# 0 "" 2 | |
#NO_APP | |
movapd 128(%rsp), %xmm1 | |
movq %rdx, %rax | |
movapd 160(%rsp), %xmm7 | |
movapd 192(%rsp), %xmm6 | |
salq $7, %rax | |
addq (%rbx), %rax | |
movsd 64(%rax), %xmm15 | |
movsd 72(%rax), %xmm10 | |
movsd 8(%rax), %xmm14 | |
movsd (%rax), %xmm9 | |
unpcklpd %xmm15, %xmm15 | |
unpcklpd %xmm10, %xmm10 | |
movsd 16(%rax), %xmm3 | |
movsd 24(%rax), %xmm13 | |
movaps %xmm15, (%rsp) | |
movsd 80(%rax), %xmm15 | |
unpcklpd %xmm14, %xmm14 | |
unpcklpd %xmm9, %xmm9 | |
movaps %xmm10, 16(%rsp) | |
movsd 88(%rax), %xmm10 | |
unpcklpd %xmm3, %xmm3 | |
unpcklpd %xmm13, %xmm13 | |
unpcklpd %xmm15, %xmm15 | |
movsd 32(%rax), %xmm12 | |
movapd 144(%rsp), %xmm0 | |
unpcklpd %xmm10, %xmm10 | |
movaps %xmm15, 32(%rsp) | |
movsd 104(%rax), %xmm15 | |
movapd 176(%rsp), %xmm5 | |
movaps %xmm10, 48(%rsp) | |
movsd 96(%rax), %xmm10 | |
movsd 48(%rax), %xmm2 | |
unpcklpd %xmm12, %xmm12 | |
unpcklpd %xmm15, %xmm15 | |
movsd 40(%rax), %xmm8 | |
movapd 208(%rsp), %xmm4 | |
unpcklpd %xmm10, %xmm10 | |
movaps %xmm15, 80(%rsp) | |
movsd 120(%rax), %xmm15 | |
unpcklpd %xmm2, %xmm2 | |
movaps %xmm10, 64(%rsp) | |
movsd 112(%rax), %xmm10 | |
movsd 56(%rax), %xmm11 | |
unpcklpd %xmm8, %xmm8 | |
unpcklpd %xmm15, %xmm15 | |
unpcklpd %xmm10, %xmm10 | |
movaps %xmm15, 112(%rsp) | |
movapd %xmm14, %xmm15 | |
unpcklpd %xmm11, %xmm11 | |
movaps %xmm10, 96(%rsp) | |
mulpd %xmm7, %xmm15 | |
movapd %xmm1, %xmm10 | |
mulpd %xmm9, %xmm10 | |
mulpd %xmm5, %xmm14 | |
mulpd %xmm0, %xmm9 | |
addpd %xmm10, %xmm15 | |
movapd %xmm6, %xmm10 | |
mulpd %xmm3, %xmm10 | |
mulpd %xmm4, %xmm3 | |
addpd %xmm14, %xmm9 | |
addpd %xmm15, %xmm10 | |
movapd 224(%rsp), %xmm15 | |
addpd %xmm9, %xmm3 | |
movapd %xmm7, %xmm9 | |
mulpd %xmm13, %xmm15 | |
mulpd %xmm8, %xmm9 | |
mulpd %xmm5, %xmm8 | |
addpd %xmm15, %xmm10 | |
movaps %xmm10, 128(%rsp) | |
movapd 48(%rsp), %xmm14 | |
mulpd 240(%rsp), %xmm13 | |
addpd %xmm13, %xmm3 | |
movapd 32(%rsp), %xmm13 | |
movaps %xmm3, 144(%rsp) | |
movapd %xmm1, %xmm3 | |
mulpd %xmm12, %xmm3 | |
mulpd %xmm0, %xmm12 | |
addpd %xmm3, %xmm9 | |
movapd %xmm6, %xmm3 | |
mulpd %xmm2, %xmm3 | |
addpd %xmm12, %xmm8 | |
movapd 16(%rsp), %xmm12 | |
mulpd %xmm4, %xmm2 | |
addpd %xmm9, %xmm3 | |
movapd 224(%rsp), %xmm9 | |
addpd %xmm8, %xmm2 | |
movapd 80(%rsp), %xmm8 | |
mulpd %xmm11, %xmm9 | |
mulpd 240(%rsp), %xmm11 | |
addpd %xmm9, %xmm3 | |
addpd %xmm11, %xmm2 | |
movapd (%rsp), %xmm11 | |
movaps %xmm3, 160(%rsp) | |
movapd %xmm12, %xmm3 | |
movaps %xmm2, 176(%rsp) | |
movapd %xmm11, %xmm2 | |
mulpd %xmm1, %xmm2 | |
mulpd %xmm7, %xmm3 | |
mulpd %xmm8, %xmm7 | |
addpd %xmm2, %xmm3 | |
movapd %xmm13, %xmm2 | |
mulpd %xmm6, %xmm2 | |
addpd %xmm3, %xmm2 | |
movapd 224(%rsp), %xmm3 | |
mulpd %xmm14, %xmm3 | |
addpd %xmm3, %xmm2 | |
movapd %xmm12, %xmm3 | |
mulpd %xmm5, %xmm3 | |
mulpd %xmm8, %xmm5 | |
movaps %xmm2, 192(%rsp) | |
movapd %xmm11, %xmm2 | |
mulpd %xmm0, %xmm2 | |
addpd %xmm3, %xmm2 | |
movapd %xmm13, %xmm3 | |
mulpd %xmm4, %xmm3 | |
addpd %xmm3, %xmm2 | |
movapd 240(%rsp), %xmm3 | |
mulpd %xmm14, %xmm3 | |
addpd %xmm3, %xmm2 | |
movapd 64(%rsp), %xmm3 | |
mulpd %xmm3, %xmm1 | |
mulpd %xmm3, %xmm0 | |
movaps %xmm2, 208(%rsp) | |
movapd 224(%rsp), %xmm2 | |
addpd %xmm7, %xmm1 | |
movapd 96(%rsp), %xmm7 | |
addpd %xmm5, %xmm0 | |
mulpd %xmm7, %xmm6 | |
mulpd %xmm7, %xmm4 | |
addpd %xmm6, %xmm1 | |
movapd 112(%rsp), %xmm6 | |
addpd %xmm4, %xmm0 | |
mulpd %xmm6, %xmm2 | |
mulpd 240(%rsp), %xmm6 | |
addpd %xmm2, %xmm1 | |
addpd %xmm6, %xmm0 | |
movaps %xmm1, 224(%rsp) | |
movaps %xmm0, 240(%rsp) | |
#APP | |
# 29 "tmp.cpp" 1 | |
# 4dmat mult end | |
# 0 "" 2 | |
#NO_APP | |
movq 8(%rbx), %rax | |
subq (%rbx), %rax | |
addq $1, %rdx | |
sarq $7, %rax | |
cmpq %rax, %rdx | |
jb .L204 | |
.L207: | |
call _ZNSt6chrono3_V212system_clock3nowEv@PLT | |
leaq _ZSt4cout(%rip), %r12 | |
movabsq $2361183241434822607, %rdx | |
leaq .LC17(%rip), %rsi | |
subq %rbp, %rax | |
movq %r12, %rdi | |
movq %rax, %rcx | |
imulq %rdx | |
sarq $63, %rcx | |
sarq $7, %rdx | |
subq %rcx, %rdx | |
movq %rdx, %rbx | |
movl $10, %edx | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
movq %rbx, %rsi | |
movq %r12, %rdi | |
call _ZNSo9_M_insertIlEERSoT_@PLT | |
movl $13, %edx | |
leaq .LC14(%rip), %rsi | |
movq %rax, %rbx | |
movq %rax, %rdi | |
call _ZSt16__ostream_insertIcSt11char_traitsIcEERSt13basic_ostreamIT_T0_ES6_PKS3_l@PLT | |
movq (%rbx), %rax | |
movq -24(%rax), %rax | |
movq 240(%rbx,%rax), %rbp | |
testq %rbp, %rbp | |
je .L205 | |
cmpb $0, 56(%rbp) | |
je .L209 | |
movsbl 67(%rbp), %esi | |
.L210: | |
movq %rbx, %rdi | |
call _ZNSo3putEc@PLT | |
movq %rax, %rdi | |
call _ZNSo5flushEv@PLT | |
leaq 128(%rsp), %rsi | |
movq %r12, %rdi | |
call _ZN5EigenlsINS_6MatrixIdLi4ELi4ELi0ELi4ELi4EEEEERSoS3_RKNS_9DenseBaseIT_EE | |
movq %rax, %rbx | |
movq (%rax), %rax | |
movq -24(%rax), %rax | |
movq 240(%rbx,%rax), %rbp | |
testq %rbp, %rbp | |
je .L205 | |
cmpb $0, 56(%rbp) | |
je .L211 | |
movsbl 67(%rbp), %esi | |
.L212: | |
movq %rbx, %rdi | |
call _ZNSo3putEc@PLT | |
movq %rax, %rdi | |
movq 264(%rsp), %rax | |
subq %fs:40, %rax | |
jne .L229 | |
addq $272, %rsp | |
.cfi_remember_state | |
.cfi_def_cfa_offset 32 | |
popq %rbx | |
.cfi_def_cfa_offset 24 | |
popq %rbp | |
.cfi_def_cfa_offset 16 | |
popq %r12 | |
.cfi_def_cfa_offset 8 | |
jmp _ZNSo5flushEv@PLT | |
.p2align 4,,10 | |
.p2align 3 | |
.L209: | |
.cfi_restore_state | |
movq %rbp, %rdi | |
call _ZNKSt5ctypeIcE13_M_widen_initEv@PLT | |
movq 0(%rbp), %rax | |
movl $10, %esi | |
leaq _ZNKSt5ctypeIcE8do_widenEc(%rip), %rdx | |
movq 48(%rax), %rax | |
cmpq %rdx, %rax | |
je .L210 | |
movq %rbp, %rdi | |
call *%rax | |
movsbl %al, %esi | |
jmp .L210 | |
.p2align 4,,10 | |
.p2align 3 | |
.L211: | |
movq %rbp, %rdi | |
call _ZNKSt5ctypeIcE13_M_widen_initEv@PLT | |
movq 0(%rbp), %rax | |
movl $10, %esi | |
leaq _ZNKSt5ctypeIcE8do_widenEc(%rip), %rdx | |
movq 48(%rax), %rax | |
cmpq %rdx, %rax | |
je .L212 | |
movq %rbp, %rdi | |
call *%rax | |
movsbl %al, %esi | |
jmp .L212 | |
.L229: | |
call __stack_chk_fail@PLT | |
.L205: | |
movq 264(%rsp), %rax | |
subq %fs:40, %rax | |
jne .L229 | |
call _ZSt16__throw_bad_castv@PLT | |
.cfi_endproc | |
.LFE9388: | |
.size _Z33benchmark_matrix4d_multiplicationRKSt6vectorIN5Eigen6MatrixIdLi4ELi4ELi0ELi4ELi4EEESaIS2_EE, .-_Z33benchmark_matrix4d_multiplicationRKSt6vectorIN5Eigen6MatrixIdLi4ELi4ELi0ELi4ELi4EEESaIS2_EE | |
# Mergeable, NUL-terminated string constant (section flags "aMS", entity size 1),
# aligned to 8 bytes.
# .LC18 is loaded into %rcx just before the call to __assert_fail at .L233 in
# _Z31benchmark_matrix_multiplicationv, i.e. it is the "function" text of that
# assertion message.
.section .rodata.str1.8,"aMS",@progbits,1 | |
.align 8 | |
.LC18: | |
.string "Eigen::internal::plain_array<T, Size, MatrixOrArrayOptions, 16>::plain_array() [with T = double; int Size = 16; int MatrixOrArrayOptions = 0]" | |
#-----------------------------------------------------------------------
# _Z31benchmark_matrix_multiplicationv  ==  benchmark_matrix_multiplication()
# Syntax: AT&T / GAS.  ABI: System V AMD64.  Compiler-generated (GCC).
#
# What the visible code does:
#   * allocates 7200000 bytes with operator new and fills them 72 bytes at
#     a time (100000 elements) from Eigen::Quaternion<double,0>::UnitRandom()
#   * allocates 12800000 bytes with operator new, asserts that every
#     128-byte element is 16-byte aligned, then copies each 72-byte element
#     into the matching 128-byte element
#   * issues an inline-asm "special instruction" sequence
#   * calls the 3d and 4d benchmark functions with the two buffers
#   * frees both buffers and returns
#
# Stack frame (offsets from %rsp after the prologue, CFA offset 192):
#     8        spill slot for the inline-asm result
#    16/24/32  first buffer  {begin, finish, end-of-storage}; passed by
#              address to the ...matrix3d... function (std::vector per
#              the mangled callee name)
#    48/56/64  second buffer {begin, finish, end-of-storage}; passed by
#              address to the ...matrix4d... function
#    80..127   scratch: UnitRandom() result, later the inline-asm
#              argument block
#   136        stack-protector canary copy
#
# Callee-saved registers used (all pushed/popped here):
#   %rbx  write cursor in the generation loop
#   %rbp  begin of the first buffer / read cursor in the copy loop
#   %r12  end of the first buffer
#   %r13  address of the scratch area at 80(%rsp)
#-----------------------------------------------------------------------
# .LCOLDB20 / .LHOTB20 mark the start of this function's cold and hot
# code ranges in .text.unlikely and .text respectively.
.section .text.unlikely,"ax",@progbits | |
.LCOLDB20: | |
.text | |
.LHOTB20: | |
.p2align 4 | |
.globl _Z31benchmark_matrix_multiplicationv | |
.type _Z31benchmark_matrix_multiplicationv, @function | |
_Z31benchmark_matrix_multiplicationv: | |
.LFB9389: | |
.cfi_startproc | |
# C++ exception handling: personality routine and this function's LSDA.
.cfi_personality 0x9b,DW.ref.__gxx_personality_v0 | |
.cfi_lsda 0x1b,.LLSDA9389 | |
endbr64 | |
# Prologue: save callee-saved registers; the first allocation size is loaded
# into %edi in between (instruction scheduling).
pushq %r13 | |
.cfi_def_cfa_offset 16 | |
.cfi_offset 13, -16 | |
movl $7200000, %edi | |
pushq %r12 | |
.cfi_def_cfa_offset 24 | |
.cfi_offset 12, -24 | |
pushq %rbp | |
.cfi_def_cfa_offset 32 | |
.cfi_offset 6, -32 | |
pushq %rbx | |
.cfi_def_cfa_offset 40 | |
.cfi_offset 3, -40 | |
# 8 (return address) + 4*8 (pushes) + 152 = 192, so %rsp is 16-byte aligned
# at every call below.
subq $152, %rsp | |
.cfi_def_cfa_offset 192 | |
# Stack protector: copy the canary from %fs:40 into the frame.
movq %fs:40, %rax | |
movq %rax, 136(%rsp) | |
xorl %eax, %eax | |
leaq 80(%rsp), %r13 | |
# operator new(7200000). Call-site entry LEHB20..LEHE20 has no landing pad:
# nothing has been allocated yet, so there is nothing to clean up.
.LEHB20: | |
call _Znwm@PLT | |
.LEHE20: | |
# Record the first buffer: begin at 16(%rsp), finish and end-of-storage
# (both begin + 7200000) at 24(%rsp) and 32(%rsp).
leaq 7200000(%rax), %r12 | |
movq %rax, 16(%rsp) | |
movq %rax, %rbp | |
movq %rax, %rbx | |
movq %r12, 32(%rsp) | |
movq %r12, 24(%rsp) | |
.p2align 4,,10 | |
.p2align 3 | |
# ---- Generation loop: one 72-byte element (nine doubles) per iteration ----
# %rbx is advanced first, so the element being written is at -72..-1(%rbx).
# UnitRandom() writes four doubles into the buffer passed in %rdi (80(%rsp)).
# NOTE(review): the scalar arithmetic that follows looks like Eigen's inlined
# quaternion-to-rotation-matrix conversion (presumably x, y, z, w at
# 80/88/96/104(%rsp)) -- confirm against tmp.cpp.
.L231: | |
movq %r13, %rdi | |
addq $72, %rbx | |
call _ZN5Eigen10QuaternionIdLi0EE10UnitRandomEv | |
movsd 88(%rsp), %xmm5 | |
movsd 96(%rsp), %xmm2 | |
movsd 80(%rsp), %xmm1 | |
movsd 104(%rsp), %xmm10 | |
movapd %xmm5, %xmm7 | |
movapd %xmm2, %xmm4 | |
# .LC3 is an alias of .LC12 (see the .set near the end of the file); its first
# eight bytes encode the double 1.0, which ends up in %xmm8.
movq .LC3(%rip), %rax | |
addsd %xmm5, %xmm7 | |
addsd %xmm2, %xmm4 | |
movapd %xmm1, %xmm6 | |
movapd %xmm1, %xmm3 | |
addsd %xmm1, %xmm6 | |
movq %rax, %xmm8 | |
mulsd %xmm7, %xmm3 | |
movapd %xmm7, %xmm0 | |
mulsd %xmm5, %xmm7 | |
movapd %xmm6, %xmm9 | |
mulsd %xmm4, %xmm2 | |
mulsd %xmm10, %xmm9 | |
mulsd %xmm10, %xmm0 | |
mulsd %xmm4, %xmm10 | |
mulsd %xmm1, %xmm6 | |
movapd %xmm7, %xmm11 | |
addsd %xmm2, %xmm11 | |
mulsd %xmm4, %xmm1 | |
mulsd %xmm4, %xmm5 | |
movapd %xmm8, %xmm4 | |
subsd %xmm11, %xmm4 | |
movapd %xmm10, %xmm11 | |
addsd %xmm3, %xmm11 | |
subsd %xmm10, %xmm3 | |
addsd %xmm6, %xmm2 | |
addsd %xmm7, %xmm6 | |
# Results are packed in pairs and stored unaligned (movups): element bytes
# 0..15 here, then 16..31, 32..47, 48..63, and the ninth double at 64..71.
unpcklpd %xmm11, %xmm4 | |
movups %xmm4, -72(%rbx) | |
movapd %xmm1, %xmm4 | |
subsd %xmm0, %xmm4 | |
addsd %xmm1, %xmm0 | |
movapd %xmm8, %xmm1 | |
subsd %xmm6, %xmm1 | |
unpcklpd %xmm3, %xmm4 | |
movapd %xmm8, %xmm3 | |
movups %xmm4, -56(%rbx) | |
subsd %xmm2, %xmm3 | |
movapd %xmm9, %xmm4 | |
addsd %xmm5, %xmm4 | |
subsd %xmm9, %xmm5 | |
movsd %xmm1, -8(%rbx) | |
movapd %xmm3, %xmm2 | |
unpcklpd %xmm4, %xmm2 | |
unpcklpd %xmm5, %xmm0 | |
movups %xmm2, -40(%rbx) | |
movups %xmm0, -24(%rbx) | |
# Loop until the write cursor reaches the end of the first buffer.
cmpq %r12, %rbx | |
jne .L231 | |
# ---- Second buffer ----
# Zero 56(%rsp) and 64(%rsp) (finish / end-of-storage) before allocating, so
# the frame holds well-defined values if operator new throws.
pxor %xmm0, %xmm0 | |
movl $12800000, %edi | |
movups %xmm0, 56(%rsp) | |
# operator new(12800000). If it throws, the landing pad is .L247, which frees
# only the first buffer.
.LEHB21: | |
call _Znwm@PLT | |
.LEHE21: | |
leaq 12800000(%rax), %rcx | |
movq %rax, 48(%rsp) | |
movq %rcx, 64(%rsp) | |
# Alignment check: the low four bits of the address of every 128-byte element
# must be zero, otherwise jump to the __assert_fail call at .L233.
# "subq $-128" adds 128 (the immediate -128 fits in a signed byte, +128 does not).
testb $15, %al | |
jne .L233 | |
movq %rax, %rdx | |
jmp .L232 | |
.p2align 4,,10 | |
.p2align 3 | |
.L234: | |
testb $15, %dl | |
jne .L233 | |
.L232: | |
subq $-128, %rdx | |
cmpq %rdx, %rcx | |
jne .L234 | |
# All elements checked: set finish = end of the second buffer.
movq %rcx, 56(%rsp) | |
.p2align 4,,10 | |
.p2align 3 | |
# ---- Copy loop: 72-byte source element -> 128-byte destination element ----
# Both cursors are advanced first, so negative offsets address the current
# elements. Each group of three source doubles lands at destination byte
# offsets 0, 32 and 64 (24 bytes each); destination bytes 24..31, 56..63 and
# 88..127 are not written by this loop.
# NOTE(review): presumably a 3x3 block being placed inside a 4x4 matrix with a
# 32-byte column stride -- confirm against tmp.cpp.
.L235: | |
movsd 16(%rbp), %xmm0 | |
movupd 0(%rbp), %xmm5 | |
addq $72, %rbp | |
subq $-128, %rax | |
movupd -48(%rbp), %xmm7 | |
movsd %xmm0, -112(%rax) | |
movsd -32(%rbp), %xmm0 | |
movups %xmm5, -128(%rax) | |
movupd -24(%rbp), %xmm5 | |
movsd %xmm0, -80(%rax) | |
movsd -8(%rbp), %xmm0 | |
movups %xmm7, -96(%rax) | |
movups %xmm5, -64(%rax) | |
movsd %xmm0, -48(%rax) | |
cmpq %rbp, %r12 | |
jne .L235 | |
# ---- Inline asm from tmp.cpp line 50 ----
# Builds a six-quadword block at 80(%rsp): first word 1129578500 (0x43540004),
# remaining five words zero; %rax = address of the block, %rdx = 0.
# The four rotates of %rdi total 128 bit positions (3+13+61+51), so %rdi is
# unchanged, and "xchgq %rbx,%rbx" is a no-op on real hardware.
# NOTE(review): this matches the Valgrind amd64 client-request preamble, and
# 0x43540004 looks like a Callgrind request code (presumably
# START_INSTRUMENTATION) -- confirm against valgrind.h / callgrind.h.
movq $1129578500, 80(%rsp) | |
xorl %edx, %edx | |
movq %r13, %rax | |
movq $0, 88(%rsp) | |
movq $0, 96(%rsp) | |
movq $0, 104(%rsp) | |
movq $0, 112(%rsp) | |
movq $0, 120(%rsp) | |
#APP | |
# 50 "tmp.cpp" 1 | |
rolq $3, %rdi ; rolq $13, %rdi | |
rolq $61, %rdi ; rolq $51, %rdi | |
xchgq %rbx,%rbx | |
# 0 "" 2 | |
#NO_APP | |
# The value left in %rdx by the inline asm is stored to 8(%rsp) and read back;
# the reloaded value is not used afterwards.
leaq 16(%rsp), %rdi | |
movq %rdx, 8(%rsp) | |
movq 8(%rsp), %rax | |
# Run both benchmarks, passing the address of each {begin, finish, end}
# triple. An exception from either call unwinds to landing pad .L246, which
# frees both buffers.
.LEHB22: | |
call _Z33benchmark_matrix3d_multiplicationRKSt6vectorIN5Eigen6MatrixIdLi3ELi3ELi0ELi3ELi3EEESaIS2_EE | |
leaq 48(%rsp), %rdi | |
call _Z33benchmark_matrix4d_multiplicationRKSt6vectorIN5Eigen6MatrixIdLi4ELi4ELi0ELi4ELi4EEESaIS2_EE | |
.LEHE22: | |
# Normal-path cleanup: operator delete(begin, end_of_storage - begin) for the
# second buffer, then for the first; each is skipped when begin is null.
movq 48(%rsp), %rdi | |
testq %rdi, %rdi | |
je .L236 | |
movq 64(%rsp), %rsi | |
subq %rdi, %rsi | |
call _ZdlPvm@PLT | |
.L236: | |
movq 16(%rsp), %rdi | |
testq %rdi, %rdi | |
je .L230 | |
movq 32(%rsp), %rsi | |
subq %rdi, %rsi | |
call _ZdlPvm@PLT | |
# Epilogue: verify the stack canary, release the frame, restore callee-saved
# registers in reverse push order.
.L230: | |
movq 136(%rsp), %rax | |
subq %fs:40, %rax | |
jne .L260 | |
addq $152, %rsp | |
.cfi_remember_state | |
.cfi_def_cfa_offset 40 | |
popq %rbx | |
.cfi_def_cfa_offset 32 | |
popq %rbp | |
.cfi_def_cfa_offset 24 | |
popq %r12 | |
.cfi_def_cfa_offset 16 | |
popq %r13 | |
.cfi_def_cfa_offset 8 | |
ret | |
# Alignment assertion failed:
# __assert_fail(%rdi = .LC6, %rsi = .LC5, %edx = 109, %rcx = .LC18).
# .LC5 and .LC6 are defined earlier in the file; the call does not return.
.L233: | |
.cfi_restore_state | |
leaq .LC18(%rip), %rcx | |
movl $109, %edx | |
leaq .LC5(%rip), %rsi | |
leaq .LC6(%rip), %rdi | |
call __assert_fail@PLT | |
# Stack canary mismatch.
.L260: | |
call __stack_chk_fail@PLT | |
# Landing pad for the LEHB22 region (benchmark calls): keep the value passed in
# %rax in %rbx (later handed to _Unwind_Resume) and continue in the cold
# section, freeing both buffers.
.L246: | |
endbr64 | |
movq %rax, %rbx | |
jmp .L238 | |
# Landing pad for the LEHB21 region (second operator new): same, but the cold
# path entered at .L242 frees only the first buffer.
.L247: | |
endbr64 | |
movq %rax, %rbx | |
jmp .L242 | |
# ---- LSDA (exception table) for the hot part ----
# Header bytes: 0xff = landing-pad base omitted (function start is used),
# 0xff = no type table, 0x1 = call-site entries are uleb128 encoded.
# Each call-site entry is: region start, region length, landing pad
# (0 = none), action (0 = cleanup only).
.section .gcc_except_table,"a",@progbits | |
.LLSDA9389: | |
.byte 0xff | |
.byte 0xff | |
.byte 0x1 | |
.uleb128 .LLSDACSE9389-.LLSDACSB9389 | |
.LLSDACSB9389: | |
.uleb128 .LEHB20-.LFB9389 | |
.uleb128 .LEHE20-.LEHB20 | |
.uleb128 0 | |
.uleb128 0 | |
.uleb128 .LEHB21-.LFB9389 | |
.uleb128 .LEHE21-.LEHB21 | |
.uleb128 .L247-.LFB9389 | |
.uleb128 0 | |
.uleb128 .LEHB22-.LFB9389 | |
.uleb128 .LEHE22-.LEHB22 | |
.uleb128 .L246-.LFB9389 | |
.uleb128 0 | |
.LLSDACSE9389: | |
.text | |
.cfi_endproc | |
#-----------------------------------------------------------------------
# _Z31benchmark_matrix_multiplicationv.cold
# Cold (exception-cleanup) part of benchmark_matrix_multiplication(), placed
# in .text.unlikely. It is only reached by jumps from the landing pads .L246
# and .L247 in the hot part and runs on the hot part's stack frame (the CFI
# below re-describes that frame: CFA offset 192, same saved registers).
#   In:  %rbx = value the landing pad received in %rax; it is passed
#               unchanged to _Unwind_Resume
#   Frame slots read: 16/32(%rsp) and 48/64(%rsp) = begin / end-of-storage of
#   the two buffers; 136(%rsp) = stack canary copy.
#   Does not return to its caller: it ends in _Unwind_Resume or
#   __stack_chk_fail.
#-----------------------------------------------------------------------
.section .text.unlikely | |
.cfi_startproc | |
.cfi_personality 0x9b,DW.ref.__gxx_personality_v0 | |
.cfi_lsda 0x1b,.LLSDAC9389 | |
.type _Z31benchmark_matrix_multiplicationv.cold, @function | |
_Z31benchmark_matrix_multiplicationv.cold: | |
.LFSB9389: | |
# Entry from .L246 (a benchmark call threw): free the second buffer, then fall
# through to free the first one.
.L238: | |
.cfi_def_cfa_offset 192 | |
.cfi_offset 3, -40 | |
.cfi_offset 6, -32 | |
.cfi_offset 12, -24 | |
.cfi_offset 13, -16 | |
# operator delete(begin, end_of_storage - begin), skipped when begin is null.
movq 48(%rsp), %rdi | |
movq 64(%rsp), %rsi | |
subq %rdi, %rsi | |
testq %rdi, %rdi | |
je .L239 | |
call _ZdlPvm@PLT | |
.L239: | |
movq 16(%rsp), %rdi | |
movq 32(%rsp), %rsi | |
subq %rdi, %rsi | |
testq %rdi, %rdi | |
je .L241 | |
.L240: | |
call _ZdlPvm@PLT | |
# Check the stack canary, then continue unwinding with the saved %rbx value.
.L241: | |
movq 136(%rsp), %rax | |
subq %fs:40, %rax | |
jne .L261 | |
movq %rbx, %rdi | |
.LEHB23: | |
call _Unwind_Resume@PLT | |
.LEHE23: | |
# Entry from .L247 (second operator new threw): only the first buffer exists.
# It jumps straight to the delete call at .L240, bypassing the null test.
.L242: | |
movq 16(%rsp), %rdi | |
movq 32(%rsp), %rsi | |
subq %rdi, %rsi | |
jmp .L240 | |
.L261: | |
call __stack_chk_fail@PLT | |
.cfi_endproc | |
.LFE9389: | |
# LSDA for the cold part: a single call-site entry covering the _Unwind_Resume
# call, with no landing pad and no action. The region start is expressed
# relative to .LCOLDB20, the start of the cold range.
.section .gcc_except_table | |
.LLSDAC9389: | |
.byte 0xff | |
.byte 0xff | |
.byte 0x1 | |
.uleb128 .LLSDACSEC9389-.LLSDACSBC9389 | |
.LLSDACSBC9389: | |
.uleb128 .LEHB23-.LCOLDB20 | |
.uleb128 .LEHE23-.LEHB23 | |
.uleb128 0 | |
.uleb128 0 | |
.LLSDACSEC9389: | |
# Symbol sizes for the hot and cold parts, each computed in its own section,
# followed by the end markers of the cold (.LCOLDE20) and hot (.LHOTE20) ranges.
.section .text.unlikely | |
.text | |
.size _Z31benchmark_matrix_multiplicationv, .-_Z31benchmark_matrix_multiplicationv | |
.section .text.unlikely | |
.size _Z31benchmark_matrix_multiplicationv.cold, .-_Z31benchmark_matrix_multiplicationv.cold | |
.LCOLDE20: | |
.text | |
.LHOTE20: | |
#-----------------------------------------------------------------------
# main
# ABI:  System V AMD64
# Does: calls benchmark_matrix_multiplication() and returns 0.
# Out:  %eax = 0
# Placed in .text.startup.
#-----------------------------------------------------------------------
.section .text.startup,"ax",@progbits | |
.p2align 4 | |
.globl main | |
.type main, @function | |
main: | |
.LFB9391: | |
.cfi_startproc | |
endbr64 | |
# On entry %rsp is 8 modulo 16 (return address pushed); subtracting 8 makes it
# 16-byte aligned at the call below.
subq $8, %rsp | |
.cfi_def_cfa_offset 16 | |
call _Z31benchmark_matrix_multiplicationv | |
# Return value 0.
xorl %eax, %eax | |
addq $8, %rsp | |
.cfi_def_cfa_offset 8 | |
ret | |
.cfi_endproc | |
.LFE9391: | |
.size main, .-main | |
# ---- Constant pool ----
# x86-64 is little-endian, so for each 8-byte constant written as two .long
# values the first .long is the low 32 bits and the second the high 32 bits.
# Mergeable 8-byte constants.
.section .rodata.cst8,"aM",@progbits,8 | |
.align 8 | |
# .LC0 = 0x41DFFFFFFFC00000 = double 2147483647.0 (2^31 - 1).
.LC0: | |
.long -4194304 | |
.long 1105199103 | |
.align 8 | |
# .LC2 = 0x401921FB54442D18 = double 6.283185307179586 (2*pi).
.LC2: | |
.long 1413754136 | |
.long 1075388923 | |
# .LC3 is an alias for .LC12; an 8-byte load through it reads the double 1.0.
.set .LC3,.LC12 | |
# Relocated read-only data: two pointers, each to a vtable symbol plus 16.
.section .data.rel.ro,"aw" | |
.align 8 | |
.LC7: | |
.quad _ZTVNSt7__cxx1115basic_stringbufIcSt11char_traitsIcESaIcEEE+16 | |
.align 8 | |
.LC8: | |
.quad _ZTVSt15basic_streambufIcSt11char_traitsIcEE+16 | |
# Mergeable 2-byte constants: one character followed by a NUL byte.
.section .rodata.cst2,"aM",@progbits,2 | |
.align 2 | |
# .LC9 = "\n" (byte 10).
.LC9: | |
.byte 10 | |
.byte 0 | |
.align 2 | |
# .LC10 = " " (byte 32).
.LC10: | |
.byte 32 | |
.byte 0 | |
.section .rodata.cst8 | |
.align 8 | |
# .LC11 = 0x00000000FFFFFFFF (low 32 bits set). Its use is outside this part
# of the file.
.LC11: | |
.long -1 | |
.long 0 | |
# Mergeable 16-byte constants, 16-byte aligned: each holds two doubles.
.section .rodata.cst16,"aM",@progbits,16 | |
.align 16 | |
# .LC12 = { 1.0, 0.0 }  (1072693248 = 0x3FF00000, the high word of 1.0).
.LC12: | |
.long 0 | |
.long 1072693248 | |
.long 0 | |
.long 0 | |
.align 16 | |
# .LC16 = { 0.0, 1.0 }.
.LC16: | |
.long 0 | |
.long 0 | |
.long 0 | |
.long 1072693248 | |
# Hidden, weak, COMDAT 8-byte data object holding the address of
# __gxx_personality_v0. The .cfi_personality directives in this file refer to
# the personality routine through this object.
.hidden DW.ref.__gxx_personality_v0 | |
.weak DW.ref.__gxx_personality_v0 | |
.section .data.rel.local.DW.ref.__gxx_personality_v0,"awG",@progbits,DW.ref.__gxx_personality_v0,comdat | |
.align 8 | |
.type DW.ref.__gxx_personality_v0, @object | |
.size DW.ref.__gxx_personality_v0, 8 | |
DW.ref.__gxx_personality_v0: | |
.quad __gxx_personality_v0 | |
# Compiler identification string.
.ident "GCC: (Ubuntu 13.1.0-8ubuntu1~20.04.2) 13.1.0" | |
# Empty .note.GNU-stack section with no flags (in particular no "x"), i.e. no
# executable stack is requested.
.section .note.GNU-stack,"",@progbits | |
# ELF note: name size (1f - 0f), descriptor size (4f - 1f), type 5, name "GNU".
# The descriptor is one property: type 0xc0000002, data size (3f - 2f),
# value 0x3, padded to 8 bytes.
# NOTE(review): note type 5 with property 0xc0000002 is presumably
# NT_GNU_PROPERTY_TYPE_0 / GNU_PROPERTY_X86_FEATURE_1_AND, with 0x3 = IBT |
# SHSTK (consistent with the endbr64 instructions in this file) -- confirm
# against the x86-64 psABI.
.section .note.gnu.property,"a" | |
.align 8 | |
.long 1f - 0f | |
.long 4f - 1f | |
.long 5 | |
0: | |
.string "GNU" | |
1: | |
.align 8 | |
.long 0xc0000002 | |
.long 3f - 2f | |
2: | |
.long 0x3 | |
3: | |
.align 8 | |
4: |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment