# sum_float64_sse4 -- excerpt of compiler-generated x86-64 assembly, written with
# Intel operand order (destination first, `xmmword ptr [...]` memory operands).
#
# NOTE(review): the number at the start of every line looks like the line's
# position in the full listing. The gaps between those numbers suggest that the
# instructions in between (prologue, loop control, the packed adds, the return)
# are not shown here -- confirm against the complete file before relying on any
# of the notes below.
#
# Judging only by the name, the routine presumably sums an array of float64
# values; the argument registers and the way the result is returned are not
# visible in this excerpt -- TODO confirm with the caller / C prototype.
#
# What the visible lines do establish:
#   - rdi is used as a base address and rcx as an index scaled by 8 bytes.
#   - All vector loads are movupd, i.e. they do not require 16-byte alignment.
#   - A scalar path accumulates into the low lane of xmm0 with addsd.
#
# Export the symbol and mark it as a function for the linker/debugger.
4 .globl sum_float64_sse4
6 .type sum_float64_sse4,@function
7 sum_float64_sse4: # @sum_float64_sse4
# Loop at .LBB0_9: the two loads below read 32 contiguous bytes (four doubles)
# starting at rdi + 8*rcx into xmm2 and xmm3. What is done with them afterwards
# is not shown in this excerpt.
35 .LBB0_9: # =>This Inner Loop Header: Depth=1
36 movupd xmm2, xmmword ptr [rdi + 8*rcx]
37 movupd xmm3, xmmword ptr [rdi + 8*rcx + 16]
# Loop at .LBB0_4: scalar path. addsd adds the single double stored at [rax]
# into the low lane of xmm0. How rax advances is not visible here.
50 .LBB0_4: # =>This Inner Loop Header: Depth=1
51 addsd xmm0, qword ptr [rax]
# Store the low double of xmm0 to the address held in rdx.
# NOTE(review): presumably this writes the final sum through an output
# pointer -- the origin of rdx is not shown; confirm.
56 movsd qword ptr [rdx], xmm0
# rcx = rdi + 8*rcx + 112. From here on rcx is an address rather than an index;
# the +112 bias matches the loads below, whose displacements run from -112 up
# to 0.
70 lea rcx, [rdi + 8*rcx + 112]
# Loop at .LBB0_12: eight unaligned 16-byte loads at displacements
# -112, -96, ..., -16, 0 relative to rcx. Together they cover a contiguous
# 128-byte window (sixteen doubles) and fill xmm2-xmm7, xmm0 and xmm1.
# The instructions that combine these registers fall in the gaps of this
# excerpt (embedded lines 77-78 and 81-84 are missing) -- TODO confirm.
72 .LBB0_12: # =>This Inner Loop Header: Depth=1
73 movupd xmm2, xmmword ptr [rcx - 112]
74 movupd xmm3, xmmword ptr [rcx - 96]
75 movupd xmm4, xmmword ptr [rcx - 80]
76 movupd xmm5, xmmword ptr [rcx - 64]
79 movupd xmm6, xmmword ptr [rcx - 48]
80 movupd xmm7, xmmword ptr [rcx - 32]
# These two loads overwrite xmm0 and xmm1 entirely, so whatever those
# registers held before must already have been consumed by this point
# (presumably by the omitted lines above -- confirm).
85 movupd xmm0, xmmword ptr [rcx - 16]
86 movupd xmm1, xmmword ptr [rcx]
# Record the symbol's size as the distance from its entry label to
# .Lfunc_end0 (that label itself is not shown in this excerpt).
99 .size sum_float64_sse4, .Lfunc_end0-sum_float64_sse4
# File trailer emitted by the compiler; neither directive generates code.
# .ident embeds the producing compiler's version string in the object file.
102 .ident "Apple LLVM version 9.0.0 (clang-900.0.39.2)"
# An empty .note.GNU-stack section (no flags, @progbits) is the GNU toolchain
# convention for declaring that this object does not need an executable stack.
103 .section ".note.GNU-stack","",@progbits