gitee.com/quant1x/num@v0.3.2/asm/c2goasm/test/cpp/MaddMemcpy.s (about)

     1  	.section	__TEXT,__text,regular,pure_instructions	## Mach-O code section (segment __TEXT, section __text)
     2  	.macosx_version_min 10, 11	## minimum deployment target: macOS 10.11
     3  	.intel_syntax noprefix	## Intel operand order (dst, src); registers written without '%'
     4  	.globl	__Z10MaddMemcpyPfS_S_iiS_	## export the symbol so other objects can link against it
     5  	.align	4, 0x90	## on Mach-O the operand is a power of two: 2^4 = 16-byte alignment, padded with 0x90 (nop)
     6  __Z10MaddMemcpyPfS_S_iiS_:              ## @_Z10MaddMemcpyPfS_S_iiS_ -- demangles to MaddMemcpy(float*, float*, float*, int, int, float*)
     7  ## BB#0: single basic block; the six arguments are read from rdi, rsi, rdx, ecx, r8d, r9 (System V AMD64 order)
     8  	push	rbp	## standard frame: save caller's frame pointer ...
     9  	mov	rbp, rsp	## ... and establish this function's frame
    10  	push	r15	## save the callee-saved registers that will hold the arguments across the two calls
    11  	push	r14
    12  	push	r13
    13  	push	r12
    14  	push	rbx
    15  	push	rax	## padding slot only (value never reloaded): 7 pushes + return address = 64 bytes, so rsp is 16-byte aligned at each call
    16  	mov	r14, r9	## r14  = arg6, the pointer the result is stored through at the end
    17  	mov	r15d, r8d	## r15d = arg5 (int), used as the byte count of the second memcpy
    18  	mov	r12, rdx	## r12  = arg3
    19  	mov	r13, rsi	## r13  = arg2
    20  	mov	rbx, rdi	## rbx  = arg1
    21  	movsxd	rdx, ecx	## memcpy size = arg4 sign-extended from 32 to 64 bits
    22  	mov	rdi, r13	## memcpy dest = arg2
    23  	mov	rsi, rbx	## memcpy src  = arg1
    24  	call	_memcpy	## memcpy(arg2, arg1, arg4)
    25  	movsxd	rdx, r15d	## memcpy size = arg5 sign-extended from 32 to 64 bits
    26  	mov	rdi, r12	## memcpy dest = arg3
    27  	mov	rsi, rbx	## memcpy src  = arg1
    28  	call	_memcpy	## memcpy(arg3, arg1, arg5)
    29  	vmovups	ymm0, ymmword ptr [rbx]	## ymm0 = 8 packed floats (32 bytes) from arg1, unaligned load
    30  	vmovups	ymm1, ymmword ptr [r13]	## ymm1 = 8 packed floats from arg2, unaligned load
    31  	vfmadd213ps	ymm1, ymm0, ymmword ptr [r12]	## ymm1 = ymm0 * ymm1 + [r12], i.e. arg1[i] * arg2[i] + arg3[i] for the 8 lanes (fused multiply-add)
    32  	vmovups	ymmword ptr [r14], ymm1	## store the 8 results through arg6, unaligned store
    33  	add	rsp, 8	## discard the padding slot created by 'push rax'
    34  	pop	rbx	## restore callee-saved registers in reverse push order
    35  	pop	r12
    36  	pop	r13
    37  	pop	r14
    38  	pop	r15
    39  	pop	rbp	## restore caller's frame pointer
    40  	vzeroupper	## zero the upper halves of the ymm registers before returning, avoiding AVX/SSE transition penalties in the caller
    41  	ret
    42  
    43  
    44  .subsections_via_symbols	## Mach-O: tells the static linker each section may be split into independent blocks at symbol boundaries (enables dead-code stripping)