fix markers for gromacs-icx-avx512-sp
Signed-off-by: Rafael Ravedutti <rafaelravedutti@gmail.com>
This commit is contained in:
		
										
											Binary file not shown.
										
									
								
							@@ -1331,6 +1331,11 @@ computeForceLJ_2xnn_full:               #
 | 
				
			|||||||
	vxorps	%xmm8, %xmm8, %xmm8
 | 
						vxorps	%xmm8, %xmm8, %xmm8
 | 
				
			||||||
	vxorps	%xmm4, %xmm4, %xmm4
 | 
						vxorps	%xmm4, %xmm4, %xmm4
 | 
				
			||||||
	.p2align	4, 0x90
 | 
						.p2align	4, 0x90
 | 
				
			||||||
 | 
					# LLVM-MCA-BEGIN
 | 
				
			||||||
 | 
					movl      $111, %ebx # OSACA START MARKER
 | 
				
			||||||
 | 
					.byte     100        # OSACA START MARKER
 | 
				
			||||||
 | 
					.byte     103        # OSACA START MARKER
 | 
				
			||||||
 | 
					.byte     144        # OSACA START MARKER
 | 
				
			||||||
.LBB2_12:                               #   Parent Loop BB2_7 Depth=1
 | 
					.LBB2_12:                               #   Parent Loop BB2_7 Depth=1
 | 
				
			||||||
                                        # =>  This Inner Loop Header: Depth=2
 | 
					                                        # =>  This Inner Loop Header: Depth=2
 | 
				
			||||||
	movslq	(%r11,%rax,4), %rcx
 | 
						movslq	(%r11,%rax,4), %rcx
 | 
				
			||||||
@@ -1412,6 +1417,11 @@ computeForceLJ_2xnn_full:               #
 | 
				
			|||||||
	incq	%rax
 | 
						incq	%rax
 | 
				
			||||||
	cmpq	%rax, %r10
 | 
						cmpq	%rax, %r10
 | 
				
			||||||
	jne	.LBB2_12
 | 
						jne	.LBB2_12
 | 
				
			||||||
 | 
					# LLVM-MCA-END
 | 
				
			||||||
 | 
					movl      $222, %ebx # OSACA END MARKER
 | 
				
			||||||
 | 
					.byte     100        # OSACA END MARKER
 | 
				
			||||||
 | 
					.byte     103        # OSACA END MARKER
 | 
				
			||||||
 | 
					.byte     144        # OSACA END MARKER
 | 
				
			||||||
# %bb.13:                               #   in Loop: Header=BB2_7 Depth=1
 | 
					# %bb.13:                               #   in Loop: Header=BB2_7 Depth=1
 | 
				
			||||||
	movq	%r15, %r14
 | 
						movq	%r15, %r14
 | 
				
			||||||
	movq	8(%rsp), %rbp                   # 8-byte Reload
 | 
						movq	8(%rsp), %rbp                   # 8-byte Reload
 | 
				
			||||||
@@ -1655,12 +1665,7 @@ computeForceLJ_4xn_half:                #
 | 
				
			|||||||
	vmovups	64(%rsp), %zmm6                 # 64-byte Reload
 | 
						vmovups	64(%rsp), %zmm6                 # 64-byte Reload
 | 
				
			||||||
	vmovups	512(%rsp), %zmm7                # 64-byte Reload
 | 
						vmovups	512(%rsp), %zmm7                # 64-byte Reload
 | 
				
			||||||
	.p2align	4, 0x90
 | 
						.p2align	4, 0x90
 | 
				
			||||||
movl      $111, %ebx # OSACA START MARKER
 | 
					 | 
				
			||||||
.byte     100        # OSACA START MARKER
 | 
					 | 
				
			||||||
.byte     103        # OSACA START MARKER
 | 
					 | 
				
			||||||
.byte     144        # OSACA START MARKER
 | 
					 | 
				
			||||||
# pointer_increment=64 0f91ac4f7fe1a70d0c899f7f3e745649
 | 
					# pointer_increment=64 0f91ac4f7fe1a70d0c899f7f3e745649
 | 
				
			||||||
# LLVM-MCA-BEGIN
 | 
					 | 
				
			||||||
.LBB4_8:                                # =>This Inner Loop Header: Depth=1
 | 
					.LBB4_8:                                # =>This Inner Loop Header: Depth=1
 | 
				
			||||||
	movslq	(%r11,%rdx,4), %rax
 | 
						movslq	(%r11,%rdx,4), %rax
 | 
				
			||||||
	movq	%rax, %rsi
 | 
						movq	%rax, %rsi
 | 
				
			||||||
@@ -1793,11 +1798,6 @@ movl      $111, %ebx # OSACA START MARKER
 | 
				
			|||||||
	movq	160(%r15), %rdi
 | 
						movq	160(%r15), %rdi
 | 
				
			||||||
	incq	%rdx
 | 
						incq	%rdx
 | 
				
			||||||
	jmp	.LBB4_8
 | 
						jmp	.LBB4_8
 | 
				
			||||||
# LLVM-MCA-END
 | 
					 | 
				
			||||||
movl      $222, %ebx # OSACA END MARKER
 | 
					 | 
				
			||||||
.byte     100        # OSACA END MARKER
 | 
					 | 
				
			||||||
.byte     103        # OSACA END MARKER
 | 
					 | 
				
			||||||
.byte     144        # OSACA END MARKER
 | 
					 | 
				
			||||||
	.p2align	5, 0x90
 | 
						.p2align	5, 0x90
 | 
				
			||||||
.LBB4_18:
 | 
					.LBB4_18:
 | 
				
			||||||
	vzeroupper
 | 
						vzeroupper
 | 
				
			||||||
 
 | 
				
			|||||||
		Reference in New Issue
	
	Block a user