Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 7 of 7 for VPMOVMSKB (0.44 sec)

  1. src/internal/bytealg/count_amd64.s

    	// Precompute two addresses (LEAQ only does address arithmetic, no load):
    	//   R11 = SI + BX - 64, used below as the loop bound for DI
    	//   R13 = SI + BX, not used within this excerpt
    	// NOTE(review): SI/BX look like buffer base and length — confirm
    	// against the part of the function above this excerpt.
    	LEAQ -64(SI)(BX*1), R11
    	LEAQ (SI)(BX*1), R13
    	// Replicate the low byte of X0 into every byte lane of Y1.
    	VPBROADCASTB  X0, Y1
    	PCALIGN $32
    // Each iteration examines 64 bytes at DI as two 32-byte vectors and
    // adds the number of bytes equal to the broadcast byte in Y1 to R12.
    avx2_loop:
    	VMOVDQU (DI), Y2
    	VMOVDQU 32(DI), Y4
    	// Matching byte lanes become 0xFF, non-matching lanes 0x00.
    	VPCMPEQB Y1, Y2, Y3
    	VPCMPEQB Y1, Y4, Y5
    	// Collapse each compare result to a 32-bit mask, one bit per byte.
    	VPMOVMSKB Y3, DX
    	VPMOVMSKB Y5, CX
    	// Set bits in a mask == number of matching bytes in that vector.
    	POPCNTL DX, DX
    	POPCNTL CX, CX
    	ADDQ DX, R12
    	ADDQ CX, R12
    	// Advance to the next 64-byte block; keep looping while DI <= R11
    	// (JLE is a signed comparison).
    	ADDQ $64, DI
    	CMPQ DI, R11
    	JLE avx2_loop
    
    	// If last block is already processed,
    	// skip to the end.
    	//
    Registered: Wed Jun 12 16:32:35 UTC 2024
    - Last Modified: Fri Oct 06 20:54:43 UTC 2023
    - 4.7K bytes
    - Viewed (0)
  2. src/internal/bytealg/compare_amd64.s

    	// Loop is unrolled and uses AVX2.
    	// Each iteration compares 64 bytes at SI with 64 bytes at DI as two
    	// 32-byte halves, branching out as soon as a half contains a mismatch.
    big_loop_avx2:
    	VMOVDQU	(SI), Y2
    	VMOVDQU	(DI), Y3
    	VMOVDQU	32(SI), Y4
    	VMOVDQU	32(DI), Y5
    	// First half: equal byte lanes become 0xFF; the mask gets one bit per byte.
    	VPCMPEQB Y2, Y3, Y0
    	VPMOVMSKB Y0, AX
    	// Invert the mask so that a set bit marks a differing byte;
    	// a non-zero result means the first 32 bytes differ somewhere.
    	XORL	$0xffffffff, AX
    	JNE	diff32_avx2
    	// Second half (bytes 32..63), same test.
    	VPCMPEQB Y4, Y5, Y6
    	VPMOVMSKB Y6, AX
    	XORL	$0xffffffff, AX
    	JNE	diff64_avx2
    
    	// All 64 bytes matched: advance both pointers and reduce the count in R8.
    	ADDQ	$64, SI
    	ADDQ	$64, DI
    	SUBQ	$64, R8
    	// Leave the loop once fewer than 64 remain in R8 (unsigned compare).
    	CMPQ	R8, $64
    	JB	big_loop_avx2_exit
    	JMP	big_loop_avx2
    
    Registered: Wed Jun 12 16:32:35 UTC 2024
    - Last Modified: Thu Aug 18 17:17:01 UTC 2022
    - 4.3K bytes
    - Viewed (0)
  3. src/internal/bytealg/index_amd64.s

    // Slide a 32-byte window forward one byte at a time, comparing the
    // 32 bytes at DI against Y1 until every byte matches or DI reaches DX.
    // NOTE(review): Y1 is loaded before this excerpt — presumably the
    // 32-byte pattern being searched for; confirm against the caller code.
    loop32:
    	VMOVDQU (DI), Y2
    	VPCMPEQB Y1, Y2, Y3
    	// One mask bit per byte lane; all 32 bits set means all 32 bytes are equal.
    	VPMOVMSKB Y3, SI
    	CMPL  SI, $0xffffffff
    	JE   success_avx2
    	// No full match at this position: move on by a single byte.
    	ADDQ $1,DI
    	// Continue while DI < DX (unsigned compare); otherwise report failure.
    	CMPQ DI,DX
    	JB loop32
    	JMP fail_avx2
    _33_to_63:
    	LEAQ 1(DI)(DX*1), DX
    	SUBQ AX, DX
    	VMOVDQU -32(R8)(AX*1), Y0
    	VMOVDQU (R8), Y1
    loop33to63:
    	VMOVDQU (DI), Y2
    	VPCMPEQB Y1, Y2, Y3
    	VPMOVMSKB Y3, SI
    	CMPL  SI, $0xffffffff
    	JE   partial_success33to63
    Registered: Wed Jun 12 16:32:35 UTC 2024
    - Last Modified: Mon Aug 07 00:20:48 UTC 2023
    - 5.1K bytes
    - Viewed (0)
  4. src/internal/bytealg/equal_amd64.s

    	PCALIGN $16
    // Compare 64 bytes at SI with 64 bytes at DI per iteration while at
    // least 64 remain in BX. On the first mismatch, return 0 in AX.
    hugeloop_avx2:
    	// Fewer than 64 left (unsigned compare): hand over to bigloop_avx2.
    	CMPQ	BX, $64
    	JB	bigloop_avx2
    	VMOVDQU	(SI), Y0
    	VMOVDQU	(DI), Y1
    	VMOVDQU	32(SI), Y2
    	VMOVDQU	32(DI), Y3
    	// Per-byte equality of both 32-byte halves, combined with AND so a
    	// lane in Y6 is 0xFF only when both halves matched in that lane.
    	VPCMPEQB	Y1, Y0, Y4
    	VPCMPEQB	Y2, Y3, Y5
    	VPAND	Y4, Y5, Y6
    	VPMOVMSKB Y6, DX
    	// Pointers and count are advanced before the test; the CMPL below
    	// sets the flags that JEQ consumes.
    	ADDQ	$64, SI
    	ADDQ	$64, DI
    	SUBQ	$64, BX
    	// All 32 mask bits set means all 64 bytes were equal: keep looping.
    	CMPL	DX, $0xffffffff
    	JEQ	hugeloop_avx2
    	// Mismatch found: clear the upper YMM state before returning.
    	VZEROUPPER
    	XORQ	AX, AX	// return 0
    	RET
    
    bigloop_avx2:
    	VZEROUPPER
    
    Registered: Wed Jun 12 16:32:35 UTC 2024
    - Last Modified: Fri Nov 17 16:34:40 UTC 2023
    - 2.8K bytes
    - Viewed (0)
  5. src/internal/bytealg/indexbyte_amd64.s

    	ADDQ $32, DI
    	CMPQ DI, R11
    	JLT avx2_loop
    	MOVQ R11, DI
    	VMOVDQU (DI), Y2
    	VPCMPEQB Y1, Y2, Y3
    	VPTEST Y3, Y3
    	JNZ avx2success
    	VZEROUPPER
    	MOVQ $-1, (R8)
    	RET
    
    avx2success:
    	VPMOVMSKB Y3, DX
    	BSFL DX, DX
    	SUBQ SI, DI
    	ADDQ DI, DX
    	MOVQ DX, (R8)
    	VZEROUPPER
    Registered: Wed Jun 12 16:32:35 UTC 2024
    - Last Modified: Wed Nov 01 19:06:01 UTC 2023
    - 3.1K bytes
    - Viewed (0)
  6. src/cmd/internal/obj/x86/anames.go

    Registered: Wed Jun 12 16:32:35 UTC 2024
    - Last Modified: Tue Apr 11 18:32:50 UTC 2023
    - 19.1K bytes
    - Viewed (0)
  7. src/cmd/asm/internal/asm/testdata/amd64enc.s

    	VPMINUW Y11, Y15, Y11                   // c442053adb
    	VPMOVMSKB X2, DX                        // c4e179d7d2 or c5f9d7d2
    	VPMOVMSKB X11, DX                       // c4c179d7d3
    	VPMOVMSKB X2, R11                       // c46179d7da or c579d7da
    	VPMOVMSKB X11, R11                      // c44179d7db
    	VPMOVMSKB Y2, DX                        // c4e17dd7d2 or c5fdd7d2
    	VPMOVMSKB Y11, DX                       // c4c17dd7d3
    Registered: Wed Jun 12 16:32:35 UTC 2024
    - Last Modified: Fri Oct 08 21:38:44 UTC 2021
    - 581.9K bytes
    - Viewed (0)
Back to top