294 lines
		
	
	
		
			8.1 KiB
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			294 lines
		
	
	
		
			8.1 KiB
		
	
	
	
		
			LLVM
		
	
	
	
| ; RUN: llc < %s -mtriple=x86_64-apple-macosx10.9 -verify-machineinstrs -mattr=cx16 | FileCheck %s
 | |
| 
 | |
| @var = global i128 0
 | |
| 
 | |
| define i128 @val_compare_and_swap(i128* %p, i128 %oldval, i128 %newval) {
 | |
| ; CHECK-LABEL: val_compare_and_swap:
 | |
| ; Due to the scheduling right after isel for cmpxchg and given the
 | |
| ; machine scheduler and copy coalescer do not mess up with physical
 | |
| ; register live-ranges, we end up with a useless copy.
 | |
| ;
 | |
| ; CHECK: movq %rcx, [[TMP:%r[0-9a-z]+]]
 | |
| ; CHECK: movq %rsi, %rax
 | |
| ; CHECK: movq %r8, %rcx
 | |
| ; CHECK: movq [[TMP]], %rbx
 | |
| ; CHECK: lock
 | |
| ; CHECK: cmpxchg16b (%rdi)
 | |
| 
 | |
|   %pair = cmpxchg i128* %p, i128 %oldval, i128 %newval acquire acquire
 | |
|   %val = extractvalue { i128, i1 } %pair, 0
 | |
|   ret i128 %val
 | |
| }
 | |
| 
 | |
| define void @fetch_and_nand(i128* %p, i128 %bits) {
 | |
| ; CHECK-LABEL: fetch_and_nand:
 | |
| ; CHECK-DAG:     movq %rdx, [[INCHI:%[a-z0-9]+]]
 | |
| ; CHECK-DAG:     movq (%rdi), %rax
 | |
| ; CHECK-DAG:     movq 8(%rdi), %rdx
 | |
| 
 | |
| ; CHECK: [[LOOP:.?LBB[0-9]+_[0-9]+]]:
 | |
| ; CHECK:         movq %rdx, %rcx
 | |
| ; CHECK:         andq [[INCHI]], %rcx
 | |
| ; CHECK:         movq %rax, %rbx
 | |
|   ; INCLO equivalent comes in in %rsi, so it makes sense it stays there.
 | |
| ; CHECK:         andq %rsi, %rbx
 | |
| ; CHECK:         notq %rbx
 | |
| ; CHECK:         notq %rcx
 | |
| ; CHECK:         lock
 | |
| ; CHECK:         cmpxchg16b (%rdi)
 | |
| ; CHECK:         jne [[LOOP]]
 | |
| 
 | |
| ; CHECK:         movq %rax, _var
 | |
| ; CHECK:         movq %rdx, _var+8
 | |
|   %val = atomicrmw nand i128* %p, i128 %bits release
 | |
|   store i128 %val, i128* @var, align 16
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define void @fetch_and_or(i128* %p, i128 %bits) {
 | |
| ; CHECK-LABEL: fetch_and_or:
 | |
| ; CHECK-DAG:     movq %rdx, [[INCHI:%[a-z0-9]+]]
 | |
| ; CHECK-DAG:     movq (%rdi), %rax
 | |
| ; CHECK-DAG:     movq 8(%rdi), %rdx
 | |
| 
 | |
| ; CHECK: [[LOOP:.?LBB[0-9]+_[0-9]+]]:
 | |
| ; CHECK:         movq %rax, %rbx
 | |
|   ; INCLO equivalent comes in in %rsi, so it makes sense it stays there.
 | |
| ; CHECK:         orq %rsi, %rbx
 | |
| ; CHECK:         movq %rdx, %rcx
 | |
| ; CHECK:         orq [[INCHI]], %rcx
 | |
| ; CHECK:         lock
 | |
| ; CHECK:         cmpxchg16b (%rdi)
 | |
| ; CHECK:         jne [[LOOP]]
 | |
| 
 | |
| ; CHECK:         movq %rax, _var
 | |
| ; CHECK:         movq %rdx, _var+8
 | |
| 
 | |
|   %val = atomicrmw or i128* %p, i128 %bits seq_cst
 | |
|   store i128 %val, i128* @var, align 16
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define void @fetch_and_add(i128* %p, i128 %bits) {
 | |
| ; CHECK-LABEL: fetch_and_add:
 | |
| ; CHECK-DAG:     movq %rdx, [[INCHI:%[a-z0-9]+]]
 | |
| ; CHECK-DAG:     movq (%rdi), %rax
 | |
| ; CHECK-DAG:     movq 8(%rdi), %rdx
 | |
| 
 | |
| ; CHECK: [[LOOP:.?LBB[0-9]+_[0-9]+]]:
 | |
| ; CHECK:         movq %rax, %rbx
 | |
|   ; INCLO equivalent comes in in %rsi, so it makes sense it stays there.
 | |
| ; CHECK:         addq %rsi, %rbx
 | |
| ; CHECK:         movq %rdx, %rcx
 | |
| ; CHECK:         adcq [[INCHI]], %rcx
 | |
| ; CHECK:         lock
 | |
| ; CHECK:         cmpxchg16b (%rdi)
 | |
| ; CHECK:         jne [[LOOP]]
 | |
| 
 | |
| ; CHECK:         movq %rax, _var
 | |
| ; CHECK:         movq %rdx, _var+8
 | |
| 
 | |
|   %val = atomicrmw add i128* %p, i128 %bits seq_cst
 | |
|   store i128 %val, i128* @var, align 16
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define void @fetch_and_sub(i128* %p, i128 %bits) {
 | |
| ; CHECK-LABEL: fetch_and_sub:
 | |
| ; CHECK-DAG:     movq %rdx, [[INCHI:%[a-z0-9]+]]
 | |
| ; CHECK-DAG:     movq (%rdi), %rax
 | |
| ; CHECK-DAG:     movq 8(%rdi), %rdx
 | |
| 
 | |
| ; CHECK: [[LOOP:.?LBB[0-9]+_[0-9]+]]:
 | |
| ; CHECK:         movq %rax, %rbx
 | |
|   ; INCLO equivalent comes in in %rsi, so it makes sense it stays there.
 | |
| ; CHECK:         subq %rsi, %rbx
 | |
| ; CHECK:         movq %rdx, %rcx
 | |
| ; CHECK:         sbbq [[INCHI]], %rcx
 | |
| ; CHECK:         lock
 | |
| ; CHECK:         cmpxchg16b (%rdi)
 | |
| ; CHECK:         jne [[LOOP]]
 | |
| 
 | |
| ; CHECK:         movq %rax, _var
 | |
| ; CHECK:         movq %rdx, _var+8
 | |
| 
 | |
|   %val = atomicrmw sub i128* %p, i128 %bits seq_cst
 | |
|   store i128 %val, i128* @var, align 16
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define void @fetch_and_min(i128* %p, i128 %bits) {
 | |
| ; CHECK-LABEL: fetch_and_min:
 | |
| ; CHECK-DAG:     movq %rdx, [[INCHI:%[a-z0-9]+]]
 | |
| ; CHECK-DAG:     movq (%rdi), %rax
 | |
| ; CHECK-DAG:     movq 8(%rdi), %rdx
 | |
| 
 | |
| ; CHECK: [[LOOP:.?LBB[0-9]+_[0-9]+]]:
 | |
| ; CHECK:         cmpq
 | |
| ; CHECK:         sbbq
 | |
| ; CHECK:         setg
 | |
| ; CHECK:         cmovneq %rax, %rbx
 | |
| ; CHECK:         movq [[INCHI]], %rcx
 | |
| ; CHECK:         cmovneq %rdx, %rcx
 | |
| ; CHECK:         lock
 | |
| ; CHECK:         cmpxchg16b (%rdi)
 | |
| ; CHECK:         jne [[LOOP]]
 | |
| 
 | |
| ; CHECK:         movq %rax, _var
 | |
| ; CHECK:         movq %rdx, _var+8
 | |
| 
 | |
|   %val = atomicrmw min i128* %p, i128 %bits seq_cst
 | |
|   store i128 %val, i128* @var, align 16
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define void @fetch_and_max(i128* %p, i128 %bits) {
 | |
| ; CHECK-LABEL: fetch_and_max:
 | |
| ; CHECK-DAG:     movq %rdx, [[INCHI:%[a-z0-9]+]]
 | |
| ; CHECK-DAG:     movq (%rdi), %rax
 | |
| ; CHECK-DAG:     movq 8(%rdi), %rdx
 | |
| 
 | |
| ; CHECK: [[LOOP:.?LBB[0-9]+_[0-9]+]]:
 | |
| ; CHECK:         cmpq
 | |
| ; CHECK:         sbbq
 | |
| ; CHECK:         setge
 | |
| ; CHECK:         cmovneq %rax, %rbx
 | |
| ; CHECK:         movq [[INCHI]], %rcx
 | |
| ; CHECK:         cmovneq %rdx, %rcx
 | |
| ; CHECK:         lock
 | |
| ; CHECK:         cmpxchg16b (%rdi)
 | |
| ; CHECK:         jne [[LOOP]]
 | |
| 
 | |
| ; CHECK:         movq %rax, _var
 | |
| ; CHECK:         movq %rdx, _var+8
 | |
| 
 | |
|   %val = atomicrmw max i128* %p, i128 %bits seq_cst
 | |
|   store i128 %val, i128* @var, align 16
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define void @fetch_and_umin(i128* %p, i128 %bits) {
 | |
| ; CHECK-LABEL: fetch_and_umin:
 | |
| ; CHECK-DAG:     movq %rdx, [[INCHI:%[a-z0-9]+]]
 | |
| ; CHECK-DAG:     movq (%rdi), %rax
 | |
| ; CHECK-DAG:     movq 8(%rdi), %rdx
 | |
| 
 | |
| ; CHECK: [[LOOP:.?LBB[0-9]+_[0-9]+]]:
 | |
| ; CHECK:         cmpq
 | |
| ; CHECK:         sbbq
 | |
| ; CHECK:         seta
 | |
| ; CHECK:         cmovneq %rax, %rbx
 | |
| ; CHECK:         movq [[INCHI]], %rcx
 | |
| ; CHECK:         cmovneq %rdx, %rcx
 | |
| ; CHECK:         lock
 | |
| ; CHECK:         cmpxchg16b (%rdi)
 | |
| ; CHECK:         jne [[LOOP]]
 | |
| 
 | |
| ; CHECK:         movq %rax, _var
 | |
| ; CHECK:         movq %rdx, _var+8
 | |
| 
 | |
|   %val = atomicrmw umin i128* %p, i128 %bits seq_cst
 | |
|   store i128 %val, i128* @var, align 16
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define void @fetch_and_umax(i128* %p, i128 %bits) {
 | |
| ; CHECK-LABEL: fetch_and_umax:
 | |
| ; CHECK-DAG:     movq %rdx, [[INCHI:%[a-z0-9]+]]
 | |
| ; CHECK-DAG:     movq (%rdi), %rax
 | |
| ; CHECK-DAG:     movq 8(%rdi), %rdx
 | |
| 
 | |
| ; CHECK: [[LOOP:.?LBB[0-9]+_[0-9]+]]:
 | |
| ; CHECK:         cmpq
 | |
| ; CHECK:         sbbq
 | |
| ; CHECK:         setb
 | |
| ; CHECK:         cmovneq %rax, %rbx
 | |
| ; CHECK:         movq [[INCHI]], %rcx
 | |
| ; CHECK:         cmovneq %rdx, %rcx
 | |
| ; CHECK:         lock
 | |
| ; CHECK:         cmpxchg16b (%rdi)
 | |
| ; CHECK:         jne [[LOOP]]
 | |
| 
 | |
| ; CHECK:         movq %rax, _var
 | |
| ; CHECK:         movq %rdx, _var+8
 | |
| 
 | |
|   %val = atomicrmw umax i128* %p, i128 %bits seq_cst
 | |
|   store i128 %val, i128* @var, align 16
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define i128 @atomic_load_seq_cst(i128* %p) {
 | |
| ; CHECK-LABEL: atomic_load_seq_cst:
 | |
| ; CHECK: xorl %eax, %eax
 | |
| ; CHECK: xorl %edx, %edx
 | |
| ; CHECK: xorl %ecx, %ecx
 | |
| ; CHECK: xorl %ebx, %ebx
 | |
| ; CHECK: lock
 | |
| ; CHECK: cmpxchg16b (%rdi)
 | |
| 
 | |
|    %r = load atomic i128, i128* %p seq_cst, align 16
 | |
|    ret i128 %r
 | |
| }
 | |
| 
 | |
| define i128 @atomic_load_relaxed(i128* %p) {
 | |
| ; CHECK: atomic_load_relaxed:
 | |
| ; CHECK: xorl %eax, %eax
 | |
| ; CHECK: xorl %edx, %edx
 | |
| ; CHECK: xorl %ecx, %ecx
 | |
| ; CHECK: xorl %ebx, %ebx
 | |
| ; CHECK: lock
 | |
| ; CHECK: cmpxchg16b (%rdi)
 | |
| 
 | |
|    %r = load atomic i128, i128* %p monotonic, align 16
 | |
|    ret i128 %r
 | |
| }
 | |
| 
 | |
| define void @atomic_store_seq_cst(i128* %p, i128 %in) {
 | |
| ; CHECK-LABEL: atomic_store_seq_cst:
 | |
| ; CHECK:         movq %rdx, %rcx
 | |
| ; CHECK:         movq %rsi, %rbx
 | |
| ; CHECK:         movq (%rdi), %rax
 | |
| ; CHECK:         movq 8(%rdi), %rdx
 | |
| 
 | |
| ; CHECK: [[LOOP:.?LBB[0-9]+_[0-9]+]]:
 | |
| ; CHECK:         lock
 | |
| ; CHECK:         cmpxchg16b (%rdi)
 | |
| ; CHECK:         jne [[LOOP]]
 | |
| ; CHECK-NOT:     callq ___sync_lock_test_and_set_16
 | |
| 
 | |
|    store atomic i128 %in, i128* %p seq_cst, align 16
 | |
|    ret void
 | |
| }
 | |
| 
 | |
| define void @atomic_store_release(i128* %p, i128 %in) {
 | |
| ; CHECK-LABEL: atomic_store_release:
 | |
| ; CHECK:         movq %rdx, %rcx
 | |
| ; CHECK:         movq %rsi, %rbx
 | |
| ; CHECK:         movq (%rdi), %rax
 | |
| ; CHECK:         movq 8(%rdi), %rdx
 | |
| 
 | |
| ; CHECK: [[LOOP:.?LBB[0-9]+_[0-9]+]]:
 | |
| ; CHECK:         lock
 | |
| ; CHECK:         cmpxchg16b (%rdi)
 | |
| ; CHECK:         jne [[LOOP]]
 | |
| 
 | |
|    store atomic i128 %in, i128* %p release, align 16
 | |
|    ret void
 | |
| }
 | |
| 
 | |
| define void @atomic_store_relaxed(i128* %p, i128 %in) {
 | |
| ; CHECK-LABEL: atomic_store_relaxed:
 | |
| ; CHECK:         movq %rdx, %rcx
 | |
| ; CHECK:         movq %rsi, %rbx
 | |
| ; CHECK:         movq (%rdi), %rax
 | |
| ; CHECK:         movq 8(%rdi), %rdx
 | |
| 
 | |
| ; CHECK: [[LOOP:.?LBB[0-9]+_[0-9]+]]:
 | |
| ; CHECK:         lock
 | |
| ; CHECK:         cmpxchg16b (%rdi)
 | |
| ; CHECK:         jne [[LOOP]]
 | |
| 
 | |
|    store atomic i128 %in, i128* %p unordered, align 16
 | |
|    ret void
 | |
| }
 |