Diff 12264

test/CodeGen/X86/atomic_mi.ll

Show All 12 Lines
; The binary operations supported are currently add, and, or, xor.		; The binary operations supported are currently add, and, or, xor.
; sub is not supported because it is translated into an addition of the		; sub is not supported because it is translated into an addition of the
; negated immediate.		; negated immediate.
; Finally, we also check the same kind of pattern for inc/dec		; Finally, we also check the same kind of pattern for inc/dec

; seq_cst stores are left as (lock) xchgl, but we try to check every other		; seq_cst stores are left as (lock) xchgl, but we try to check every other
; attribute at least once.		; attribute at least once.

		; Please note that these operations do not require the lock prefix: only
		; sequentially consistent stores require this kind of protection on X86.

define void @store_atomic_imm_8(i8* %p) {		define void @store_atomic_imm_8(i8* %p) {
; X64-LABEL: store_atomic_imm_8		; X64-LABEL: store_atomic_imm_8
; X64: movb		; X64: movb
; X64-NOT: movb		; X64-NOT: movb
; X32-LABEL: store_atomic_imm_8		; X32-LABEL: store_atomic_imm_8
; X32: movb		; X32: movb
; X32-NOT: movb		; X32-NOT: movb
store atomic i8 42, i8* %p release, align 1		store atomic i8 42, i8* %p release, align 1
▲ Show 20 Lines • Show All 56 Lines • ▼ Show 20 Lines	; X32: xchgl
store atomic i32 42, i32* %p seq_cst, align 4		store atomic i32 42, i32* %p seq_cst, align 4
ret void		ret void
}		}

; ----- ADD -----		; ----- ADD -----

define void @add_8(i8* %p) {		define void @add_8(i8* %p) {
; X64-LABEL: add_8		; X64-LABEL: add_8
		; X64-NOT: lock
; X64: addb		; X64: addb
; X64-NOT: movb		; X64-NOT: movb
; X32-LABEL: add_8		; X32-LABEL: add_8
		; X32-NOT: lock
; X32: addb		; X32: addb
; X32-NOT: movb		; X32-NOT: movb
%1 = load atomic i8* %p seq_cst, align 1		%1 = load atomic i8* %p seq_cst, align 1
%2 = add i8 %1, 2		%2 = add i8 %1, 2
store atomic i8 %2, i8* %p release, align 1		store atomic i8 %2, i8* %p release, align 1
ret void		ret void
}		}

define void @add_16(i16* %p) {		define void @add_16(i16* %p) {
; Currently the transformation is not done on 16-bit accesses, as the backend		; Currently the transformation is not done on 16-bit accesses, as the backend
; treats 16-bit arithmetic as expensive on X86/X86_64.		; treats 16-bit arithmetic as expensive on X86/X86_64.
; X64-LABEL: add_16		; X64-LABEL: add_16
; X64-NOT: addw		; X64-NOT: addw
; X32-LABEL: add_16		; X32-LABEL: add_16
; X32-NOT: addw		; X32-NOT: addw
%1 = load atomic i16* %p acquire, align 2		%1 = load atomic i16* %p acquire, align 2
%2 = add i16 %1, 2		%2 = add i16 %1, 2
store atomic i16 %2, i16* %p release, align 2		store atomic i16 %2, i16* %p release, align 2
ret void		ret void
}		}

define void @add_32(i32* %p) {		define void @add_32(i32* %p) {
; X64-LABEL: add_32		; X64-LABEL: add_32
		; X64-NOT: lock
; X64: addl		; X64: addl
; X64-NOT: movl		; X64-NOT: movl
; X32-LABEL: add_32		; X32-LABEL: add_32
		; X32-NOT: lock
; X32: addl		; X32: addl
; X32-NOT: movl		; X32-NOT: movl
%1 = load atomic i32* %p acquire, align 4		%1 = load atomic i32* %p acquire, align 4
%2 = add i32 %1, 2		%2 = add i32 %1, 2
store atomic i32 %2, i32* %p monotonic, align 4		store atomic i32 %2, i32* %p monotonic, align 4
ret void		ret void
}		}

define void @add_64(i64* %p) {		define void @add_64(i64* %p) {
; X64-LABEL: add_64		; X64-LABEL: add_64
		; X64-NOT: lock
; X64: addq		; X64: addq
; X64-NOT: movq		; X64-NOT: movq
; We do not check X86-32 as it cannot do 'addq'.		; We do not check X86-32 as it cannot do 'addq'.
; X32-LABEL: add_64		; X32-LABEL: add_64
%1 = load atomic i64* %p acquire, align 8		%1 = load atomic i64* %p acquire, align 8
%2 = add i64 %1, 2		%2 = add i64 %1, 2
store atomic i64 %2, i64* %p release, align 8		store atomic i64 %2, i64* %p release, align 8
ret void		ret void
Show All 9 Lines	; X32: xchgl
store atomic i32 %2, i32* %p seq_cst, align 4		store atomic i32 %2, i32* %p seq_cst, align 4
ret void		ret void
}		}

; ----- AND -----		; ----- AND -----

define void @and_8(i8* %p) {		define void @and_8(i8* %p) {
; X64-LABEL: and_8		; X64-LABEL: and_8
		; X64-NOT: lock
; X64: andb		; X64: andb
; X64-NOT: movb		; X64-NOT: movb
; X32-LABEL: and_8		; X32-LABEL: and_8
		; X32-NOT: lock
; X32: andb		; X32: andb
; X32-NOT: movb		; X32-NOT: movb
%1 = load atomic i8* %p monotonic, align 1		%1 = load atomic i8* %p monotonic, align 1
%2 = and i8 %1, 2		%2 = and i8 %1, 2
store atomic i8 %2, i8* %p release, align 1		store atomic i8 %2, i8* %p release, align 1
ret void		ret void
}		}

define void @and_16(i16* %p) {		define void @and_16(i16* %p) {
; Currently the transformation is not done on 16-bit accesses, as the backend		; Currently the transformation is not done on 16-bit accesses, as the backend
; treats 16-bit arithmetic as expensive on X86/X86_64.		; treats 16-bit arithmetic as expensive on X86/X86_64.
; X64-LABEL: and_16		; X64-LABEL: and_16
; X64-NOT: andw		; X64-NOT: andw
; X32-LABEL: and_16		; X32-LABEL: and_16
; X32-NOT: andw		; X32-NOT: andw
%1 = load atomic i16* %p acquire, align 2		%1 = load atomic i16* %p acquire, align 2
%2 = and i16 %1, 2		%2 = and i16 %1, 2
store atomic i16 %2, i16* %p release, align 2		store atomic i16 %2, i16* %p release, align 2
ret void		ret void
}		}

define void @and_32(i32* %p) {		define void @and_32(i32* %p) {
; X64-LABEL: and_32		; X64-LABEL: and_32
		; X64-NOT: lock
; X64: andl		; X64: andl
; X64-NOT: movl		; X64-NOT: movl
; X32-LABEL: and_32		; X32-LABEL: and_32
		; X32-NOT: lock
; X32: andl		; X32: andl
; X32-NOT: movl		; X32-NOT: movl
%1 = load atomic i32* %p acquire, align 4		%1 = load atomic i32* %p acquire, align 4
%2 = and i32 %1, 2		%2 = and i32 %1, 2
store atomic i32 %2, i32* %p release, align 4		store atomic i32 %2, i32* %p release, align 4
ret void		ret void
}		}

define void @and_64(i64* %p) {		define void @and_64(i64* %p) {
; X64-LABEL: and_64		; X64-LABEL: and_64
		; X64-NOT: lock
; X64: andq		; X64: andq
; X64-NOT: movq		; X64-NOT: movq
; We do not check X86-32 as it cannot do 'andq'.		; We do not check X86-32 as it cannot do 'andq'.
; X32-LABEL: and_64		; X32-LABEL: and_64
%1 = load atomic i64* %p acquire, align 8		%1 = load atomic i64* %p acquire, align 8
%2 = and i64 %1, 2		%2 = and i64 %1, 2
store atomic i64 %2, i64* %p release, align 8		store atomic i64 %2, i64* %p release, align 8
ret void		ret void
}		}

		define void @and_32_seq_cst(i32* %p) {
		; X64-LABEL: and_32_seq_cst
		; X64: xchgl
		; X32-LABEL: and_32_seq_cst
		; X32: xchgl
		[Inline review comment by reames — unsubmitted, not done] Shouldn't there be a lock prefix on this one to enforce the StoreLoad barrier required by cst? cst is w.r.t. all addresses (unlike every other ordering mode...)
		%1 = load atomic i32* %p monotonic, align 4
		%2 = and i32 %1, 2
		store atomic i32 %2, i32* %p seq_cst, align 4
		ret void
		}

; ----- OR -----		; ----- OR -----

define void @or_8(i8* %p) {		define void @or_8(i8* %p) {
; X64-LABEL: or_8		; X64-LABEL: or_8
		; X64-NOT: lock
; X64: orb		; X64: orb
; X64-NOT: movb		; X64-NOT: movb
; X32-LABEL: or_8		; X32-LABEL: or_8
		; X32-NOT: lock
; X32: orb		; X32: orb
; X32-NOT: movb		; X32-NOT: movb
%1 = load atomic i8* %p acquire, align 1		%1 = load atomic i8* %p acquire, align 1
%2 = or i8 %1, 2		%2 = or i8 %1, 2
store atomic i8 %2, i8* %p release, align 1		store atomic i8 %2, i8* %p release, align 1
ret void		ret void
}		}

define void @or_16(i16* %p) {		define void @or_16(i16* %p) {
; X64-LABEL: or_16		; X64-LABEL: or_16
; X64-NOT: orw		; X64-NOT: orw
; X32-LABEL: or_16		; X32-LABEL: or_16
; X32-NOT: orw		; X32-NOT: orw
%1 = load atomic i16* %p acquire, align 2		%1 = load atomic i16* %p acquire, align 2
%2 = or i16 %1, 2		%2 = or i16 %1, 2
store atomic i16 %2, i16* %p release, align 2		store atomic i16 %2, i16* %p release, align 2
ret void		ret void
}		}

define void @or_32(i32* %p) {		define void @or_32(i32* %p) {
; X64-LABEL: or_32		; X64-LABEL: or_32
		; X64-NOT: lock
; X64: orl		; X64: orl
; X64-NOT: movl		; X64-NOT: movl
; X32-LABEL: or_32		; X32-LABEL: or_32
		; X32-NOT: lock
; X32: orl		; X32: orl
; X32-NOT: movl		; X32-NOT: movl
%1 = load atomic i32* %p acquire, align 4		%1 = load atomic i32* %p acquire, align 4
%2 = or i32 %1, 2		%2 = or i32 %1, 2
store atomic i32 %2, i32* %p release, align 4		store atomic i32 %2, i32* %p release, align 4
ret void		ret void
}		}

define void @or_64(i64* %p) {		define void @or_64(i64* %p) {
; X64-LABEL: or_64		; X64-LABEL: or_64
		; X64-NOT: lock
; X64: orq		; X64: orq
; X64-NOT: movq		; X64-NOT: movq
; We do not check X86-32 as it cannot do 'orq'.		; We do not check X86-32 as it cannot do 'orq'.
; X32-LABEL: or_64		; X32-LABEL: or_64
%1 = load atomic i64* %p acquire, align 8		%1 = load atomic i64* %p acquire, align 8
%2 = or i64 %1, 2		%2 = or i64 %1, 2
store atomic i64 %2, i64* %p release, align 8		store atomic i64 %2, i64* %p release, align 8
ret void		ret void
}		}

		define void @or_32_seq_cst(i32* %p) {
		; X64-LABEL: or_32_seq_cst
		; X64: xchgl
		; X32-LABEL: or_32_seq_cst
		; X32: xchgl
		%1 = load atomic i32* %p monotonic, align 4
		%2 = or i32 %1, 2
		store atomic i32 %2, i32* %p seq_cst, align 4
		[Inline review comment by reames — unsubmitted, not done] Same here.
		ret void
		}

; ----- XOR -----		; ----- XOR -----

define void @xor_8(i8* %p) {		define void @xor_8(i8* %p) {
; X64-LABEL: xor_8		; X64-LABEL: xor_8
		; X64-NOT: lock
; X64: xorb		; X64: xorb
; X64-NOT: movb		; X64-NOT: movb
; X32-LABEL: xor_8		; X32-LABEL: xor_8
		; X32-NOT: lock
; X32: xorb		; X32: xorb
; X32-NOT: movb		; X32-NOT: movb
%1 = load atomic i8* %p acquire, align 1		%1 = load atomic i8* %p acquire, align 1
%2 = xor i8 %1, 2		%2 = xor i8 %1, 2
store atomic i8 %2, i8* %p release, align 1		store atomic i8 %2, i8* %p release, align 1
ret void		ret void
}		}

define void @xor_16(i16* %p) {		define void @xor_16(i16* %p) {
; X64-LABEL: xor_16		; X64-LABEL: xor_16
; X64-NOT: xorw		; X64-NOT: xorw
; X32-LABEL: xor_16		; X32-LABEL: xor_16
; X32-NOT: xorw		; X32-NOT: xorw
%1 = load atomic i16* %p acquire, align 2		%1 = load atomic i16* %p acquire, align 2
%2 = xor i16 %1, 2		%2 = xor i16 %1, 2
store atomic i16 %2, i16* %p release, align 2		store atomic i16 %2, i16* %p release, align 2
ret void		ret void
}		}

define void @xor_32(i32* %p) {		define void @xor_32(i32* %p) {
; X64-LABEL: xor_32		; X64-LABEL: xor_32
		; X64-NOT: lock
; X64: xorl		; X64: xorl
; X64-NOT: movl		; X64-NOT: movl
; X32-LABEL: xor_32		; X32-LABEL: xor_32
		; X32-NOT: lock
; X32: xorl		; X32: xorl
; X32-NOT: movl		; X32-NOT: movl
%1 = load atomic i32* %p acquire, align 4		%1 = load atomic i32* %p acquire, align 4
%2 = xor i32 %1, 2		%2 = xor i32 %1, 2
store atomic i32 %2, i32* %p release, align 4		store atomic i32 %2, i32* %p release, align 4
ret void		ret void
}		}

define void @xor_64(i64* %p) {		define void @xor_64(i64* %p) {
; X64-LABEL: xor_64		; X64-LABEL: xor_64
		; X64-NOT: lock
; X64: xorq		; X64: xorq
; X64-NOT: movq		; X64-NOT: movq
; We do not check X86-32 as it cannot do 'xorq'.		; We do not check X86-32 as it cannot do 'xorq'.
; X32-LABEL: xor_64		; X32-LABEL: xor_64
%1 = load atomic i64* %p acquire, align 8		%1 = load atomic i64* %p acquire, align 8
%2 = xor i64 %1, 2		%2 = xor i64 %1, 2
store atomic i64 %2, i64* %p release, align 8		store atomic i64 %2, i64* %p release, align 8
ret void		ret void
}		}

		define void @xor_32_seq_cst(i32* %p) {
		; X64-LABEL: xor_32_seq_cst
		; X64: xchgl
		; X32-LABEL: xor_32_seq_cst
		; X32: xchgl
		[Inline review comment by reames — unsubmitted, not done] Again, lock prefix?
		%1 = load atomic i32* %p monotonic, align 4
		%2 = xor i32 %1, 2
		store atomic i32 %2, i32* %p seq_cst, align 4
		ret void
		}

; ----- INC -----		; ----- INC -----

define void @inc_8(i8* %p) {		define void @inc_8(i8* %p) {
; X64-LABEL: inc_8		; X64-LABEL: inc_8
		; X64-NOT: lock
; X64: incb		; X64: incb
; X64-NOT: movb		; X64-NOT: movb
; X32-LABEL: inc_8		; X32-LABEL: inc_8
		; X32-NOT: lock
; X32: incb		; X32: incb
; X32-NOT: movb		; X32-NOT: movb
%1 = load atomic i8* %p seq_cst, align 1		%1 = load atomic i8* %p seq_cst, align 1
%2 = add i8 %1, 1		%2 = add i8 %1, 1
store atomic i8 %2, i8* %p release, align 1		store atomic i8 %2, i8* %p release, align 1
ret void		ret void
}		}

define void @inc_16(i16* %p) {		define void @inc_16(i16* %p) {
; Currently the transformation is not done on 16-bit accesses, as the backend		; Currently the transformation is not done on 16-bit accesses, as the backend
; treats 16-bit arithmetic as expensive on X86/X86_64.		; treats 16-bit arithmetic as expensive on X86/X86_64.
; X64-LABEL: inc_16		; X64-LABEL: inc_16
; X64-NOT: incw		; X64-NOT: incw
; X32-LABEL: inc_16		; X32-LABEL: inc_16
; X32-NOT: incw		; X32-NOT: incw
%1 = load atomic i16* %p acquire, align 2		%1 = load atomic i16* %p acquire, align 2
%2 = add i16 %1, 1		%2 = add i16 %1, 1
store atomic i16 %2, i16* %p release, align 2		store atomic i16 %2, i16* %p release, align 2
ret void		ret void
}		}

define void @inc_32(i32* %p) {		define void @inc_32(i32* %p) {
; X64-LABEL: inc_32		; X64-LABEL: inc_32
		; X64-NOT: lock
; X64: incl		; X64: incl
; X64-NOT: movl		; X64-NOT: movl
; X32-LABEL: inc_32		; X32-LABEL: inc_32
		; X32-NOT: lock
; X32: incl		; X32: incl
; X32-NOT: movl		; X32-NOT: movl
%1 = load atomic i32* %p acquire, align 4		%1 = load atomic i32* %p acquire, align 4
%2 = add i32 %1, 1		%2 = add i32 %1, 1
store atomic i32 %2, i32* %p monotonic, align 4		store atomic i32 %2, i32* %p monotonic, align 4
ret void		ret void
}		}

define void @inc_64(i64* %p) {		define void @inc_64(i64* %p) {
; X64-LABEL: inc_64		; X64-LABEL: inc_64
		; X64-NOT: lock
; X64: incq		; X64: incq
; X64-NOT: movq		; X64-NOT: movq
; We do not check X86-32 as it cannot do 'incq'.		; We do not check X86-32 as it cannot do 'incq'.
; X32-LABEL: inc_64		; X32-LABEL: inc_64
%1 = load atomic i64* %p acquire, align 8		%1 = load atomic i64* %p acquire, align 8
%2 = add i64 %1, 1		%2 = add i64 %1, 1
store atomic i64 %2, i64* %p release, align 8		store atomic i64 %2, i64* %p release, align 8
ret void		ret void
Show All 9 Lines	; X32: xchgl
store atomic i32 %2, i32* %p seq_cst, align 4		store atomic i32 %2, i32* %p seq_cst, align 4
ret void		ret void
}		}

; ----- DEC -----		; ----- DEC -----

define void @dec_8(i8* %p) {		define void @dec_8(i8* %p) {
; X64-LABEL: dec_8		; X64-LABEL: dec_8
		; X64-NOT: lock
; X64: decb		; X64: decb
; X64-NOT: movb		; X64-NOT: movb
; X32-LABEL: dec_8		; X32-LABEL: dec_8
		; X32-NOT: lock
; X32: decb		; X32: decb
; X32-NOT: movb		; X32-NOT: movb
%1 = load atomic i8* %p seq_cst, align 1		%1 = load atomic i8* %p seq_cst, align 1
%2 = sub i8 %1, 1		%2 = sub i8 %1, 1
store atomic i8 %2, i8* %p release, align 1		store atomic i8 %2, i8* %p release, align 1
ret void		ret void
}		}

define void @dec_16(i16* %p) {		define void @dec_16(i16* %p) {
; Currently the transformation is not done on 16-bit accesses, as the backend		; Currently the transformation is not done on 16-bit accesses, as the backend
; treats 16-bit arithmetic as expensive on X86/X86_64.		; treats 16-bit arithmetic as expensive on X86/X86_64.
; X64-LABEL: dec_16		; X64-LABEL: dec_16
; X64-NOT: decw		; X64-NOT: decw
; X32-LABEL: dec_16		; X32-LABEL: dec_16
; X32-NOT: decw		; X32-NOT: decw
%1 = load atomic i16* %p acquire, align 2		%1 = load atomic i16* %p acquire, align 2
%2 = sub i16 %1, 1		%2 = sub i16 %1, 1
store atomic i16 %2, i16* %p release, align 2		store atomic i16 %2, i16* %p release, align 2
ret void		ret void
}		}

define void @dec_32(i32* %p) {		define void @dec_32(i32* %p) {
; X64-LABEL: dec_32		; X64-LABEL: dec_32
		; X64-NOT: lock
; X64: decl		; X64: decl
; X64-NOT: movl		; X64-NOT: movl
; X32-LABEL: dec_32		; X32-LABEL: dec_32
		; X32-NOT: lock
; X32: decl		; X32: decl
; X32-NOT: movl		; X32-NOT: movl
%1 = load atomic i32* %p acquire, align 4		%1 = load atomic i32* %p acquire, align 4
%2 = sub i32 %1, 1		%2 = sub i32 %1, 1
store atomic i32 %2, i32* %p monotonic, align 4		store atomic i32 %2, i32* %p monotonic, align 4
ret void		ret void
}		}

define void @dec_64(i64* %p) {		define void @dec_64(i64* %p) {
; X64-LABEL: dec_64		; X64-LABEL: dec_64
		; X64-NOT: lock
; X64: decq		; X64: decq
; X64-NOT: movq		; X64-NOT: movq
; We do not check X86-32 as it cannot do 'decq'.		; We do not check X86-32 as it cannot do 'decq'.
; X32-LABEL: dec_64		; X32-LABEL: dec_64
%1 = load atomic i64* %p acquire, align 8		%1 = load atomic i64* %p acquire, align 8
%2 = sub i64 %1, 1		%2 = sub i64 %1, 1
store atomic i64 %2, i64* %p release, align 8		store atomic i64 %2, i64* %p release, align 8
ret void		ret void
Show All 12 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[X86] Allow atomic operations using immediates to avoid using a register
Closed · Public

Details

Diff Detail

Event Timeline

Revision Contents

Diff 12264

test/CodeGen/X86/atomic_mi.ll

This is an archive of the discontinued LLVM Phabricator instance.

[X86] Allow atomic operations using immediates to avoid using a register
Closed · Public

Details

Diff Detail

Event Timeline

Revision Contents

Diff 12264

test/CodeGen/X86/atomic_mi.ll

[X86] Allow atomic operations using immediates to avoid using a register
Closed · Public