main/exp-bbv/tests/x86/fldcw_check.S - platform/external/valgrind - Git at Google


 .globl _start

 _start:
         # This code tests for the fldcw "load floating point command word"
 	#   instruction.  On most x86 processors the retired_instruction
 	#   performance counter counts this as one instruction.  However,
 	#   on Pentium 4 systems it counts as two.  Therefore this can
 	#   affect BBV results on such a system.
 	# fldcw is most often used to set the rouding mode when doing
 	#   floating point to integer conversions

 	# It is encoded as "d9 /5" which means
 	#   1101 1001 xx10 1yyy
 	# Where xx is the "mod" which will be 00, 01, or 10 indicating offset
 	#   and yyy is the register field


         # these are instructions with similar encodings to fldcw
 	# that can cause false positives if the test isn't explicit enough
 similar:
         fld1   	   	       		# d9 e8
 	fldl2t				# d9 e9
 	fldl2e				# d9 ea
 	fldpi				# d9 eb
 	fldlg2				# d9 ec
 	fldln2				# d9 ed
 	fldz				# d9 ee

 	# check some varied ways of calling fldcw


 	# offset on stack
 stack:
 	sub	$4,%esp			# allocate space on stack
 	fnstcw	2(%esp)
 	fldcw	2(%esp)
 	add	$4,%esp			# restore stack

 	# 32-bit register

 	fnstcw	cw
 	mov	$cw,%eax
 	fldcw	0(%eax)			# eax
 	mov	$cw,%ebx
 	fldcw	0(%ebx)			# ebx
 	mov	$cw,%ecx
 	fldcw	0(%ecx)			# ecx
 	mov	$cw,%edx
 	fldcw	0(%edx)			# edx

 	# register + 8-bit offset
 eight_bit:
 	mov	$cw,%eax
 	sub	$32,%eax

 	fldcw	32(%eax)		# eax + 8 bit offset
 	mov	%eax,%ebx
 	fldcw	32(%ebx)		# ebx + 8 bit offset
 	mov	%eax,%ecx
 	fldcw	32(%ecx)		# ecx + 8 bit offset
 	mov	%eax,%edx
 	fldcw	32(%edx)		# edx + 8 bit offset

 	# register + 32-bit offset
 thirtytwo_bit:
 	mov	$cw,%eax
 	sub	$30000,%eax

 	fldcw	30000(%eax)		# eax + 16 bit offset
 	mov	%eax,%ebx
 	fldcw	30000(%ebx)		# ebx + 16 bit offset
 	mov	%eax,%ecx
 	fldcw	30000(%ecx)		# ecx + 16 bit offset
 	mov	%eax,%edx
 	fldcw	30000(%edx)		# edx + 16 bit offset

 	# check an fp/integer conversion
 	# in a loop to give a bigger count

 	mov	$1024,%ecx
 big_loop:

 	fldl	three			# load value onto fp stack
 	fnstcw	saved_cw		# store control word to mem
 	movzwl	saved_cw, %eax		# load cw from mem, zero extending
 	movb	$12, %ah		# set cw for "round to zero"
 	movw	%ax, cw			# store back to memory
 	fldcw	cw   			# save new rounding mode
 	fistpl	result			# save stack value as integer to mem
 	fldcw	saved_cw		# restore old cw

 	loop	big_loop		# loop to make the count more obvious

 	movl	result, %ebx		# sanity check to see if the
 	cmp	$3,%ebx			# result is the expected one
 	je	exit

 print_error:
 	mov 	$4,%eax			# write syscall
 #ifdef VGO_darwin
 	pushl	$1
 	pushl	$error
 	pushl	$22
 #else
 	mov	$1,%ebx			# stdout
 	mov	$error,%ecx		# string
 	mov 	$22,%edx		# length of string
 #endif
 	int 	$0x80

 exit:
 #ifdef VGO_darwin
 	pushl	result
 #else
 	movl	result, %ebx		# load converted value
 #endif
 	movl	$1,	%eax		# SYSCALL_EXIT
 	int	$0x80


 .data
 saved_cw:	.long 0
 cw:  	.long	0
 result: .long	0
 three:	.long	0			# a floating point 3.0
 	.long	1074266112
 error:	.asciz  "Error!  Wrong result!\n"

	.globl _start

	_start:
	# This code tests for the fldcw "load floating point command word"
	# instruction. On most x86 processors the retired_instruction
	# performance counter counts this as one instruction. However,
	# on Pentium 4 systems it counts as two. Therefore this can
	# affect BBV results on such a system.
	# fldcw is most often used to set the rouding mode when doing
	# floating point to integer conversions

	# It is encoded as "d9 /5" which means
	# 1101 1001 xx10 1yyy
	# Where xx is the "mod" which will be 00, 01, or 10 indicating offset
	# and yyy is the register field



	# these are instructions with similar encodings to fldcw
	# that can cause false positives if the test isn't explicit enough
	similar:
	fld1 # d9 e8
	fldl2t # d9 e9
	fldl2e # d9 ea
	fldpi # d9 eb
	fldlg2 # d9 ec
	fldln2 # d9 ed
	fldz # d9 ee

	# check some varied ways of calling fldcw


	# offset on stack
	stack:
	sub $4,%esp # allocate space on stack
	fnstcw 2(%esp)
	fldcw 2(%esp)
	add $4,%esp # restore stack

	# 32-bit register

	fnstcw cw
	mov $cw,%eax
	fldcw 0(%eax) # eax
	mov $cw,%ebx
	fldcw 0(%ebx) # ebx
	mov $cw,%ecx
	fldcw 0(%ecx) # ecx
	mov $cw,%edx
	fldcw 0(%edx) # edx

	# register + 8-bit offset
	eight_bit:
	mov $cw,%eax
	sub $32,%eax

	fldcw 32(%eax) # eax + 8 bit offset
	mov %eax,%ebx
	fldcw 32(%ebx) # ebx + 8 bit offset
	mov %eax,%ecx
	fldcw 32(%ecx) # ecx + 8 bit offset
	mov %eax,%edx
	fldcw 32(%edx) # edx + 8 bit offset

	# register + 32-bit offset
	thirtytwo_bit:
	mov $cw,%eax
	sub $30000,%eax

	fldcw 30000(%eax) # eax + 16 bit offset
	mov %eax,%ebx
	fldcw 30000(%ebx) # ebx + 16 bit offset
	mov %eax,%ecx
	fldcw 30000(%ecx) # ecx + 16 bit offset
	mov %eax,%edx
	fldcw 30000(%edx) # edx + 16 bit offset

	# check an fp/integer conversion
	# in a loop to give a bigger count

	mov $1024,%ecx
	big_loop:

	fldl three # load value onto fp stack
	fnstcw saved_cw # store control word to mem
	movzwl saved_cw, %eax # load cw from mem, zero extending
	movb $12, %ah # set cw for "round to zero"
	movw %ax, cw # store back to memory
	fldcw cw # save new rounding mode
	fistpl result # save stack value as integer to mem
	fldcw saved_cw # restore old cw

	loop big_loop # loop to make the count more obvious

	movl result, %ebx # sanity check to see if the
	cmp $3,%ebx # result is the expected one
	je exit

	print_error:
	mov $4,%eax # write syscall
	#ifdef VGO_darwin
	pushl $1
	pushl $error
	pushl $22
	#else
	mov $1,%ebx # stdout
	mov $error,%ecx # string
	mov $22,%edx # length of string
	#endif
	int $0x80

	exit:
	#ifdef VGO_darwin
	pushl result
	#else
	movl result, %ebx # load converted value
	#endif
	movl $1, %eax # SYSCALL_EXIT
	int $0x80



	.data
	saved_cw: .long 0
	cw: .long 0
	result: .long 0
	three: .long 0 # a floating point 3.0
	.long 1074266112
	error: .asciz "Error! Wrong result!\n"