| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | 	.file	"shr_Xsig.S" | 
 | 2 | /*---------------------------------------------------------------------------+ | 
 | 3 |  |  shr_Xsig.S                                                               | | 
 | 4 |  |                                                                           | | 
 | 5 |  | 12 byte right shift function                                              | | 
 | 6 |  |                                                                           | | 
 | 7 |  | Copyright (C) 1992,1994,1995                                              | | 
 | 8 |  |                       W. Metzenthen, 22 Parker St, Ormond, Vic 3163,      | | 
 | 9 |  |                       Australia.  E-mail billm@jacobi.maths.monash.edu.au | | 
 | 10 |  |                                                                           | | 
 | 11 |  | Call from C as:                                                           | | 
 | 12 |  |   void shr_Xsig(Xsig *arg, unsigned nr)                                   | | 
 | 13 |  |                                                                           | | 
 | 14 |  |   Extended shift right function.                                          | | 
 | 15 |  |   Fastest for small shifts.                                               | | 
 | 16 |  |   Shifts the 12 byte quantity pointed to by the first arg (arg)           | | 
 | 17 |  |   right by the number of bits specified by the second arg (nr).           | | 
 | 18 |  |                                                                           | | 
 | 19 |  +---------------------------------------------------------------------------*/ | 
 | 20 |  | 
 | 21 | #include "fpu_emu.h" | 
 | 22 |  | 
 | 23 | .text | 
 | 24 | ENTRY(shr_Xsig) | 
 | 25 | 	push	%ebp | 
 | 26 | 	movl	%esp,%ebp | 
 | 27 | 	pushl	%esi | 
 | 28 | 	movl	PARAM2,%ecx | 
 | 29 | 	movl	PARAM1,%esi | 
 | 30 | 	cmpl	$32,%ecx	/* shrd only works for 0..31 bits */ | 
 | 31 | 	jnc	L_more_than_31 | 
 | 32 |  | 
 | 33 | /* less than 32 bits */ | 
 | 34 | 	pushl	%ebx | 
 | 35 | 	movl	(%esi),%eax	/* lsl */ | 
 | 36 | 	movl	4(%esi),%ebx	/* midl */ | 
 | 37 | 	movl	8(%esi),%edx	/* msl */ | 
 | 38 | 	shrd	%cl,%ebx,%eax | 
 | 39 | 	shrd	%cl,%edx,%ebx | 
 | 40 | 	shr	%cl,%edx | 
 | 41 | 	movl	%eax,(%esi) | 
 | 42 | 	movl	%ebx,4(%esi) | 
 | 43 | 	movl	%edx,8(%esi) | 
 | 44 | 	popl	%ebx | 
 | 45 | 	popl	%esi | 
 | 46 | 	leave | 
 | 47 | 	ret | 
 | 48 |  | 
 | 49 | L_more_than_31: | 
 | 50 | 	cmpl	$64,%ecx | 
 | 51 | 	jnc	L_more_than_63 | 
 | 52 |  | 
 | 53 | 	subb	$32,%cl | 
 | 54 | 	movl	4(%esi),%eax	/* midl */ | 
 | 55 | 	movl	8(%esi),%edx	/* msl */ | 
 | 56 | 	shrd	%cl,%edx,%eax | 
 | 57 | 	shr	%cl,%edx | 
 | 58 | 	movl	%eax,(%esi) | 
 | 59 | 	movl	%edx,4(%esi) | 
 | 60 | 	movl	$0,8(%esi) | 
 | 61 | 	popl	%esi | 
 | 62 | 	leave | 
 | 63 | 	ret | 
 | 64 |  | 
 | 65 | L_more_than_63: | 
 | 66 | 	cmpl	$96,%ecx | 
 | 67 | 	jnc	L_more_than_95 | 
 | 68 |  | 
 | 69 | 	subb	$64,%cl | 
 | 70 | 	movl	8(%esi),%eax	/* msl */ | 
 | 71 | 	shr	%cl,%eax | 
 | 72 | 	xorl	%edx,%edx | 
 | 73 | 	movl	%eax,(%esi) | 
 | 74 | 	movl	%edx,4(%esi) | 
 | 75 | 	movl	%edx,8(%esi) | 
 | 76 | 	popl	%esi | 
 | 77 | 	leave | 
 | 78 | 	ret | 
 | 79 |  | 
 | 80 | L_more_than_95: | 
 | 81 | 	xorl	%eax,%eax | 
 | 82 | 	movl	%eax,(%esi) | 
 | 83 | 	movl	%eax,4(%esi) | 
 | 84 | 	movl	%eax,8(%esi) | 
 | 85 | 	popl	%esi | 
 | 86 | 	leave | 
 | 87 | 	ret |