24 ani în urmă · fea1b23bcf
--- a/libc/sysdeps/linux/sparc/Makefile
+++ b/libc/sysdeps/linux/sparc/Makefile
@@ -25,13 +25,14 @@ TOPDIR=../../../../
 
				 include $(TOPDIR)Rules.mak
			
 
				 ASFLAGS=$(CFLAGS)
			
 
				 
			
 
				-CRT0=crt0.S
			
 
				-CRT0_OBJ=$(patsubst %.S,%.o, $(CRT0))
			
 
				+CRT0=crt0.c
			
 
				+CRT0_OBJ=$(patsubst %.c,%.o, $(CRT0))
			
 
				 
			
 
				-SSRC=__longjmp.S setjmp.S vfork.S
			
 
				+SSRC=__longjmp.S fork.S vfork.S clone.S setjmp.S bsd-setjmp.S bsd-_setjmp.S \
			
 
				+	urem.S udiv.S umul.S sdiv.S rem.S
			
 
				 SOBJS=$(patsubst %.S,%.o, $(SSRC))
			
 
				 
			
 
				-CSRC=fork.c
			
 
				+CSRC=brk.c
			
 
				 COBJS=$(patsubst %.c,%.o, $(CSRC))
			
 
				 
			
 
				 OBJS=$(SOBJS) $(MOBJ) $(COBJS)
			
@@ -46,7 +47,7 @@ ar-target: $(OBJS) $(CRT0_OBJ)
 
				 	$(AR) $(ARFLAGS) $(LIBC) $(OBJS)
			
 
				 	cp $(CRT0_OBJ) $(TOPDIR)libc/$(CRT0_OBJ)
			
 
				 
			
 
				-$(CRT0_OBJ): %.o : %.S
			
 
				+$(CRT0_OBJ): %.o : %.c
			
 
				 	$(CC) $(CFLAGS) -c $< -o $@
			
 
				 	$(STRIPTOOL) -x -R .note -R .comment $*.o
			
 
				 
			
--- a/libc/sysdeps/linux/sparc/__longjmp.S
+++ b/libc/sysdeps/linux/sparc/__longjmp.S
@@ -2,21 +2,19 @@
 
				    This file is part of the GNU C Library.
			
 
				 
			
 
				    The GNU C Library is free software; you can redistribute it and/or
			
 
				-   modify it under the terms of the GNU Library General Public License as
			
 
				-   published by the Free Software Foundation; either version 2 of the
			
 
				-   License, or (at your option) any later version.
			
 
				+   modify it under the terms of the GNU Lesser General Public
			
 
				+   License as published by the Free Software Foundation; either
			
 
				+   version 2.1 of the License, or (at your option) any later version.
			
 
				 
			
 
				    The GNU C Library is distributed in the hope that it will be useful,
			
 
				    but WITHOUT ANY WARRANTY; without even the implied warranty of
			
 
				    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
			
 
				-   Library General Public License for more details.
			
 
				+   Lesser General Public License for more details.
			
 
				 
			
 
				-   You should have received a copy of the GNU Library General Public
			
 
				-   License along with the GNU C Library; see the file COPYING.LIB.  If not,
			
 
				-   write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
			
 
				-   Boston, MA 02111-1307, USA.  */
			
 
				-
			
 
				-/* Code taken from glibc/sysdeps/sparc/sparc32/  (glibc 2.2.2) */
			
 
				+   You should have received a copy of the GNU Lesser General Public
			
 
				+   License along with the GNU C Library; if not, write to the Free
			
 
				+   Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
			
 
				+   02111-1307 USA.  */
			
 
				 
			
 
				 #include <sysdep.h>
			
 
				 
			
@@ -27,7 +25,11 @@
 
				 #define ST_FLUSH_WINDOWS 3
			
 
				 #define RW_FP [%fp + 0x48]
			
 
				 
			
 
				-ENTRY(__longjmp)
			
 
				+.global   __longjmp;
			
 
				+.align 4;
			
 
				+__longjmp: ; 
			
 
				+.type __longjmp ,@function; 
			
 
				+
			
 
				 	/* Store our arguments in global registers so we can still
			
 
				 	   use them while unwinding frames and their register windows.  */
			
 
				 
			
@@ -40,27 +42,21 @@ ENTRY(__longjmp)
 
				 	xor %fp, %g3, %o0
			
 
				 	add %fp, 512, %o1
			
 
				 	andncc %o0, 4095, %o0
			
 
				-	bne thread
			
 
				-	//bne LOC(thread)
			
 
				+	bne .Lthread
			
 
				 	 cmp %o1, %g3
			
 
				-	bl thread
			
 
				-	//bl LOC(thread)
			
 
				+	bl .Lthread
			
 
				 
			
 
				 	/* Now we will loop, unwinding the register windows up the stack
			
 
				 	   until the restored %fp value matches the target value in %g3.  */
			
 
				 
			
 
				-//LOC(loop):
			
 
				-loop:
			
 
				+.Lloop:
			
 
				 	cmp %fp, %g3		/* Have we reached the target frame? */
			
 
				-	bl,a loop		/* Loop while current fp is below target.  */
			
 
				-	//bl,a LOC(loop)	/* Loop while current fp is below target.  */
			
 
				+	bl,a .Lloop		/* Loop while current fp is below target.  */
			
 
				 	 restore		/* Unwind register window in delay slot.  */
			
 
				-	be,a found		/* Better have hit it exactly.  */
			
 
				-	//be,a LOC(found)	/* Better have hit it exactly.  */
			
 
				+	be,a .Lfound		/* Better have hit it exactly.  */
			
 
				 	 ld ENV(g1,JB_SP), %o0	/* Delay slot: extract target SP.  */
			
 
				 
			
 
				-thread:
			
 
				-//LOC(thread):
			
 
				+.Lthread:
			
 
				 	/*
			
 
				 	 * Do a "flush register windows trap".  The trap handler in the
			
 
				 	 * kernel writes all the register windows to their stack slots, and
			
@@ -77,15 +73,13 @@ thread:
 
				 	retl
			
 
				 	 restore %g2, 0, %o0	/* Restore values from above register frame. */
			
 
				 
			
 
				-found:
			
 
				-//LOC(found):
			
 
				+.Lfound:
			
 
				 	/* We have unwound register windows so %fp matches the target.  */
			
 
				 	mov %o0, %sp		/* OK, install new SP.  */
			
 
				 
			
 
				-//LOC(sp_ok):
			
 
				-sp_ok:
			
 
				+.Lsp_ok:
			
 
				 	ld ENV(g1,JB_PC), %o0	/* Extract target return PC.  */
			
 
				 	jmp %o0 + 8		/* Return there.  */
			
 
				 	 mov %g2, %o0		/* Delay slot: set return value.  */
			
 
				 
			
 
				-END(__longjmp)
			
 
				+.size  __longjmp , . -  __longjmp
			
--- a/libc/sysdeps/linux/sparc/brk.c
+++ b/libc/sysdeps/linux/sparc/brk.c
@@ -0,0 +1,49 @@
 
				+/* brk system call for Linux/i386.
			
 
				+   Copyright (C) 1995, 1996, 2000 Free Software Foundation, Inc.
			
 
				+   This file is part of the GNU C Library.
			
 
				+
			
 
				+   The GNU C Library is free software; you can redistribute it and/or
			
 
				+   modify it under the terms of the GNU Lesser General Public
			
 
				+   License as published by the Free Software Foundation; either
			
 
				+   version 2.1 of the License, or (at your option) any later version.
			
 
				+
			
 
				+   The GNU C Library is distributed in the hope that it will be useful,
			
 
				+   but WITHOUT ANY WARRANTY; without even the implied warranty of
			
 
				+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
			
 
				+   Lesser General Public License for more details.
			
 
				+
			
 
				+   You should have received a copy of the GNU Lesser General Public
			
 
				+   License along with the GNU C Library; if not, write to the Free
			
 
				+   Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
			
 
				+   02111-1307 USA.  */
			
 
				+
			
 
				+#include <errno.h>
			
 
				+#include <unistd.h>
			
 
				+#include <sys/syscall.h>
			
 
				+
			
 
				+
			
 
				+/* This must be initialized data because commons can't have aliases.  */
			
 
				+void *___brk_addr = 0;
			
 
				+
			
 
				+
			
 
				+int brk (void *addr)
			
 
				+{
			
 
				+    void *newbrk;
			
 
				+
			
 
				+    {
			
 
				+	register void *o0 __asm__("%o0") = addr;
			
 
				+	register int g1 __asm__("%g1") = 17 ;
			
 
				+	__asm ("t 0x10" : "=r"(o0) : "r"(g1), "0"(o0) : "cc");
			
 
				+	newbrk = o0;
			
 
				+    }
			
 
				+
			
 
				+    ___brk_addr = newbrk;
			
 
				+
			
 
				+    if (newbrk < addr)
			
 
				+    {
			
 
				+	__set_errno (ENOMEM);
			
 
				+	return -1;
			
 
				+    }
			
 
				+
			
 
				+    return 0;
			
 
				+}
			
--- a/libc/sysdeps/linux/sparc/bsd-_setjmp.S
+++ b/libc/sysdeps/linux/sparc/bsd-_setjmp.S
@@ -0,0 +1 @@
 
				+/* _setjmp is in setjmp.S  */
			
--- a/libc/sysdeps/linux/sparc/bsd-setjmp.S
+++ b/libc/sysdeps/linux/sparc/bsd-setjmp.S
@@ -0,0 +1 @@
 
				+/* setjmp is in setjmp.S  */
			
--- a/libc/sysdeps/linux/sparc/clone.S
+++ b/libc/sysdeps/linux/sparc/clone.S
@@ -0,0 +1,72 @@
 
				+/* Copyright (C) 1996, 1997, 1998, 2000 Free Software Foundation, Inc.
			
 
				+   This file is part of the GNU C Library.
			
 
				+   Contributed by Richard Henderson (rth@tamu.edu).
			
 
				+
			
 
				+   The GNU C Library is free software; you can redistribute it and/or
			
 
				+   modify it under the terms of the GNU Lesser General Public
			
 
				+   License as published by the Free Software Foundation; either
			
 
				+   version 2.1 of the License, or (at your option) any later version.
			
 
				+
			
 
				+   The GNU C Library is distributed in the hope that it will be useful,
			
 
				+   but WITHOUT ANY WARRANTY; without even the implied warranty of
			
 
				+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
			
 
				+   Lesser General Public License for more details.
			
 
				+
			
 
				+   You should have received a copy of the GNU Lesser General Public
			
 
				+   License along with the GNU C Library; if not, write to the Free
			
 
				+   Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
			
 
				+   02111-1307 USA.  */
			
 
				+
			
 
				+/* clone() is even more special than fork() as it mucks with stacks
			
 
				+   and invokes a function in the right context after its all over.  */
			
 
				+
			
 
				+#include <asm/errno.h>
			
 
				+#include <asm/unistd.h>
			
 
				+
			
 
				+/* int clone(int (*fn)(void *arg), void *child_stack, int flags, void *arg); */
			
 
				+
			
 
				+	.text
			
 
				+	.align	4
			
 
				+	.globl	__clone
			
 
				+	.type	__clone,@function
			
 
				+
			
 
				+__clone:
			
 
				+	save	%sp,-96,%sp
			
 
				+
			
 
				+	/* sanity check arguments */
			
 
				+	tst	%i0
			
 
				+	be	.Lerror
			
 
				+	 orcc	%i1,%g0,%o1
			
 
				+	be	.Lerror
			
 
				+	 mov	%i2,%o0
			
 
				+
			
 
				+	/* Do the system call */
			
 
				+	set	__NR_clone,%g1
			
 
				+	ta	0x10
			
 
				+	bcs	.Lerror
			
 
				+	 tst	%o1
			
 
				+	bne	__thread_start
			
 
				+	 nop
			
 
				+	ret
			
 
				+	 restore %o0,%g0,%o0
			
 
				+
			
 
				+.Lerror:
			
 
				+	call	__errno_location
			
 
				+	 or	%g0,EINVAL,%i0
			
 
				+	st	%i0,[%o0]
			
 
				+	ret
			
 
				+	 restore %g0,-1,%o0
			
 
				+
			
 
				+	.size	__clone, .-__clone
			
 
				+
			
 
				+	.type	__thread_start,@function
			
 
				+
			
 
				+__thread_start:
			
 
				+	call	%i0
			
 
				+	 mov	%i3,%o0
			
 
				+	call	_exit,0
			
 
				+	 nop
			
 
				+
			
 
				+	.size	__thread_start, .-__thread_start
			
 
				+
			
 
				+.weak    clone    ;        clone    =   __clone
			
--- a/libc/sysdeps/linux/sparc/crt0.S
+++ b/libc/sysdeps/linux/sparc/crt0.S
@@ -1,90 +0,0 @@
 
				-/*
			
 
				- * xrt0.s for ERC32. 
			
 
				- *
			
 
				- * This program is free software; you can redistribute it and/or modify it under
			
 
				- * the terms of the GNU General Public License as published by the Free
			
 
				- * Software Foundation; either version 2 of the License, or (at your option)
			
 
				- * any later version.
			
 
				- *
			
 
				- * This program is distributed in the hope that it will be useful, but WITHOUT
			
 
				- * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
			
 
				- * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
			
 
				- * more details.
			
 
				- *
			
 
				- * You should have received a copy of the GNU General Public License along with
			
 
				- * this program; if not, write to the Free Software Foundation, Inc., 675
			
 
				- * Mass Ave, Cambridge, MA 02139, USA.
			
 
				- *
			
 
				- */
			
 
				-
			
 
				-/* code taken from leonccs 1.0 leon/src/libio/crt0.S 
			
 
				-	I don't know if this is available anymore, now that LECCS
			
 
				-	is out.  And I'm not sure if this source is in the LECCS distro  :(
			
 
				-*/
			
 
				-
			
 
				-	.text
			
 
				-! Original : 
			
 
				-!	.global __start, _main
			
 
				-! uC-libc version : 
			
 
				-	.global _start
			
 
				-	.global __uClibc_main
			
 
				-
			
 
				-! Start the real-time clock with a tick of 14 clocks
			
 
				-!
			
 
				-
			
 
				-_start:
			
 
				-
			
 
				-	save	%sp, -64, %sp
			
 
				-
			
 
				-        /* clear the bss */
			
 
				- 
			
 
				-        sethi %hi(edata),%g2
			
 
				-        or    %g2,%lo(edata),%g2  ! g2 = start of bss
			
 
				-        sethi %hi(_end),%g3
			
 
				-        or    %g3,%lo(_end),%g3         ! g3 = end of bss
			
 
				-        mov   %g0,%g1                   ! so std has two zeros
			
 
				-zerobss:
			
 
				-        std    %g0,[%g2]
			
 
				-        add    %g2,8,%g2
			
 
				-        cmp    %g2,%g3
			
 
				-        bleu,a zerobss
			
 
				-        nop
			
 
				-
			
 
				-        /* move data segment to proper location */
			
 
				- 
			
 
				-relocd:
			
 
				-        set (_endtext),%g2 		! g2 = start of data in aout file
			
 
				-        set (_environ),%g4		! g4 = start of where data should go
			
 
				-        set (_edata),%g3 		! g3 = end of where data should go
			
 
				-	subcc	%g3, %g4, %g5		! g5 = length of data
			
 
				-
			
 
				-	subcc	%g4, %g2, %g0		! need to relocate data ?
			
 
				-	ble	initok
			
 
				-	ld	[%g4], %g6
			
 
				-!	subcc	%g6, 1, %g0
			
 
				-!	be	initok
			
 
				-mvdata:
			
 
				-	subcc	%g5, 8, %g5
			
 
				-	ldd	[%g2 + %g5], %g6
			
 
				-	bg	mvdata
			
 
				-        std    	%g6, [%g4 + %g5]
			
 
				-
			
 
				-initok:
			
 
				-
			
 
				-!	call    _main
			
 
				-	call	__uClibc_main
			
 
				-        nop
			
 
				-! Should not return from uClibc main()
			
 
				-!	ret
			
 
				-!	nop
			
 
				-
			
 
				-        .seg    "data"
			
 
				-        .global .bdata
			
 
				-.bdata:
			
 
				-        .align  8
			
 
				-        .global _environ                ! first symbol in sdata
			
 
				-_environ:
			
 
				-        .word   1
			
 
				-
			
 
				-
			
 
				-
			
--- a/libc/sysdeps/linux/sparc/crt0.c
+++ b/libc/sysdeps/linux/sparc/crt0.c
@@ -1,9 +1,8 @@
 
				 /* vi: set sw=4 ts=4: */
			
 
				-/* fork for uClibc
			
 
				+/* uClibc/sysdeps/linux/i386/crt0.S
			
 
				+ * Pull stuff off the stack and get uClibc moving.
			
 
				  *
			
 
				- * Copyright (C) 2000 by Lineo, inc. and Erik Andersen
			
 
				  * Copyright (C) 2000,2001 by Erik Andersen <andersen@uclibc.org>
			
 
				- * Written by Erik Andersen <andersen@uclibc.org>
			
 
				  *
			
 
				  * This program is free software; you can redistribute it and/or modify it
			
 
				  * under the terms of the GNU Library General Public License as published by
			
@@ -20,15 +19,26 @@
 
				  * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
			
 
				  */
			
 
				 
			
 
				-#include <errno.h>
			
 
				-#include <features.h>
			
 
				-#include <sys/types.h>
			
 
				-#include <sys/syscall.h>
			
 
				+extern void __uClibc_main(int argc,void *argv,void *envp);
			
 
				 
			
 
				-#ifndef __HAS_NO_MMU__
			
 
				+/* a little bit of stuff to support C++ */
			
 
				+__asm__(".section .ctors,\"aw\"\n.align 4\n.global __CTOR_LIST__\n"
			
 
				+	"__CTOR_LIST__:\n.long -1\n");
			
 
				 
			
 
				-//#define __NR_fork             2
			
 
				-#include <unistd.h>
			
 
				-_syscall0(pid_t, fork);
			
 
				+__asm__(".section .dtors,\"aw\"\n.align 4\n.global __DTOR_LIST__\n"
			
 
				+	"__DTOR_LIST__:\n.long -1\n");
			
 
				+
			
 
				+void _start(unsigned int first_arg)
			
 
				+{
			
 
				+	unsigned int argc;
			
 
				+	char **argv, **envp;
			
 
				+	unsigned long *stack;
			
 
				+
			
 
				+	stack = (unsigned long*) &first_arg;
			
 
				+	argc = *(stack - 1);
			
 
				+	argv = (char **) stack;
			
 
				+	envp = (char **)stack + argc + 1;
			
 
				+
			
 
				+	__uClibc_main(argc, argv, envp);
			
 
				+}
			
 
				 
			
 
				-#endif
			
--- a/libc/sysdeps/linux/sparc/fork.S
+++ b/libc/sysdeps/linux/sparc/fork.S
@@ -0,0 +1,46 @@
 
				+/* Copyright (C) 1991, 92, 94, 95, 97, 99 Free Software Foundation, Inc.
			
 
				+   This file is part of the GNU C Library.
			
 
				+
			
 
				+   The GNU C Library is free software; you can redistribute it and/or
			
 
				+   modify it under the terms of the GNU Lesser General Public
			
 
				+   License as published by the Free Software Foundation; either
			
 
				+   version 2.1 of the License, or (at your option) any later version.
			
 
				+
			
 
				+   The GNU C Library is distributed in the hope that it will be useful,
			
 
				+   but WITHOUT ANY WARRANTY; without even the implied warranty of
			
 
				+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
			
 
				+   Lesser General Public License for more details.
			
 
				+
			
 
				+   You should have received a copy of the GNU Lesser General Public
			
 
				+   License along with the GNU C Library; if not, write to the Free
			
 
				+   Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
			
 
				+   02111-1307 USA.  */
			
 
				+
			
 
				+#include <sysdep.h>
			
 
				+
			
 
				+.text;  
			
 
				+.global    fork;
			
 
				+.align 4;      
			
 
				+fork: ;
			
 
				+.type   fork  ,@function; ;      
			
 
				+
			
 
				+	mov	2, %g1 ; 
			
 
				+	ta	0x10;
			
 
				+	bcc,a 9000f;
			
 
				+	nop;
			
 
				+	save    %sp,-96,%sp;
			
 
				+	call __errno_location;
			
 
				+	nop;    
			
 
				+	st	%i0,[%o0];
			
 
				+	jmpl    %i7+8,%g0;
			
 
				+	restore %g0,-1,%o0; ;
			
 
				+	9000:;
			
 
				+
			
 
				+	/* %o1 is now 0 for the parent and 1 for the child.  Decrement it to
			
 
				+	   make it -1 (all bits set) for the parent, and 0 (no bits set)
			
 
				+	   for the child.  Then AND it with %o0, so the parent gets
			
 
				+	   %o0&-1==pid, and the child gets %o0&0==0.  */
			
 
				+	sub %o1, 1, %o1
			
 
				+	retl
			
 
				+	and %o0, %o1, %o0
			
 
				+
			
--- a/libc/sysdeps/linux/sparc/rem.S
+++ b/libc/sysdeps/linux/sparc/rem.S
@@ -0,0 +1,367 @@
 
				+   /* This file is generated from divrem.m4; DO NOT EDIT! */
			
 
				+/*
			
 
				+ * Division and remainder, from Appendix E of the Sparc Version 8
			
 
				+ * Architecture Manual, with fixes from Gordon Irlam.
			
 
				+ */
			
 
				+
			
 
				+/*
			
 
				+ * Input: dividend and divisor in %o0 and %o1 respectively.
			
 
				+ *
			
 
				+ * m4 parameters:
			
 
				+ *  .rem	name of function to generate
			
 
				+ *  rem		rem=div => %o0 / %o1; rem=rem => %o0 % %o1
			
 
				+ *  true		true=true => signed; true=false => unsigned
			
 
				+ *
			
 
				+ * Algorithm parameters:
			
 
				+ *  N		how many bits per iteration we try to get (4)
			
 
				+ *  WORDSIZE	total number of bits (32)
			
 
				+ *
			
 
				+ * Derived constants:
			
 
				+ *  TOPBITS	number of bits in the top decade of a number
			
 
				+ *
			
 
				+ * Important variables:
			
 
				+ *  Q		the partial quotient under development (initially 0)
			
 
				+ *  R		the remainder so far, initially the dividend
			
 
				+ *  ITER	number of main division loop iterations required;
			
 
				+ *		equal to ceil(log2(quotient) / N).  Note that this
			
 
				+ *		is the log base (2^N) of the quotient.
			
 
				+ *  V		the current comparand, initially divisor*2^(ITER*N-1)
			
 
				+ *
			
 
				+ * Cost:
			
 
				+ *  Current estimate for non-large dividend is
			
 
				+ *	ceil(log2(quotient) / N) * (10 + 7N/2) + C
			
 
				+ *  A large dividend is one greater than 2^(31-TOPBITS) and takes a
			
 
				+ *  different path, as the upper bits of the quotient must be developed
			
 
				+ *  one bit at a time.
			
 
				+ */
			
 
				+
			
 
				+
			
 
				+
			
 
				+#include <sysdep.h>
			
 
				+
			
 
				+
			
 
				+.global   .rem;
			
 
				+.align 4;
			
 
				+.type  .rem ,@function; 
			
 
				+
			
 
				+.rem: 
			
 
				+	! compute sign of result; if neither is negative, no problem
			
 
				+	orcc	%o1, %o0, %g0	! either negative?
			
 
				+	bge	2f			! no, go do the divide
			
 
				+	mov	%o0, %g3		! sign of remainder matches %o0
			
 
				+	tst	%o1
			
 
				+	bge	1f
			
 
				+	tst	%o0
			
 
				+	! %o1 is definitely negative; %o0 might also be negative
			
 
				+	bge	2f			! if %o0 not negative...
			
 
				+	sub	%g0, %o1, %o1	! in any case, make %o1 nonneg
			
 
				+1:	! %o0 is negative, %o1 is nonnegative
			
 
				+	sub	%g0, %o0, %o0	! make %o0 nonnegative
			
 
				+2:
			
 
				+
			
 
				+	! Ready to divide.  Compute size of quotient; scale comparand.
			
 
				+	orcc	%o1, %g0, %o5
			
 
				+	bne	1f
			
 
				+	mov	%o0, %o3
			
 
				+
			
 
				+		! Divide by zero trap.  If it returns, return 0 (about as
			
 
				+		! wrong as possible, but that is what SunOS does...).
			
 
				+		ta	0x02
			
 
				+		retl
			
 
				+		clr	%o0
			
 
				+
			
 
				+1:
			
 
				+	cmp	%o3, %o5			! if %o1 exceeds %o0, done
			
 
				+	blu	.Lgot_result		! (and algorithm fails otherwise)
			
 
				+	clr	%o2
			
 
				+	sethi	%hi(1 << (32 - 4 - 1)), %g1
			
 
				+	cmp	%o3, %g1
			
 
				+	blu	.Lnot_really_big
			
 
				+	clr	%o4
			
 
				+
			
 
				+	! Here the dividend is >= 2**(31-N) or so.  We must be careful here,
			
 
				+	! as our usual N-at-a-shot divide step will cause overflow and havoc.
			
 
				+	! The number of bits in the result here is N*ITER+SC, where SC <= N.
			
 
				+	! Compute ITER in an unorthodox manner: know we need to shift V into
			
 
				+	! the top decade: so do not even bother to compare to R.
			
 
				+	1:
			
 
				+		cmp	%o5, %g1
			
 
				+		bgeu	3f
			
 
				+		mov	1, %g2
			
 
				+		sll	%o5, 4, %o5
			
 
				+		b	1b
			
 
				+		add	%o4, 1, %o4
			
 
				+
			
 
				+	! Now compute %g2.
			
 
				+	2:	addcc	%o5, %o5, %o5
			
 
				+		bcc	.Lnot_too_big
			
 
				+		add	%g2, 1, %g2
			
 
				+
			
 
				+		! We get here if the %o1 overflowed while shifting.
			
 
				+		! This means that %o3 has the high-order bit set.
			
 
				+		! Restore %o5 and subtract from %o3.
			
 
				+		sll	%g1, 4, %g1	! high order bit
			
 
				+		srl	%o5, 1, %o5		! rest of %o5
			
 
				+		add	%o5, %g1, %o5
			
 
				+		b	.Ldo_single_div
			
 
				+		sub	%g2, 1, %g2
			
 
				+
			
 
				+	.Lnot_too_big:
			
 
				+	3:	cmp	%o5, %o3
			
 
				+		blu	2b
			
 
				+		nop
			
 
				+		be	.Ldo_single_div
			
 
				+		nop
			
 
				+	/* NB: these are commented out in the V8-Sparc manual as well */
			
 
				+	/* (I do not understand this) */
			
 
				+	! %o5 > %o3: went too far: back up 1 step
			
 
				+	!	srl	%o5, 1, %o5
			
 
				+	!	dec	%g2
			
 
				+	! do single-bit divide steps
			
 
				+	!
			
 
				+	! We have to be careful here.  We know that %o3 >= %o5, so we can do the
			
 
				+	! first divide step without thinking.  BUT, the others are conditional,
			
 
				+	! and are only done if %o3 >= 0.  Because both %o3 and %o5 may have the high-
			
 
				+	! order bit set in the first step, just falling into the regular
			
 
				+	! division loop will mess up the first time around.
			
 
				+	! So we unroll slightly...
			
 
				+	.Ldo_single_div:
			
 
				+		subcc	%g2, 1, %g2
			
 
				+		bl	.Lend_regular_divide
			
 
				+		nop
			
 
				+		sub	%o3, %o5, %o3
			
 
				+		mov	1, %o2
			
 
				+		b	.Lend_single_divloop
			
 
				+		nop
			
 
				+	.Lsingle_divloop:
			
 
				+		sll	%o2, 1, %o2
			
 
				+		bl	1f
			
 
				+		srl	%o5, 1, %o5
			
 
				+		! %o3 >= 0
			
 
				+		sub	%o3, %o5, %o3
			
 
				+		b	2f
			
 
				+		add	%o2, 1, %o2
			
 
				+	1:	! %o3 < 0
			
 
				+		add	%o3, %o5, %o3
			
 
				+		sub	%o2, 1, %o2
			
 
				+	2:
			
 
				+	.Lend_single_divloop:
			
 
				+		subcc	%g2, 1, %g2
			
 
				+		bge	.Lsingle_divloop
			
 
				+		tst	%o3
			
 
				+		b,a	.Lend_regular_divide
			
 
				+
			
 
				+.Lnot_really_big:
			
 
				+1:
			
 
				+	sll	%o5, 4, %o5
			
 
				+	cmp	%o5, %o3
			
 
				+	bleu	1b
			
 
				+	addcc	%o4, 1, %o4
			
 
				+	be	.Lgot_result
			
 
				+	sub	%o4, 1, %o4
			
 
				+
			
 
				+	tst	%o3	! set up for initial iteration
			
 
				+.Ldivloop:
			
 
				+	sll	%o2, 4, %o2
			
 
				+		! depth 1, accumulated bits 0
			
 
				+	bl	.L1.16
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 2, accumulated bits 1
			
 
				+	bl	.L2.17
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits 3
			
 
				+	bl	.L3.19
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 7
			
 
				+	bl	.L4.23
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (7*2+1), %o2
			
 
				+	
			
 
				+.L4.23:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (7*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.19:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 5
			
 
				+	bl	.L4.21
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (5*2+1), %o2
			
 
				+	
			
 
				+.L4.21:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (5*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+.L2.17:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits 1
			
 
				+	bl	.L3.17
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 3
			
 
				+	bl	.L4.19
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (3*2+1), %o2
			
 
				+	
			
 
				+.L4.19:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (3*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.17:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 1
			
 
				+	bl	.L4.17
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (1*2+1), %o2
			
 
				+	
			
 
				+.L4.17:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (1*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+.L1.16:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 2, accumulated bits -1
			
 
				+	bl	.L2.15
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits -1
			
 
				+	bl	.L3.15
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -1
			
 
				+	bl	.L4.15
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-1*2+1), %o2
			
 
				+	
			
 
				+.L4.15:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-1*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.15:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -3
			
 
				+	bl	.L4.13
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-3*2+1), %o2
			
 
				+	
			
 
				+.L4.13:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-3*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+.L2.15:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits -3
			
 
				+	bl	.L3.13
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -5
			
 
				+	bl	.L4.11
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-5*2+1), %o2
			
 
				+	
			
 
				+.L4.11:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-5*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.13:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -7
			
 
				+	bl	.L4.9
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-7*2+1), %o2
			
 
				+	
			
 
				+.L4.9:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-7*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+	9:
			
 
				+.Lend_regular_divide:
			
 
				+	subcc	%o4, 1, %o4
			
 
				+	bge	.Ldivloop
			
 
				+	tst	%o3
			
 
				+	bl,a	.Lgot_result
			
 
				+	! non-restoring fixup here (one instruction only!)
			
 
				+	add	%o3, %o1, %o3
			
 
				+
			
 
				+
			
 
				+.Lgot_result:
			
 
				+	! check to see if answer should be < 0
			
 
				+	tst	%g3
			
 
				+	bl,a	1f
			
 
				+	sub %g0, %o3, %o3
			
 
				+1:
			
 
				+	retl
			
 
				+	mov %o3, %o0
			
 
				+
			
 
				+END(.rem)
			
--- a/libc/sysdeps/linux/sparc/sdiv.S
+++ b/libc/sysdeps/linux/sparc/sdiv.S
@@ -0,0 +1,366 @@
 
				+   /* This file is generated from divrem.m4; DO NOT EDIT! */
			
 
				+/*
			
 
				+ * Division and remainder, from Appendix E of the Sparc Version 8
			
 
				+ * Architecture Manual, with fixes from Gordon Irlam.
			
 
				+ */
			
 
				+
			
 
				+/*
			
 
				+ * Input: dividend and divisor in %o0 and %o1 respectively.
			
 
				+ *
			
 
				+ * m4 parameters:
			
 
				+ *  .div	name of function to generate
			
 
				+ *  div		div=div => %o0 / %o1; div=rem => %o0 % %o1
			
 
				+ *  true		true=true => signed; true=false => unsigned
			
 
				+ *
			
 
				+ * Algorithm parameters:
			
 
				+ *  N		how many bits per iteration we try to get (4)
			
 
				+ *  WORDSIZE	total number of bits (32)
			
 
				+ *
			
 
				+ * Derived constants:
			
 
				+ *  TOPBITS	number of bits in the top decade of a number
			
 
				+ *
			
 
				+ * Important variables:
			
 
				+ *  Q		the partial quotient under development (initially 0)
			
 
				+ *  R		the remainder so far, initially the dividend
			
 
				+ *  ITER	number of main division loop iterations required;
			
 
				+ *		equal to ceil(log2(quotient) / N).  Note that this
			
 
				+ *		is the log base (2^N) of the quotient.
			
 
				+ *  V		the current comparand, initially divisor*2^(ITER*N-1)
			
 
				+ *
			
 
				+ * Cost:
			
 
				+ *  Current estimate for non-large dividend is
			
 
				+ *	ceil(log2(quotient) / N) * (10 + 7N/2) + C
			
 
				+ *  A large dividend is one greater than 2^(31-TOPBITS) and takes a
			
 
				+ *  different path, as the upper bits of the quotient must be developed
			
 
				+ *  one bit at a time.
			
 
				+ */
			
 
				+
			
 
				+
			
 
				+
			
 
				+#include <sysdep.h>
			
 
				+
			
 
				+.global   .div;
			
 
				+.align 4;
			
 
				+.type  .div ,@function; 
			
 
				+
			
 
				+.div: 
			
 
				+	! compute sign of result; if neither is negative, no problem
			
 
				+	orcc	%o1, %o0, %g0	! either negative?
			
 
				+	bge	2f			! no, go do the divide
			
 
				+	xor	%o1, %o0, %g3	! compute sign in any case
			
 
				+	tst	%o1
			
 
				+	bge	1f
			
 
				+	tst	%o0
			
 
				+	! %o1 is definitely negative; %o0 might also be negative
			
 
				+	bge	2f			! if %o0 not negative...
			
 
				+	sub	%g0, %o1, %o1	! in any case, make %o1 nonneg
			
 
				+1:	! %o0 is negative, %o1 is nonnegative
			
 
				+	sub	%g0, %o0, %o0	! make %o0 nonnegative
			
 
				+2:
			
 
				+
			
 
				+	! Ready to divide.  Compute size of quotient; scale comparand.
			
 
				+	orcc	%o1, %g0, %o5
			
 
				+	bne	1f
			
 
				+	mov	%o0, %o3
			
 
				+
			
 
				+		! Divide by zero trap.  If it returns, return 0 (about as
			
 
				+		! wrong as possible, but that is what SunOS does...).
			
 
				+		ta	0x02
			
 
				+		retl
			
 
				+		clr	%o0
			
 
				+
			
 
				+1:
			
 
				+	cmp	%o3, %o5			! if %o1 exceeds %o0, done
			
 
				+	blu	.Lgot_result		! (and algorithm fails otherwise)
			
 
				+	clr	%o2
			
 
				+	sethi	%hi(1 << (32 - 4 - 1)), %g1
			
 
				+	cmp	%o3, %g1
			
 
				+	blu	.Lnot_really_big
			
 
				+	clr	%o4
			
 
				+
			
 
				+	! Here the dividend is >= 2**(31-N) or so.  We must be careful here,
			
 
				+	! as our usual N-at-a-shot divide step will cause overflow and havoc.
			
 
				+	! The number of bits in the result here is N*ITER+SC, where SC <= N.
			
 
				+	! Compute ITER in an unorthodox manner: know we need to shift V into
			
 
				+	! the top decade: so do not even bother to compare to R.
			
 
				+	1:
			
 
				+		cmp	%o5, %g1
			
 
				+		bgeu	3f
			
 
				+		mov	1, %g2
			
 
				+		sll	%o5, 4, %o5
			
 
				+		b	1b
			
 
				+		add	%o4, 1, %o4
			
 
				+
			
 
				+	! Now compute %g2.
			
 
				+	2:	addcc	%o5, %o5, %o5
			
 
				+		bcc	.Lnot_too_big
			
 
				+		add	%g2, 1, %g2
			
 
				+
			
 
				+		! We get here if the %o1 overflowed while shifting.
			
 
				+		! This means that %o3 has the high-order bit set.
			
 
				+		! Restore %o5 and subtract from %o3.
			
 
				+		sll	%g1, 4, %g1	! high order bit
			
 
				+		srl	%o5, 1, %o5		! rest of %o5
			
 
				+		add	%o5, %g1, %o5
			
 
				+		b	.Ldo_single_div
			
 
				+		sub	%g2, 1, %g2
			
 
				+
			
 
				+	.Lnot_too_big:
			
 
				+	3:	cmp	%o5, %o3
			
 
				+		blu	2b
			
 
				+		nop
			
 
				+		be	.Ldo_single_div
			
 
				+		nop
			
 
				+	/* NB: these are commented out in the V8-Sparc manual as well */
			
 
				+	/* (I do not understand this) */
			
 
				+	! %o5 > %o3: went too far: back up 1 step
			
 
				+	!	srl	%o5, 1, %o5
			
 
				+	!	dec	%g2
			
 
				+	! do single-bit divide steps
			
 
				+	!
			
 
				+	! We have to be careful here.  We know that %o3 >= %o5, so we can do the
			
 
				+	! first divide step without thinking.  BUT, the others are conditional,
			
 
				+	! and are only done if %o3 >= 0.  Because both %o3 and %o5 may have the high-
			
 
				+	! order bit set in the first step, just falling into the regular
			
 
				+	! division loop will mess up the first time around.
			
 
				+	! So we unroll slightly...
			
 
				+	.Ldo_single_div:
			
 
				+		subcc	%g2, 1, %g2
			
 
				+		bl	.Lend_regular_divide
			
 
				+		nop
			
 
				+		sub	%o3, %o5, %o3
			
 
				+		mov	1, %o2
			
 
				+		b	.Lend_single_divloop
			
 
				+		nop
			
 
				+	.Lsingle_divloop:
			
 
				+		sll	%o2, 1, %o2
			
 
				+		bl	1f
			
 
				+		srl	%o5, 1, %o5
			
 
				+		! %o3 >= 0
			
 
				+		sub	%o3, %o5, %o3
			
 
				+		b	2f
			
 
				+		add	%o2, 1, %o2
			
 
				+	1:	! %o3 < 0
			
 
				+		add	%o3, %o5, %o3
			
 
				+		sub	%o2, 1, %o2
			
 
				+	2:
			
 
				+	.Lend_single_divloop:
			
 
				+		subcc	%g2, 1, %g2
			
 
				+		bge	.Lsingle_divloop
			
 
				+		tst	%o3
			
 
				+		b,a	.Lend_regular_divide
			
 
				+
			
 
				+.Lnot_really_big:
			
 
				+1:
			
 
				+	sll	%o5, 4, %o5
			
 
				+	cmp	%o5, %o3
			
 
				+	bleu	1b
			
 
				+	addcc	%o4, 1, %o4
			
 
				+	be	.Lgot_result
			
 
				+	sub	%o4, 1, %o4
			
 
				+
			
 
				+	tst	%o3	! set up for initial iteration
			
 
				+.Ldivloop:
			
 
				+	sll	%o2, 4, %o2
			
 
				+		! depth 1, accumulated bits 0
			
 
				+	bl	.L1.16
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 2, accumulated bits 1
			
 
				+	bl	.L2.17
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits 3
			
 
				+	bl	.L3.19
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 7
			
 
				+	bl	.L4.23
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (7*2+1), %o2
			
 
				+	
			
 
				+.L4.23:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (7*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.19:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 5
			
 
				+	bl	.L4.21
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (5*2+1), %o2
			
 
				+	
			
 
				+.L4.21:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (5*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+.L2.17:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits 1
			
 
				+	bl	.L3.17
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 3
			
 
				+	bl	.L4.19
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (3*2+1), %o2
			
 
				+	
			
 
				+.L4.19:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (3*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.17:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 1
			
 
				+	bl	.L4.17
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (1*2+1), %o2
			
 
				+	
			
 
				+.L4.17:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (1*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+.L1.16:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 2, accumulated bits -1
			
 
				+	bl	.L2.15
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits -1
			
 
				+	bl	.L3.15
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -1
			
 
				+	bl	.L4.15
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-1*2+1), %o2
			
 
				+	
			
 
				+.L4.15:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-1*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.15:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -3
			
 
				+	bl	.L4.13
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-3*2+1), %o2
			
 
				+	
			
 
				+.L4.13:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-3*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+.L2.15:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits -3
			
 
				+	bl	.L3.13
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -5
			
 
				+	bl	.L4.11
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-5*2+1), %o2
			
 
				+	
			
 
				+.L4.11:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-5*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.13:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -7
			
 
				+	bl	.L4.9
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-7*2+1), %o2
			
 
				+	
			
 
				+.L4.9:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-7*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+	9:
			
 
				+.Lend_regular_divide:
			
 
				+	subcc	%o4, 1, %o4
			
 
				+	bge	.Ldivloop
			
 
				+	tst	%o3
			
 
				+	bl,a	.Lgot_result
			
 
				+	! non-restoring fixup here (one instruction only!)
			
 
				+	sub	%o2, 1, %o2
			
 
				+
			
 
				+
			
 
				+.Lgot_result:
			
 
				+	! check to see if answer should be < 0
			
 
				+	tst	%g3
			
 
				+	bl,a	1f
			
 
				+	sub %g0, %o2, %o2
			
 
				+1:
			
 
				+	retl
			
 
				+	mov %o2, %o0
			
 
				+
			
 
				+END(.div)
			
--- a/libc/sysdeps/linux/sparc/setjmp.S
+++ b/libc/sysdeps/linux/sparc/setjmp.S
@@ -2,24 +2,21 @@
 
				    This file is part of the GNU C Library.
			
 
				 
			
 
				    The GNU C Library is free software; you can redistribute it and/or
			
 
				-   modify it under the terms of the GNU Library General Public License as
			
 
				-   published by the Free Software Foundation; either version 2 of the
			
 
				-   License, or (at your option) any later version.
			
 
				+   modify it under the terms of the GNU Lesser General Public
			
 
				+   License as published by the Free Software Foundation; either
			
 
				+   version 2.1 of the License, or (at your option) any later version.
			
 
				 
			
 
				    The GNU C Library is distributed in the hope that it will be useful,
			
 
				    but WITHOUT ANY WARRANTY; without even the implied warranty of
			
 
				    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
			
 
				-   Library General Public License for more details.
			
 
				+   Lesser General Public License for more details.
			
 
				 
			
 
				-   You should have received a copy of the GNU Library General Public
			
 
				-   License along with the GNU C Library; see the file COPYING.LIB.  If not,
			
 
				-   write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
			
 
				-   Boston, MA 02111-1307, USA.  */
			
 
				-
			
 
				-/* Code taken from glibc2.2.2/sysdeps/sparc/sparc32/setjmp.S */
			
 
				+   You should have received a copy of the GNU Lesser General Public
			
 
				+   License along with the GNU C Library; if not, write to the Free
			
 
				+   Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
			
 
				+   02111-1307 USA.  */
			
 
				 
			
 
				 #include <sysdep.h>
			
 
				-#include "sysdep.h"
			
 
				 
			
 
				 #define _ASM 1
			
 
				 #define _SETJMP_H
			
@@ -49,5 +46,5 @@ ENTRY (__sigsetjmp)
 
				 	 mov	%g1, %o7
			
 
				 END(__sigsetjmp)
			
 
				 
			
 
				-//weak_extern(_setjmp)
			
 
				-//weak_extern(setjmp)
			
 
				+.weak   _setjmp    
			
 
				+.weak   setjmp  
			
--- a/libc/sysdeps/linux/sparc/udiv.S
+++ b/libc/sysdeps/linux/sparc/udiv.S
@@ -0,0 +1,348 @@
 
				+   /* This file is generated from divrem.m4; DO NOT EDIT! */
			
 
				+/*
			
 
				+ * Division and remainder, from Appendix E of the Sparc Version 8
			
 
				+ * Architecture Manual, with fixes from Gordon Irlam.
			
 
				+ */
			
 
				+
			
 
				+/*
			
 
				+ * Input: dividend and divisor in %o0 and %o1 respectively.
			
 
				+ *
			
 
				+ * m4 parameters:
			
 
				+ *  .udiv	name of function to generate
			
 
				+ *  div		div=div => %o0 / %o1; div=rem => %o0 % %o1
			
 
				+ *  false		false=true => signed; false=false => unsigned
			
 
				+ *
			
 
				+ * Algorithm parameters:
			
 
				+ *  N		how many bits per iteration we try to get (4)
			
 
				+ *  WORDSIZE	total number of bits (32)
			
 
				+ *
			
 
				+ * Derived constants:
			
 
				+ *  TOPBITS	number of bits in the top decade of a number
			
 
				+ *
			
 
				+ * Important variables:
			
 
				+ *  Q		the partial quotient under development (initially 0)
			
 
				+ *  R		the remainder so far, initially the dividend
			
 
				+ *  ITER	number of main division loop iterations required;
			
 
				+ *		equal to ceil(log2(quotient) / N).  Note that this
			
 
				+ *		is the log base (2^N) of the quotient.
			
 
				+ *  V		the current comparand, initially divisor*2^(ITER*N-1)
			
 
				+ *
			
 
				+ * Cost:
			
 
				+ *  Current estimate for non-large dividend is
			
 
				+ *	ceil(log2(quotient) / N) * (10 + 7N/2) + C
			
 
				+ *  A large dividend is one greater than 2^(31-TOPBITS) and takes a
			
 
				+ *  different path, as the upper bits of the quotient must be developed
			
 
				+ *  one bit at a time.
			
 
				+ */
			
 
				+
			
 
				+
			
 
				+
			
 
				+#include <sysdep.h>
			
 
				+
			
 
				+.global   .udiv;
			
 
				+.align 4;
			
 
				+.type  .udiv ,@function; 
			
 
				+
			
 
				+.udiv: 
			
 
				+	! Ready to divide.  Compute size of quotient; scale comparand.
			
 
				+	orcc	%o1, %g0, %o5
			
 
				+	bne	1f
			
 
				+	mov	%o0, %o3
			
 
				+
			
 
				+		! Divide by zero trap.  If it returns, return 0 (about as
			
 
				+		! wrong as possible, but that is what SunOS does...).
			
 
				+		ta	0x02
			
 
				+		retl
			
 
				+		clr	%o0
			
 
				+
			
 
				+1:
			
 
				+	cmp	%o3, %o5			! if %o1 exceeds %o0, done
			
 
				+	blu	.Lgot_result  		! (and algorithm fails otherwise)
			
 
				+	clr	%o2
			
 
				+	sethi	%hi(1 << (32 - 4 - 1)), %g1
			
 
				+	cmp	%o3, %g1
			
 
				+	blu	.Lnot_really_big  
			
 
				+	clr	%o4
			
 
				+
			
 
				+	! Here the dividend is >= 2**(31-N) or so.  We must be careful here,
			
 
				+	! as our usual N-at-a-shot divide step will cause overflow and havoc.
			
 
				+	! The number of bits in the result here is N*ITER+SC, where SC <= N.
			
 
				+	! Compute ITER in an unorthodox manner: know we need to shift V into
			
 
				+	! the top decade: so do not even bother to compare to R.
			
 
				+	1:
			
 
				+		cmp	%o5, %g1
			
 
				+		bgeu	3f
			
 
				+		mov	1, %g2
			
 
				+		sll	%o5, 4, %o5
			
 
				+		b	1b
			
 
				+		add	%o4, 1, %o4
			
 
				+
			
 
				+	! Now compute %g2.
			
 
				+	2:	addcc	%o5, %o5, %o5
			
 
				+		bcc	.Lnot_too_big  
			
 
				+		add	%g2, 1, %g2
			
 
				+
			
 
				+		! We get here if the %o1 overflowed while shifting.
			
 
				+		! This means that %o3 has the high-order bit set.
			
 
				+		! Restore %o5 and subtract from %o3.
			
 
				+		sll	%g1, 4, %g1	! high order bit
			
 
				+		srl	%o5, 1, %o5		! rest of %o5
			
 
				+		add	%o5, %g1, %o5
			
 
				+		b	.Ldo_single_div
			
 
				+		sub	%g2, 1, %g2
			
 
				+
			
 
				+	.Lnot_too_big:
			
 
				+	3:	cmp	%o5, %o3
			
 
				+		blu	2b
			
 
				+		nop
			
 
				+		be	.Ldo_single_div
			
 
				+		nop
			
 
				+	/* NB: these are commented out in the V8-Sparc manual as well */
			
 
				+	/* (I do not understand this) */
			
 
				+	! %o5 > %o3: went too far: back up 1 step
			
 
				+	!	srl	%o5, 1, %o5
			
 
				+	!	dec	%g2
			
 
				+	! do single-bit divide steps
			
 
				+	!
			
 
				+	! We have to be careful here.  We know that %o3 >= %o5, so we can do the
			
 
				+	! first divide step without thinking.  BUT, the others are conditional,
			
 
				+	! and are only done if %o3 >= 0.  Because both %o3 and %o5 may have the high-
			
 
				+	! order bit set in the first step, just falling into the regular
			
 
				+	! division loop will mess up the first time around.
			
 
				+	! So we unroll slightly...
			
 
				+	.Ldo_single_div:
			
 
				+		subcc	%g2, 1, %g2
			
 
				+		bl	.Lend_regular_divide
			
 
				+		nop
			
 
				+		sub	%o3, %o5, %o3
			
 
				+		mov	1, %o2
			
 
				+		b	.Lend_single_divloop
			
 
				+		nop
			
 
				+	.Lsingle_divloop:
			
 
				+		sll	%o2, 1, %o2
			
 
				+		bl	1f
			
 
				+		srl	%o5, 1, %o5
			
 
				+		! %o3 >= 0
			
 
				+		sub	%o3, %o5, %o3
			
 
				+		b	2f
			
 
				+		add	%o2, 1, %o2
			
 
				+	1:	! %o3 < 0
			
 
				+		add	%o3, %o5, %o3
			
 
				+		sub	%o2, 1, %o2
			
 
				+	2:
			
 
				+	.Lend_single_divloop:
			
 
				+		subcc	%g2, 1, %g2
			
 
				+		bge	.Lsingle_divloop
			
 
				+		tst	%o3
			
 
				+		b,a	.Lend_regular_divide
			
 
				+
			
 
				+.Lnot_really_big:
			
 
				+1:
			
 
				+	sll	%o5, 4, %o5
			
 
				+	cmp	%o5, %o3
			
 
				+	bleu	1b
			
 
				+	addcc	%o4, 1, %o4
			
 
				+	be	.Lgot_result
			
 
				+	sub	%o4, 1, %o4
			
 
				+
			
 
				+	tst	%o3	! set up for initial iteration
			
 
				+.Ldivloop:
			
 
				+	sll	%o2, 4, %o2
			
 
				+		! depth 1, accumulated bits 0
			
 
				+	bl	.L1.16
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 2, accumulated bits 1
			
 
				+	bl	.L2.17
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits 3
			
 
				+	bl	.L3.19
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 7
			
 
				+	bl	.L4.23
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (7*2+1), %o2
			
 
				+	
			
 
				+.L4.23:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (7*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.19:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 5
			
 
				+	bl	.L4.21
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (5*2+1), %o2
			
 
				+	
			
 
				+.L4.21:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (5*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+.L2.17:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits 1
			
 
				+	bl	.L3.17
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 3
			
 
				+	bl	.L4.19
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (3*2+1), %o2
			
 
				+	
			
 
				+.L4.19:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (3*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.17:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 1
			
 
				+	bl	.L4.17
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (1*2+1), %o2
			
 
				+	
			
 
				+.L4.17:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (1*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+.L1.16:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 2, accumulated bits -1
			
 
				+	bl	.L2.15
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits -1
			
 
				+	bl	.L3.15
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -1
			
 
				+	bl	.L4.15
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-1*2+1), %o2
			
 
				+	
			
 
				+.L4.15:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-1*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.15:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -3
			
 
				+	bl	.L4.13
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-3*2+1), %o2
			
 
				+	
			
 
				+.L4.13:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-3*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+.L2.15:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits -3
			
 
				+	bl	.L3.13
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -5
			
 
				+	bl	.L4.11
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-5*2+1), %o2
			
 
				+	
			
 
				+.L4.11:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-5*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.13:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -7
			
 
				+	bl	.L4.9
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-7*2+1), %o2
			
 
				+	
			
 
				+.L4.9:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-7*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+	9:
			
 
				+.Lend_regular_divide:
			
 
				+	subcc	%o4, 1, %o4
			
 
				+	bge	.Ldivloop
			
 
				+	tst	%o3
			
 
				+	bl,a	.Lgot_result
			
 
				+	! non-restoring fixup here (one instruction only!)
			
 
				+	sub	%o2, 1, %o2
			
 
				+
			
 
				+
			
 
				+.Lgot_result:
			
 
				+
			
 
				+	retl
			
 
				+	mov %o2, %o0
			
 
				+
			
 
				+END(.udiv)
			
--- a/libc/sysdeps/linux/sparc/umul.S
+++ b/libc/sysdeps/linux/sparc/umul.S
@@ -0,0 +1,160 @@
 
				+/*
			
 
				+ * Unsigned multiply.  Returns %o0 * %o1 in %o1%o0 (i.e., %o1 holds the
			
 
				+ * upper 32 bits of the 64-bit product).
			
 
				+ *
			
 
				+ * This code optimizes short (less than 13-bit) multiplies.  Short
			
 
				+ * multiplies require 25 instruction cycles, and long ones require
			
 
				+ * 45 instruction cycles.
			
 
				+ *
			
 
				+ * On return, overflow has occurred (%o1 is not zero) if and only if
			
 
				+ * the Z condition code is clear, allowing, e.g., the following:
			
 
				+ *
			
 
				+ *	call	.umul
			
 
				+ *	nop
			
 
				+ *	bnz	overflow	(or tnz)
			
 
				+ */
			
 
				+
			
 
				+#include <sysdep.h>
			
 
				+
			
 
				+
			
 
				+.global   .umul;
			
 
				+.align 4;
			
 
				+.type  .umul ,@function; 
			
 
				+
			
 
				+.umul: 
			
 
				+	or	%o0, %o1, %o4
			
 
				+	mov	%o0, %y			! multiplier -> Y
			
 
				+	andncc	%o4, 0xfff, %g0		! test bits 12..31 of *both* args
			
 
				+	be	.Lmul_shortway	! if zero, can do it the short way
			
 
				+	 andcc	%g0, %g0, %o4		! zero the partial product; clear N & V
			
 
				+
			
 
				+	/*
			
 
				+	 * Long multiply.  32 steps, followed by a final shift step.
			
 
				+	 */
			
 
				+	mulscc	%o4, %o1, %o4	! 1
			
 
				+	mulscc	%o4, %o1, %o4	! 2
			
 
				+	mulscc	%o4, %o1, %o4	! 3
			
 
				+	mulscc	%o4, %o1, %o4	! 4
			
 
				+	mulscc	%o4, %o1, %o4	! 5
			
 
				+	mulscc	%o4, %o1, %o4	! 6
			
 
				+	mulscc	%o4, %o1, %o4	! 7
			
 
				+	mulscc	%o4, %o1, %o4	! 8
			
 
				+	mulscc	%o4, %o1, %o4	! 9
			
 
				+	mulscc	%o4, %o1, %o4	! 10
			
 
				+	mulscc	%o4, %o1, %o4	! 11
			
 
				+	mulscc	%o4, %o1, %o4	! 12
			
 
				+	mulscc	%o4, %o1, %o4	! 13
			
 
				+	mulscc	%o4, %o1, %o4	! 14
			
 
				+	mulscc	%o4, %o1, %o4	! 15
			
 
				+	mulscc	%o4, %o1, %o4	! 16
			
 
				+	mulscc	%o4, %o1, %o4	! 17
			
 
				+	mulscc	%o4, %o1, %o4	! 18
			
 
				+	mulscc	%o4, %o1, %o4	! 19
			
 
				+	mulscc	%o4, %o1, %o4	! 20
			
 
				+	mulscc	%o4, %o1, %o4	! 21
			
 
				+	mulscc	%o4, %o1, %o4	! 22
			
 
				+	mulscc	%o4, %o1, %o4	! 23
			
 
				+	mulscc	%o4, %o1, %o4	! 24
			
 
				+	mulscc	%o4, %o1, %o4	! 25
			
 
				+	mulscc	%o4, %o1, %o4	! 26
			
 
				+	mulscc	%o4, %o1, %o4	! 27
			
 
				+	mulscc	%o4, %o1, %o4	! 28
			
 
				+	mulscc	%o4, %o1, %o4	! 29
			
 
				+	mulscc	%o4, %o1, %o4	! 30
			
 
				+	mulscc	%o4, %o1, %o4	! 31
			
 
				+	mulscc	%o4, %o1, %o4	! 32
			
 
				+	mulscc	%o4, %g0, %o4	! final shift
			
 
				+
			
 
				+	/*
			
 
				+	 * Normally, with the shift-and-add approach, if both numbers are
			
 
				+	 * positive you get the correct result.  With 32-bit two's-complement
			
 
				+	 * numbers, -x is represented as
			
 
				+	 *
			
 
				+	 *		  x		    32
			
 
				+	 *	( 2  -  ------ ) mod 2  *  2
			
 
				+	 *		   32
			
 
				+	 *		  2
			
 
				+	 *
			
 
				+	 * (the `mod 2' subtracts 1 from 1.bbbb).  To avoid lots of 2^32s,
			
 
				+	 * we can treat this as if the radix point were just to the left
			
 
				+	 * of the sign bit (multiply by 2^32), and get
			
 
				+	 *
			
 
				+	 *	-x  =  (2 - x) mod 2
			
 
				+	 *
			
 
				+	 * Then, ignoring the `mod 2's for convenience:
			
 
				+	 *
			
 
				+	 *   x *  y	= xy
			
 
				+	 *  -x *  y	= 2y - xy
			
 
				+	 *   x * -y	= 2x - xy
			
 
				+	 *  -x * -y	= 4 - 2x - 2y + xy
			
 
				+	 *
			
 
				+	 * For signed multiplies, we subtract (x << 32) from the partial
			
 
				+	 * product to fix this problem for negative multipliers (see mul.s).
			
 
				+	 * Because of the way the shift into the partial product is calculated
			
 
				+	 * (N xor V), this term is automatically removed for the multiplicand,
			
 
				+	 * so we don't have to adjust.
			
 
				+	 *
			
 
				+	 * But for unsigned multiplies, the high order bit wasn't a sign bit,
			
 
				+	 * and the correction is wrong.  So for unsigned multiplies where the
			
 
				+	 * high order bit is one, we end up with xy - (y << 32).  To fix it
			
 
				+	 * we add y << 32.
			
 
				+	 */
			
 
				+#if 0
			
 
				+	tst	%o1
			
 
				+	bl,a	1f		! if %o1 < 0 (high order bit = 1),
			
 
				+	 add	%o4, %o0, %o4	! %o4 += %o0 (add y to upper half)
			
 
				+1:	rd	%y, %o0		! get lower half of product
			
 
				+	retl
			
 
				+	 addcc	%o4, %g0, %o1	! put upper half in place and set Z for %o1==0
			
 
				+#else
			
 
				+	/* Faster code from tege@sics.se.  */
			
 
				+	sra	%o1, 31, %o2	! make mask from sign bit
			
 
				+	and	%o0, %o2, %o2	! %o2 = 0 or %o0, depending on sign of %o1
			
 
				+	rd	%y, %o0		! get lower half of product
			
 
				+	retl
			
 
				+	 addcc	%o4, %o2, %o1	! add compensation and put upper half in place
			
 
				+#endif
			
 
				+
			
 
				+.Lmul_shortway:
			
 
				+	/*
			
 
				+	 * Short multiply.  12 steps, followed by a final shift step.
			
 
				+	 * The resulting bits are off by 12 and (32-12) = 20 bit positions,
			
 
				+	 * but there is no problem with %o0 being negative (unlike above),
			
 
				+	 * and overflow is impossible (the answer is at most 24 bits long).
			
 
				+	 */
			
 
				+	mulscc	%o4, %o1, %o4	! 1
			
 
				+	mulscc	%o4, %o1, %o4	! 2
			
 
				+	mulscc	%o4, %o1, %o4	! 3
			
 
				+	mulscc	%o4, %o1, %o4	! 4
			
 
				+	mulscc	%o4, %o1, %o4	! 5
			
 
				+	mulscc	%o4, %o1, %o4	! 6
			
 
				+	mulscc	%o4, %o1, %o4	! 7
			
 
				+	mulscc	%o4, %o1, %o4	! 8
			
 
				+	mulscc	%o4, %o1, %o4	! 9
			
 
				+	mulscc	%o4, %o1, %o4	! 10
			
 
				+	mulscc	%o4, %o1, %o4	! 11
			
 
				+	mulscc	%o4, %o1, %o4	! 12
			
 
				+	mulscc	%o4, %g0, %o4	! final shift
			
 
				+
			
 
				+	/*
			
 
				+	 * %o4 has 20 of the bits that should be in the result; %y has
			
 
				+	 * the bottom 12 (as %y's top 12).  That is:
			
 
				+	 *
			
 
				+	 *	  %o4		    %y
			
 
				+	 * +----------------+----------------+
			
 
				+	 * | -12- |   -20-  | -12- |   -20-  |
			
 
				+	 * +------(---------+------)---------+
			
 
				+	 *	   -----result-----
			
 
				+	 *
			
 
				+	 * The 12 bits of %o4 left of the `result' area are all zero;
			
 
				+	 * in fact, all top 20 bits of %o4 are zero.
			
 
				+	 */
			
 
				+
			
 
				+	rd	%y, %o5
			
 
				+	sll	%o4, 12, %o0	! shift middle bits left 12
			
 
				+	srl	%o5, 20, %o5	! shift low bits right 20
			
 
				+	or	%o5, %o0, %o0
			
 
				+	retl
			
 
				+	 addcc	%g0, %g0, %o1	! %o1 = zero, and set Z
			
 
				+
			
 
				+.size  .umul , . -.umul
			
--- a/libc/sysdeps/linux/sparc/urem.S
+++ b/libc/sysdeps/linux/sparc/urem.S
@@ -0,0 +1,350 @@
 
				+   /* This file is generated from divrem.m4; DO NOT EDIT! */
			
 
				+/*
			
 
				+ * Division and remainder, from Appendix E of the Sparc Version 8
			
 
				+ * Architecture Manual, with fixes from Gordon Irlam.
			
 
				+ */
			
 
				+
			
 
				+/*
			
 
				+ * Input: dividend and divisor in %o0 and %o1 respectively.
			
 
				+ *
			
 
				+ * m4 parameters:
			
 
				+ *  .urem	name of function to generate
			
 
				+ *  rem		rem=div => %o0 / %o1; rem=rem => %o0 % %o1
			
 
				+ *  false		false=true => signed; false=false => unsigned
			
 
				+ *
			
 
				+ * Algorithm parameters:
			
 
				+ *  N		how many bits per iteration we try to get (4)
			
 
				+ *  WORDSIZE	total number of bits (32)
			
 
				+ *
			
 
				+ * Derived constants:
			
 
				+ *  TOPBITS	number of bits in the top decade of a number
			
 
				+ *
			
 
				+ * Important variables:
			
 
				+ *  Q		the partial quotient under development (initially 0)
			
 
				+ *  R		the remainder so far, initially the dividend
			
 
				+ *  ITER	number of main division loop iterations required;
			
 
				+ *		equal to ceil(log2(quotient) / N).  Note that this
			
 
				+ *		is the log base (2^N) of the quotient.
			
 
				+ *  V		the current comparand, initially divisor*2^(ITER*N-1)
			
 
				+ *
			
 
				+ * Cost:
			
 
				+ *  Current estimate for non-large dividend is
			
 
				+ *	ceil(log2(quotient) / N) * (10 + 7N/2) + C
			
 
				+ *  A large dividend is one greater than 2^(31-TOPBITS) and takes a
			
 
				+ *  different path, as the upper bits of the quotient must be developed
			
 
				+ *  one bit at a time.
			
 
				+ */
			
 
				+
			
 
				+
			
 
				+
			
 
				+#include <sysdep.h>
			
 
				+
			
 
				+
			
 
				+.global   .urem;
			
 
				+.align 4;
			
 
				+.type  .urem ,@function; 
			
 
				+
			
 
				+.urem: 
			
 
				+
			
 
				+	! Ready to divide.  Compute size of quotient; scale comparand.
			
 
				+	orcc	%o1, %g0, %o5
			
 
				+	bne	1f
			
 
				+	mov	%o0, %o3
			
 
				+
			
 
				+		! Divide by zero trap.  If it returns, return 0 (about as
			
 
				+		! wrong as possible, but that is what SunOS does...).
			
 
				+		ta	0x02 
			
 
				+		retl
			
 
				+		clr	%o0
			
 
				+
			
 
				+1:
			
 
				+	cmp	%o3, %o5			! if %o1 exceeds %o0, done
			
 
				+	blu	.Lgot_result		! (and algorithm fails otherwise)
			
 
				+	clr	%o2
			
 
				+	sethi	%hi(1 << (32 - 4 - 1)), %g1
			
 
				+	cmp	%o3, %g1
			
 
				+	blu	.Lnot_really_big
			
 
				+	clr	%o4
			
 
				+
			
 
				+	! Here the dividend is >= 2**(31-N) or so.  We must be careful here,
			
 
				+	! as our usual N-at-a-shot divide step will cause overflow and havoc.
			
 
				+	! The number of bits in the result here is N*ITER+SC, where SC <= N.
			
 
				+	! Compute ITER in an unorthodox manner: know we need to shift V into
			
 
				+	! the top decade: so do not even bother to compare to R.
			
 
				+	1:
			
 
				+		cmp	%o5, %g1
			
 
				+		bgeu	3f
			
 
				+		mov	1, %g2
			
 
				+		sll	%o5, 4, %o5
			
 
				+		b	1b
			
 
				+		add	%o4, 1, %o4
			
 
				+
			
 
				+	! Now compute %g2.
			
 
				+	2:	addcc	%o5, %o5, %o5
			
 
				+		bcc	.Lnot_too_big
			
 
				+		add	%g2, 1, %g2
			
 
				+
			
 
				+		! We get here if the %o1 overflowed while shifting.
			
 
				+		! This means that %o3 has the high-order bit set.
			
 
				+		! Restore %o5 and subtract from %o3.
			
 
				+		sll	%g1, 4, %g1	! high order bit
			
 
				+		srl	%o5, 1, %o5		! rest of %o5
			
 
				+		add	%o5, %g1, %o5
			
 
				+		b	.Ldo_single_div
			
 
				+		sub	%g2, 1, %g2
			
 
				+
			
 
				+	.Lnot_too_big:
			
 
				+	3:	cmp	%o5, %o3
			
 
				+		blu	2b
			
 
				+		nop
			
 
				+		be	.Ldo_single_div
			
 
				+		nop
			
 
				+	/* NB: these are commented out in the V8-Sparc manual as well */
			
 
				+	/* (I do not understand this) */
			
 
				+	! %o5 > %o3: went too far: back up 1 step
			
 
				+	!	srl	%o5, 1, %o5
			
 
				+	!	dec	%g2
			
 
				+	! do single-bit divide steps
			
 
				+	!
			
 
				+	! We have to be careful here.  We know that %o3 >= %o5, so we can do the
			
 
				+	! first divide step without thinking.  BUT, the others are conditional,
			
 
				+	! and are only done if %o3 >= 0.  Because both %o3 and %o5 may have the high-
			
 
				+	! order bit set in the first step, just falling into the regular
			
 
				+	! division loop will mess up the first time around.
			
 
				+	! So we unroll slightly...
			
 
				+	.Ldo_single_div:
			
 
				+		subcc	%g2, 1, %g2
			
 
				+		bl	.Lend_regular_divide
			
 
				+		nop
			
 
				+		sub	%o3, %o5, %o3
			
 
				+		mov	1, %o2
			
 
				+		b	.Lend_single_divloop
			
 
				+		nop
			
 
				+	.Lsingle_divloop:
			
 
				+		sll	%o2, 1, %o2
			
 
				+		bl	1f
			
 
				+		srl	%o5, 1, %o5
			
 
				+		! %o3 >= 0
			
 
				+		sub	%o3, %o5, %o3
			
 
				+		b	2f
			
 
				+		add	%o2, 1, %o2
			
 
				+	1:	! %o3 < 0
			
 
				+		add	%o3, %o5, %o3
			
 
				+		sub	%o2, 1, %o2
			
 
				+	2:
			
 
				+	.Lend_single_divloop:
			
 
				+		subcc	%g2, 1, %g2
			
 
				+		bge	.Lsingle_divloop
			
 
				+		tst	%o3
			
 
				+		b,a	.Lend_regular_divide
			
 
				+
			
 
				+.Lnot_really_big:
			
 
				+1:
			
 
				+	sll	%o5, 4, %o5
			
 
				+	cmp	%o5, %o3
			
 
				+	bleu	1b
			
 
				+	addcc	%o4, 1, %o4
			
 
				+	be	.Lgot_result
			
 
				+	sub	%o4, 1, %o4
			
 
				+
			
 
				+	tst	%o3	! set up for initial iteration
			
 
				+.Ldivloop:
			
 
				+	sll	%o2, 4, %o2
			
 
				+		! depth 1, accumulated bits 0
			
 
				+	bl	.L1.16
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 2, accumulated bits 1
			
 
				+	bl	.L2.17
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits 3
			
 
				+	bl	.L3.19
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 7
			
 
				+	bl	.L4.23
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (7*2+1), %o2
			
 
				+	
			
 
				+.L4.23:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (7*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.19:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 5
			
 
				+	bl	.L4.21
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (5*2+1), %o2
			
 
				+	
			
 
				+.L4.21:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (5*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+.L2.17:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits 1
			
 
				+	bl	.L3.17
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 3
			
 
				+	bl	.L4.19
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (3*2+1), %o2
			
 
				+	
			
 
				+.L4.19:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (3*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.17:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits 1
			
 
				+	bl	.L4.17
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (1*2+1), %o2
			
 
				+	
			
 
				+.L4.17:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (1*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+.L1.16:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 2, accumulated bits -1
			
 
				+	bl	.L2.15
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits -1
			
 
				+	bl	.L3.15
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -1
			
 
				+	bl	.L4.15
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-1*2+1), %o2
			
 
				+	
			
 
				+.L4.15:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-1*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.15:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -3
			
 
				+	bl	.L4.13
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-3*2+1), %o2
			
 
				+	
			
 
				+.L4.13:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-3*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+.L2.15:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 3, accumulated bits -3
			
 
				+	bl	.L3.13
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -5
			
 
				+	bl	.L4.11
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-5*2+1), %o2
			
 
				+	
			
 
				+.L4.11:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-5*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+.L3.13:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+			! depth 4, accumulated bits -7
			
 
				+	bl	.L4.9
			
 
				+	srl	%o5,1,%o5
			
 
				+	! remainder is positive
			
 
				+	subcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-7*2+1), %o2
			
 
				+	
			
 
				+.L4.9:
			
 
				+	! remainder is negative
			
 
				+	addcc	%o3,%o5,%o3
			
 
				+		b	9f
			
 
				+		add	%o2, (-7*2-1), %o2
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+	
			
 
				+	9:
			
 
				+.Lend_regular_divide:
			
 
				+	subcc	%o4, 1, %o4
			
 
				+	bge	.Ldivloop
			
 
				+	tst	%o3
			
 
				+	bl,a	.Lgot_result
			
 
				+	! non-restoring fixup here (one instruction only!)
			
 
				+	add	%o3, %o1, %o3
			
 
				+
			
 
				+
			
 
				+.Lgot_result:
			
 
				+
			
 
				+	retl
			
 
				+	mov %o3, %o0
			
 
				+
			
 
				+END(.urem)