ttmath/ttmath/ttmathuint64.h

/*
 * This file is a part of TTMath Mathematical Library
 * and is distributed under the (new) BSD licence.
 * Author: Tomasz Sowa <t.sowa@slimaczek.pl>
 */

/* 
 * Copyright (c) 2006-2007, Tomasz Sowa
 * All rights reserved.
 * 
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 * 
 *  * Redistributions of source code must retain the above copyright notice,
 *    this list of conditions and the following disclaimer.
 *    
 *  * Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *    
 *  * Neither the name Tomasz Sowa nor the names of contributors to this
 *    project may be used to endorse or promote products derived
 *    from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
 * THE POSSIBILITY OF SUCH DAMAGE.
 */


/*!
	\file ttmathuint64.h
    \brief template class UInt<uint> for 64bit processors
*/


namespace ttmath
{

	/*!
	*
	*	basic mathematical functions
	*
	*/

#if defined _M_X64 || defined __x86_64__

	/*!
		this method adds ss2 and an incoming carry to this object
		(this = this + ss2 + c)

		c is the incoming carry: zero means "no carry", every non-zero
		value is treated as a carry equal to one

		the function returns the outgoing carry: 1 if the addition
		carried out of the highest word, 0 otherwise
	*/
	template<uint value_size>
	uint UInt<value_size>::Add(const UInt<value_size> & ss2, uint c)
	{
	uint b = value_size;
	uint * p1 = table;
	const uint * p2 = ss2.table;


		#ifdef __GNUC__
			/*
				this part should be compiled with gcc

				every register which the code modifies is declared as a
				read-write operand ("+"), so the compiler itself preserves
				whatever it needs -- the code must not push/pop by hand because
				on x86-64 a push can overwrite data the compiler keeps in the
				red zone below the stack pointer
			*/
			__asm__ __volatile__(

				/* CF = (c != 0): the subtraction 0 - c borrows only for a non-zero c */
				"movq $0, %%rax			\n"
				"subq %%rsi, %%rax		\n"

			"1:							\n"
				"movq (%%rbx),%%rax		\n"
				"adcq (%%rdx),%%rax		\n"
				"movq %%rax,(%%rbx)		\n"

				/* lea and loop don't touch the flags, the carry survives to the next word */
				"leaq 8(%%rbx), %%rbx	\n"
				"leaq 8(%%rdx), %%rdx	\n"

			"loop 1b					\n"

				/* mov leaves the flags alone, so this turns the final CF into 0 or 1 */
				"movq $0, %%rsi			\n"
				"adcq %%rsi, %%rsi		\n"

				: "+S" (c), "+c" (b), "+b" (p1), "+d" (p2)
				:
				: "%rax", "cc", "memory" );

		#else

			#error "another compiler than GCC is currently not supported in 64bit mode"

		#endif


	return c;
	}


	/*!
		this method adds one word (at a specific position)
		and returns a carry (if it was)

		value is added to table[index]; as long as there is a carry it is
		passed on to the following (higher) words

		e.g.

		if we've got (value_size=3):
			table[0] = 10;
			table[1] = 30;
			table[2] = 5;	
		and we call:
			AddInt(2,1)
		then it'll be:
			table[0] = 10;
			table[1] = 30 + 2;
			table[2] = 5;

		the function returns 1 if the carry went out of the last word
		(table[2] in the example above), otherwise 0

		index must be smaller than value_size (it is not checked here)
	*/
	template<uint value_size>
	uint UInt<value_size>::AddInt(uint value, uint index)
	{
	uint b = value_size - index;	// how many words there are from 'index' up to the end
	uint * p1 = table + index;		// the first word which is modified
	uint c;

		#ifdef __GNUC__
			/*
				all modified registers are read-write operands, there is no
				push/pop by hand (a push could overwrite the x86-64 red zone)
				and there is no operand which could be read after
				its register has been changed
			*/
			__asm__ __volatile__(

				"clc							\n"
			"1:									\n"

				"movq (%%rbx), %%rax			\n"
				"adcq %%rdx, %%rax				\n"
				"movq %%rax, (%%rbx)			\n"

			"jnc 2f								\n"

				/* from now on only the carry is being propagated (mov and lea keep CF) */
				"movq $0, %%rdx					\n"
				"leaq 8(%%rbx), %%rbx			\n"

			"loop 1b							\n"

			"2:									\n"

				/* rax = CF */
				"movq $0, %%rax					\n"
				"adcq %%rax,%%rax				\n"

				: "=a" (c), "+c" (b), "+b" (p1), "+d" (value)
				:
				: "cc", "memory" );

		#else

			#error "another compiler than GCC is currently not supported in 64bit mode"

		#endif

	
	return c;
	}


	/*!
		this method adds only two unsigned words to the existing value
		and these words begin on the 'index' position
		(it's used in the multiplication algorithm 2)

		index should be equal or smaller than value_size-2 (index <= value_size-2)
		(it is not checked here)
		x1 - lower word (added to table[index])
		x2 - higher word (added to table[index+1])

		for example if we've got value_size equal 4 and:
			table[0] = 3
			table[1] = 4
			table[2] = 5
			table[3] = 6
		then let
			x1 = 10
			x2 = 20
		and
			index = 1

		the result of this method will be:
			table[0] = 3
			table[1] = 4 + x1 = 14
			table[2] = 5 + x2 = 25
			table[3] = 6
		
		and no carry at the end of table[3]

		(of course if there was a carry in table[2](5+20) then 
		this carry would be passed to the table[3] etc.)

		the function returns 1 if the carry went out of the last word,
		otherwise 0
	*/
	template<uint value_size>
	uint UInt<value_size>::AddTwoInts(uint x2, uint x1, uint index)
	{
	uint b = value_size - index;	// how many words there are from 'index' up to the end
	uint * p1 = table + index;		// the word which x1 is added to
	uint c;

		#ifdef __GNUC__
			/*
				x1 and x2 live in fixed registers (rsi, rdx) which are different
				from rax -- rax is overwritten before x1 and x2 are consumed,
				so they must never be allocated there

				all modified registers are read-write operands and there is no
				push/pop by hand (a push could overwrite the x86-64 red zone)
			*/
			__asm__ __volatile__(

				/* table[index] += x1 */
				"movq (%%rbx), %%rax			\n"
				"addq %%rsi, %%rax				\n"
				"movq %%rax, (%%rbx)			\n"

				"leaq 8(%%rbx), %%rbx			\n"

				/* table[index+1] += x2 + carry */
				"movq (%%rbx), %%rax			\n"
				"adcq %%rdx, %%rax				\n"
				"movq %%rax, (%%rbx)			\n"
			"jnc 2f								\n"

				/* x2 is not needed any more, rdx is the zero added with the carry below */
				"movq $0, %%rdx					\n"

				/* two words are done; dec keeps CF, so when nothing is left CF=1 is returned */
				"dec %%rcx						\n"
				"dec %%rcx						\n"
			"jz 2f								\n"

			"1:									\n"
				"leaq 8(%%rbx), %%rbx			\n"

				"movq (%%rbx), %%rax			\n"
				"adcq %%rdx, %%rax				\n"
				"movq %%rax, (%%rbx)			\n"

			"jnc 2f								\n"

			"loop 1b							\n"

			"2:									\n"

				/* rax = CF */
				"movq $0, %%rax					\n"
				"adcq %%rax,%%rax				\n"

				: "=&a" (c), "+c" (b), "+b" (p1), "+d" (x2)
				: "S" (x1)
				: "cc", "memory" );

		#else

			#error "another compiler than GCC is currently not supported in 64bit mode"

		#endif

	
	return c;
	}


	/*!
		this method subtracts ss2 and an incoming borrow from this object
		(this = this - ss2 - c)

		c is the incoming borrow: zero means "no borrow", every non-zero
		value is treated as a borrow equal to one

		the function returns the outgoing borrow: 1 if the subtraction
		borrowed from beyond the highest word, 0 otherwise
	*/
	template<uint value_size>
	uint UInt<value_size>::Sub(const UInt<value_size> & ss2, uint c)
	{
	uint b = value_size;
	uint * p1 = table;
	const uint * p2 = ss2.table;

		#ifdef __GNUC__
			/*
				every register which the code modifies is declared as a
				read-write operand ("+"), so the compiler itself preserves
				whatever it needs -- the code must not push/pop by hand because
				on x86-64 a push can overwrite data the compiler keeps in the
				red zone below the stack pointer
			*/
			__asm__  __volatile__(

				/* CF = (c != 0): the subtraction 0 - c borrows only for a non-zero c */
				"movq $0, %%rax			\n"
				"subq %%rsi, %%rax		\n"

			"1:							\n"
				"movq (%%rbx),%%rax		\n"
				"sbbq (%%rdx),%%rax		\n"
				"movq %%rax,(%%rbx)		\n"

				/* lea and loop don't touch the flags, the borrow survives to the next word */
				"leaq 8(%%rbx), %%rbx	\n"
				"leaq 8(%%rdx), %%rdx	\n"

			"loop 1b					\n"

				/* mov leaves the flags alone, so this turns the final CF into 0 or 1 */
				"movq $0, %%rsi			\n"
				"adcq %%rsi, %%rsi		\n"

				: "+S" (c), "+c" (b), "+b" (p1), "+d" (p2)
				:
				: "%rax", "cc", "memory" );

		#else

			#error "another compiler than GCC is currently not supported in 64bit mode"

		#endif


	return c;
	}


	/*!
		this method subtracts one word (at a specific position)
		and returns a carry (if it was)

		value is subtracted from table[index]; as long as there is a borrow
		it is passed on to the following (higher) words

		e.g.

		if we've got (value_size=3):
			table[0] = 10;
			table[1] = 30;
			table[2] = 5;	
		and we call:
			SubInt(2,1)
		then it'll be:
			table[0] = 10;
			table[1] = 30 - 2;
			table[2] = 5;

		the function returns 1 if the borrow went out of the last word
		(table[2] in the example above), otherwise 0

		index must be smaller than value_size (it is not checked here)
	*/
	template<uint value_size>
	uint UInt<value_size>::SubInt(uint value, uint index)
	{
	uint b = value_size - index;	// how many words there are from 'index' up to the end
	uint * p1 = table + index;		// the first word which is modified
	uint c;

		#ifdef __GNUC__
			/*
				all modified registers are read-write operands, there is no
				push/pop by hand (a push could overwrite the x86-64 red zone)
				and there is no operand which could be read after
				its register has been changed
			*/
			__asm__ __volatile__(

				"clc							\n"
			"1:									\n"

				"movq (%%rbx), %%rax			\n"
				"sbbq %%rdx, %%rax				\n"
				"movq %%rax, (%%rbx)			\n"

			"jnc 2f								\n"

				/* from now on only the borrow is being propagated (mov and lea keep CF) */
				"movq $0, %%rdx					\n"
				"leaq 8(%%rbx), %%rbx			\n"

			"loop 1b							\n"

			"2:									\n"

				/* rax = CF */
				"movq $0, %%rax					\n"
				"adcq %%rax,%%rax				\n"

				: "=a" (c), "+c" (b), "+b" (p1), "+d" (value)
				:
				: "cc", "memory" );

		#else

			#error "another compiler than GCC is currently not supported in 64bit mode"

		#endif

	
	return c;
	}


	/*!
		this method moves all bits one position to the left
		return value <- this <- C

		the lowest bit of the value will hold 'c' (zero means 0,
		every non-zero value means 1) and the function returns
		the bit which has been shifted out of the highest word (0 or 1)
	*/
	template<uint value_size>
	uint UInt<value_size>::Rcl(uint c)
	{
	sint b = value_size;
	uint * p1 = table;


		#ifdef __GNUC__
			/*
				the modified registers are read-write operands, there is no
				push/pop by hand (a push could overwrite the x86-64 red zone)
			*/
			__asm__  __volatile__(

				/* CF = (c != 0) */
				"movq $0,%%rax			\n"
				"subq %%rdx,%%rax		\n"

			"1:							\n"
				/* rotate through carry: CF goes in at bit 0, the top bit goes out to CF */
				"rclq $1,(%%rbx)		\n"

				/* lea and loop keep CF for the next (higher) word */
				"leaq 8(%%rbx), %%rbx	\n"

			"loop 1b					\n"

				/* rdx = CF */
				"movq $0, %%rdx			\n"
				"adcq %%rdx,%%rdx		\n"

				: "+d" (c), "+c" (b), "+b" (p1)
				:
				: "%rax", "cc", "memory" );

		#else

			#error "another compiler than GCC is currently not supported in 64bit mode"

		#endif


	return c;
	}


	/*!
		this method moves all bits one position to the right
		C -> *this -> return value

		the highest bit of the value will hold 'c' (zero means 0,
		every non-zero value means 1) and the function returns
		the bit which has been shifted out of the lowest word (0 or 1)
	*/
	template<uint value_size>
	uint UInt<value_size>::Rcr(uint c)
	{
	sint b = value_size;
	uint * p1 = table + value_size;	// one past the highest word, the loop walks downwards


		#ifdef __GNUC__
			/*
				the modified registers are read-write operands, there is no
				push/pop by hand (a push could overwrite the x86-64 red zone)
			*/
			__asm__  __volatile__(

				/* CF = (c != 0) */
				"movq $0, %%rax			\n"
				"subq %%rdx, %%rax		\n"

			"1:							\n"
				/* step down to the next lower word (lea keeps CF) */
				"leaq -8(%%rbx), %%rbx	\n"

				/* rotate through carry: CF goes in at the top bit, bit 0 goes out to CF */
				"rcrq $1,(%%rbx)		\n"

			"loop 1b					\n"

				/* rdx = CF */
				"movq $0, %%rdx			\n"
				"adcq %%rdx,%%rdx		\n"

				: "+d" (c), "+c" (b), "+b" (p1)
				:
				: "%rax", "cc", "memory" );

		#else

			#error "another compiler than GCC is currently not supported in 64bit mode"

		#endif


	return c;
	}


	/*!
		this method returns the number of the highest set bit in one word
		(the word is scanned with the 64bit 'bsrq' instruction)

		if the 'x' is zero this method returns '-1'
	*/
	template<uint value_size>
	sint UInt<value_size>::FindLeadingBitInWord(uint x)
	{
	sint result;

		#ifdef __GNUC__
			/*
				the result depends only on 'x' so the asm needn't be volatile
			*/
			__asm__(

			/* bsr sets ZF when the source is zero (the destination is undefined then) */
			"bsrq %%rbx, %%rax	\n"
			"jnz 1f				\n"
			"movq $-1, %%rax	\n"
		"1:						\n"

			: "=a" (result)
			: "b" (x)
			: "cc" );

		#else

			#error "another compiler than GCC is currently not supported in 64bit mode"

		#endif


	return result;
	}


	/*!
		this method returns 'value' with one additional bit set

		bit is the zero-based number of the bit to set; the 64bit 'btsq'
		instruction is used here so the meaningful range is <0,63>

		e.g.
		SetBitInWord(0,0) = 1
		SetBitInWord(0,2) = 4
		SetBitInWord(10, 8) = 266
	*/
	template<uint value_size>
	uint UInt<value_size>::SetBitInWord(uint value, uint bit)
	{
		#ifdef __GNUC__

			/* 'value' is both the input and the result, it stays in rax */
			__asm__  __volatile__(

			"btsq %%rbx,%%rax	\n"

			: "+a" (value)
			: "b" (bit)
			: "cc" );

		#else

			#error "another compiler than GCC is currently not supported in 64bit mode"

		#endif

	return value;
	}


	/*!
	 *
	 * Multiplication
	 *
	 *
	*/


	/*!
		multiplication: result2:result1 = a * b
		result2 - higher word
		result1 - lower word of the result
	
		this method never returns a carry (the full double-word product
		is stored through result2 and result1)

		it is an auxiliary method for version two of the multiplication algorithm
	*/
	template<uint value_size>
	void UInt<value_size>::MulTwoWords(uint a, uint b, uint * result2, uint * result1)
	{
	/*
		the asm writes into these temporary variables (plain register outputs)
		and they are copied through the pointers afterwards, in this way the
		compiler knows that the values pointed with result1 and result2
		have changed (it matters when using gcc and options like -O)
	*/
	uint result1_;
	uint result2_;

		#ifdef __GNUC__

		/*
			mulq multiplies rax by its operand and leaves the product in rdx:rax

			the result depends only on 'a' and 'b' so the asm needn't be volatile
		*/
		__asm__(
		
			"mulq %%rdx			\n"

			: "=a" (result1_), "=d" (result2_)
			: "0" (a), "1" (b)
			: "cc" );

		#else

			#error "another compiler than GCC is currently not supported in 64bit mode"

		#endif


		*result1 = result1_;
		*result2 = result2_;
	}


	/*!
	 *
	 * Division
	 *
	 *
	*/
	

	/*!
		this method divides the two-word value a:b (a - higher word,
		b - lower word) by the one-word value c
		(with 'divq' this is a 128bit value divided by a 64bit value)

		r = a:b / c and rest - remainder

		*
		* WARNING:
		* if r (one word) is too small for the result or c is equal zero
		* the processor raises a divide error
		* and it is probably the end of your program
		*
	*/
	template<uint value_size>
	void UInt<value_size>::DivTwoWords(uint a,uint b, uint c, uint * r, uint * rest)
	{
		/*
			these variables have similar meaning like those in
			the multiplication algorithm MulTwoWords: the asm writes into
			them and they are copied through the pointers afterwards
		*/
		uint r_;
		uint rest_;

		#ifdef __GNUC__
		
			/*
				divq divides rdx:rax by its operand,
				the quotient is left in rax and the remainder in rdx

				the asm stays volatile because the instruction can trap
			*/
			__asm__ __volatile__(

			"divq %%rcx				\n"

			: "=a" (r_), "=d" (rest_)
			: "0" (b), "1" (a), "c" (c)
			: "cc" );

		#else

			#error "another compiler than GCC is currently not supported in 64bit mode"

		#endif


		*r = r_;
		*rest = rest_;
	}

#endif

} //namespace
fixed the problem with a sign in the mathematical parser /-(1) was 1/ added UInt::AddInt and UInt::SubInt changed UInt::AddOne and UInt::SubOne (much faster now) added UInt::SetBitInWord changed UInt::SetBit (much faster now) UInt::AddTwoUints renamed to UInt::AddTwoInts UInt::FindLeadingBit32 renamed to UInt::FindLeadingBitInWord added UInt::SetBitInWord UInt::Mul64 renamed to UInt::MulTwoWords UInt::Div64 renamed to UInt::DivTwoWords and more small changes in UInt type start adding support for Amd64 (not finished yet) (added ttmathuint64.h) git-svn-id: svn://ttmath.org/publicrep/ttmath/trunk@12 e52654a7-88a9-db11-a3e9-0013d4bc506e 2007-01-29 18:58:18 +01:00			`/*`
			`* This file is a part of TTMath Mathematical Library`
			`* and is distributed under the (new) BSD licence.`
			`* Author: Tomasz Sowa <t.sowa@slimaczek.pl>`
			`*/`

			`/*`
			`* Copyright (c) 2006-2007, Tomasz Sowa`
			`* All rights reserved.`
			`*`
			`* Redistribution and use in source and binary forms, with or without`
			`* modification, are permitted provided that the following conditions are met:`
			`*`
			`* * Redistributions of source code must retain the above copyright notice,`
			`* this list of conditions and the following disclaimer.`
			`*`
			`* * Redistributions in binary form must reproduce the above copyright`
			`* notice, this list of conditions and the following disclaimer in the`
			`* documentation and/or other materials provided with the distribution.`
			`*`
			`* * Neither the name Tomasz Sowa nor the names of contributors to this`
			`* project may be used to endorse or promote products derived`
			`* from this software without specific prior written permission.`
			`*`
			`* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"`
			`* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE`
			`* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE`
			`* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE`
			`* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR`
			`* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF`
			`* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS`
			`* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN`
			`* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)`
			`* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF`
			`* THE POSSIBILITY OF SUCH DAMAGE.`
			`*/`



			`/*!`
			`\file ttmathuint.h`
			`\brief template class UInt<uint> for 64bit processors`
			`*/`


			`namespace ttmath`
			`{`

			`/*!`
			`*`
			`* basic mathematic functions`
			`*`
			`*/`

			`#if defined _M_X64 \|\| defined __x86_64__`

			`/*!`
			`this method adding ss2 to the this and adding carry if it's defined`
			`(this = this + ss2 + c)`

			`c must be zero or one (might be a bigger value than 1)`
			`function returns carry (1) (if it was)`
			`*/`
			`template<uint value_size>`
			`uint UInt<value_size>::Add(const UInt<value_size> & ss2, uint c)`
			`{`
			`register uint b = value_size;`
			`register uint * p1 = table;`
			`register uint * p2 = const_cast<uint*>(ss2.table);`


			`#ifndef __GNUC__`

			`#error "another compiler than GCC is currently not supported in 64bit mode"`

			`/*`
			`this part might be compiled with for example visual c`
			`*/`
			`__asm`
			`{`
			`}`
			`#endif`


			`#ifdef __GNUC__`
			`/*`
			`this part should be compiled with gcc`
			`*/`
			`__asm__ __volatile__(`

			`"push %%rbx \n"`
			`"push %%rcx \n"`
			`"push %%rdx \n"`

			`"movq $0, %%rax \n"`
			`"subq %%rsi, %%rax \n"`

			`"1: \n"`
			`"movq (%%rbx),%%rax \n"`
			`"adcq (%%rdx),%%rax \n"`
			`"movq %%rax,(%%rbx) \n"`

			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`

			`"inc %%rdx \n"`
			`"inc %%rdx \n"`
			`"inc %%rdx \n"`
			`"inc %%rdx \n"`
			`"inc %%rdx \n"`
			`"inc %%rdx \n"`
			`"inc %%rdx \n"`
			`"inc %%rdx \n"`

			`"loop 1b \n"`

			`"movq $0, %%rax \n"`
			`"adcq %%rax,%%rax \n"`
			`"movq %%rax, %%rsi \n"`

			`"pop %%rdx \n"`
			`"pop %%rcx \n"`
			`"pop %%rbx \n"`

			`: "=S" (c)`
			`: "0" (c), "c" (b), "b" (p1), "d" (p2)`
			`: "%rax", "cc", "memory" );`

			`#endif`



			`return c;`
			`}`



			`/*!`
			`this method adds one word (at a specific position)`
			`and returns a carry (if it was)`

			`e.g.`

			`if we've got (value_size=3):`
			`table[0] = 10;`
			`table[1] = 30;`
			`table[2] = 5;`
			`and we call:`
			`AddInt(2,1)`
			`then it'll be:`
			`table[0] = 10;`
			`table[1] = 30 + 2;`
			`table[2] = 5;`

			`of course if there was a carry from table[3] it would be returned`
			`*/`
			`template<uint value_size>`
			`uint UInt<value_size>::AddInt(uint value, uint index)`
			`{`
			`register uint b = value_size;`
			`register uint * p1 = table;`
			`register uint c;`

			`#ifndef __GNUC__`

			`#error "another compiler than GCC is currently not supported in 64bit mode"`

			`__asm`
			`{`
			`}`
			`#endif`


			`#ifdef __GNUC__`
			`__asm__ __volatile__(`
			`"push %%rbx \n"`
			`"push %%rcx \n"`
			`"push %%rdx \n"`

			`"subq %%rdx, %%rcx \n"`

			`"leaq (%%rbx,%%rdx,8), %%rbx \n"`

			`"movq %4, %%rdx \n"`
			`"clc \n"`
			`"1: \n"`

			`"movq (%%rbx), %%rax \n"`
			`"adcq %%rdx, %%rax \n"`
			`"movq %%rax, (%%rbx) \n"`

			`"jnc 2f \n"`

			`"movq $0, %%rdx \n"`

			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`

			`"loop 1b \n"`

			`"2: \n"`

			`"movq $0, %%rax \n"`
			`"adcq %%rax,%%rax \n"`

			`"pop %%rdx \n"`
			`"pop %%rcx \n"`
			`"pop %%rbx \n"`

			`: "=a" (c)`
			`: "c" (b), "d" (index), "b" (p1), "q" (value)`
			`: "cc", "memory" );`

			`#endif`


			`return c;`
			`}`



			`/*!`
			`this method adds only two unsigned words to the existing value`
			`and these words begin on the 'index' position`
			`(it's used in the multiplication algorithm 2)`

			`index should be equal or smaller than value_size-2 (index <= value_size-2)`
			`x1 - lower word, x2 - higher word`

			`for example if we've got value_size equal 4 and:`
			`table[0] = 3`
			`table[1] = 4`
			`table[2] = 5`
			`table[3] = 6`
			`then let`
			`x1 = 10`
			`x2 = 20`
			`and`
			`index = 1`

			`the result of this method will be:`
			`table[0] = 3`
			`table[1] = 4 + x1 = 14`
			`table[2] = 5 + x2 = 25`
			`table[3] = 6`

			`and no carry at the end of table[3]`

			`(of course if there was a carry in table[2](5+20) then`
			`this carry would be passed to the table[3] etc.)`
			`*/`
			`template<uint value_size>`
added samples/uint.cpp samples/int.cpp samples/Makefile changed Int::Div -- a remainder is not returning now but taking as a parameter (a pointer or reference) changed order in parameters in UInt::AddTwoInts added Int::AddInt added Int::AddTwoInts added Int::SubInt changed Int::AddOne and Int::SubOne (much faster now) fixed a bug in UInt::operator--() and Int::operator--() (there was adding instead of subtracting) git-svn-id: svn://ttmath.org/publicrep/ttmath/trunk@13 e52654a7-88a9-db11-a3e9-0013d4bc506e 2007-02-05 18:40:23 +01:00			`uint UInt<value_size>::AddTwoInts(uint x2, uint x1, uint index)`
fixed the problem with a sign in the mathematical parser /-(1) was 1/ added UInt::AddInt and UInt::SubInt changed UInt::AddOne and UInt::SubOne (much faster now) added UInt::SetBitInWord changed UInt::SetBit (much faster now) UInt::AddTwoUints renamed to UInt::AddTwoInts UInt::FindLeadingBit32 renamed to UInt::FindLeadingBitInWord added UInt::SetBitInWord UInt::Mul64 renamed to UInt::MulTwoWords UInt::Div64 renamed to UInt::DivTwoWords and more small changes in UInt type start adding support for Amd64 (not finished yet) (added ttmathuint64.h) git-svn-id: svn://ttmath.org/publicrep/ttmath/trunk@12 e52654a7-88a9-db11-a3e9-0013d4bc506e 2007-01-29 18:58:18 +01:00			`{`
			`register uint b = value_size;`
			`register uint * p1 = table;`
			`register uint c;`

			`#ifndef __GNUC__`

			`#error "another compiler than GCC is currently not supported in 64bit mode"`

			`__asm`
			`{`
			`}`
			`#endif`


			`#ifdef __GNUC__`
			`__asm__ __volatile__(`

			`"push %%rbx \n"`
			`"push %%rcx \n"`
			`"push %%rdx \n"`

			`"subq %%rdx, %%rcx \n"`

			`"leaq (%%rbx,%%rdx,8), %%rbx \n"`

			`"movq $0, %%rdx \n"`

			`"movq (%%rbx), %%rax \n"`
			`"addq %4, %%rax \n"`
			`"movq %%rax, (%%rbx) \n"`

			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`

			`"movq (%%rbx), %%rax \n"`
			`"adcq %5, %%rax \n"`
			`"movq %%rax, (%%rbx) \n"`
			`"jnc 2f \n"`

			`"dec %%rcx \n"`
			`"dec %%rcx \n"`
			`"jz 2f \n"`

			`"1: \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`

			`"movq (%%rbx), %%rax \n"`
			`"adcq %%rdx, %%rax \n"`
			`"movq %%rax, (%%rbx) \n"`

			`"jnc 2f \n"`

			`"loop 1b \n"`

			`"2: \n"`

			`"movq $0, %%rax \n"`
			`"adcq %%rax,%%rax \n"`

			`"pop %%rdx \n"`
			`"pop %%rcx \n"`
			`"pop %%rbx \n"`

			`: "=a" (c)`
			`: "c" (b), "d" (index), "b" (p1), "q" (x1), "q" (x2)`
			`: "cc", "memory" );`

			`#endif`


			`return c;`
			`}`





			`/*!`
			`this method's subtracting ss2 from the 'this' and subtracting`
			`carry if it has been defined`
			`(this = this - ss2 - c)`

			`c must be zero or one (might be a bigger value than 1)`
			`function returns carry (1) (if it was)`
			`*/`
			`template<uint value_size>`
			`uint UInt<value_size>::Sub(const UInt<value_size> & ss2, uint c)`
			`{`
			`register uint b = value_size;`
			`register uint * p1 = table;`
			`register uint * p2 = const_cast<uint*>(ss2.table);`

			`#ifndef __GNUC__`

			`#error "another compiler than GCC is currently not supported in 64bit mode"`

			`__asm`
			`{`
			`}`

			`#endif`


			`#ifdef __GNUC__`
			`__asm__ __volatile__(`

			`"push %%rbx \n"`
			`"push %%rcx \n"`
			`"push %%rdx \n"`

			`"movq $0, %%rax \n"`
			`"subq %%rsi, %%rax \n"`

			`"1: \n"`
			`"movq (%%rbx),%%rax \n"`
			`"sbbq (%%rdx),%%rax \n"`
			`"movq %%rax,(%%rbx) \n"`

			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`

			`"inc %%rdx \n"`
			`"inc %%rdx \n"`
			`"inc %%rdx \n"`
			`"inc %%rdx \n"`
			`"inc %%rdx \n"`
			`"inc %%rdx \n"`
			`"inc %%rdx \n"`
			`"inc %%rdx \n"`

			`"loop 1b \n"`

			`"movq $0, %%rax \n"`
			`"adcq %%rax,%%rax \n"`
			`"movq %%rax, %%rsi \n"`

			`"pop %%rdx \n"`
			`"pop %%rcx \n"`
			`"pop %%rbx \n"`

			`: "=S" (c)`
			`: "0" (c), "c" (b), "b" (p1), "d" (p2)`
			`: "%rax", "cc", "memory" );`

			`#endif`


			`return c;`
			`}`


			`/*!`
			`this method subtracts one word (at a specific position)`
			`and returns a carry (if it was)`

			`e.g.`

			`if we've got (value_size=3):`
			`table[0] = 10;`
			`table[1] = 30;`
			`table[2] = 5;`
			`and we call:`
			`SubInt(2,1)`
			`then it'll be:`
			`table[0] = 10;`
			`table[1] = 30 - 2;`
			`table[2] = 5;`

			`of course if there was a carry from table[3] it would be returned`
			`*/`
			`template<uint value_size>`
			`uint UInt<value_size>::SubInt(uint value, uint index)`
			`{`
			`register uint b = value_size;`
			`register uint * p1 = table;`
			`register uint c;`

			`#ifndef __GNUC__`

			`#error "another compiler than GCC is currently not supported in 64bit mode"`

			`__asm`
			`{`
			`}`
			`#endif`


			`#ifdef __GNUC__`
			`__asm__ __volatile__(`

			`"push %%rbx \n"`
			`"push %%rcx \n"`
			`"push %%rdx \n"`

			`"subq %%rdx, %%rcx \n"`

			`"leaq (%%rbx,%%rdx,8), %%rbx \n"`

			`"movq %4, %%rdx \n"`
			`"clc \n"`
			`"1: \n"`

			`"movq (%%rbx), %%rax \n"`
			`"sbbq %%rdx, %%rax \n"`
			`"movq %%rax, (%%rbx) \n"`

			`"jnc 2f \n"`

			`"movq $0, %%rdx \n"`

			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`

			`"loop 1b \n"`

			`"2: \n"`

			`"movq $0, %%rax \n"`
			`"adcq %%rax,%%rax \n"`

			`"pop %%rdx \n"`
			`"pop %%rcx \n"`
			`"pop %%rbx \n"`

			`: "=a" (c)`
			`: "c" (b), "d" (index), "b" (p1), "q" (value)`
			`: "cc", "memory" );`

			`#endif`


			`return c;`
			`}`


			`/*!`
			`this method moving once all bits into the left side`
			`return value <- this <- C`

			`the lowest bit will hold value of 'c' and`
			`function returns the highest bit`
			`*/`
			`template<uint value_size>`
			`uint UInt<value_size>::Rcl(uint c)`
			`{`
			`register sint b = value_size;`
			`register uint * p1 = table;`


			`#ifndef __GNUC__`

			`#error "another compiler than GCC is currently not supported in 64bit mode"`

			`__asm`
			`{`
			`}`
			`#endif`


			`#ifdef __GNUC__`
			`__asm__ __volatile__(`

			`"push %%rbx \n"`
			`"push %%rcx \n"`

			`"movq $0,%%rax \n"`
			`"subq %%rdx,%%rax \n"`

			`"1: \n"`
			`"rclq $1,(%%rbx) \n"`

			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`
			`"inc %%rbx \n"`

			`"loop 1b \n"`

			`"movq $0, %%rdx \n"`
			`"adcq %%rdx,%%rdx \n"`

			`"pop %%rcx \n"`
			`"pop %%rbx \n"`

			`: "=d" (c)`
			`: "0" (c), "c" (b), "b" (p1)`
			`: "%rax", "cc", "memory" );`

			`#endif`


			`return c;`
			`}`


			`/*!`
			`this method moving once all bits into the right side`
			`C -> *this -> return value`

			`the highest bit will be held value of 'c' and`
			`function returns the lowest bit`
			`*/`
			`template<uint value_size>`
			`uint UInt<value_size>::Rcr(uint c)`
			`{`
			`register sint b = value_size;`
			`register uint * p1 = table;`


			`#ifndef __GNUC__`

			`#error "another compiler than GCC is currently not supported in 64bit mode"`

			`__asm`
			`{`
			`}`
			`#endif`


			`#ifdef __GNUC__`
			`__asm__ __volatile__(`

			`"push %%rbx \n"`
			`"push %%rcx \n"`

			`"leaq (%%rbx,%%rcx,8),%%rbx \n"`

			`"movq $0, %%rax \n"`
			`"subq %%rdx, %%rax \n"`

			`"1: \n"`
			`"dec %%rbx \n"`
			`"dec %%rbx \n"`
			`"dec %%rbx \n"`
			`"dec %%rbx \n"`
			`"dec %%rbx \n"`
			`"dec %%rbx \n"`
			`"dec %%rbx \n"`
			`"dec %%rbx \n"`

			`"rcrq $1,(%%rbx) \n"`

			`"loop 1b \n"`

			`"movq $0, %%rdx \n"`
			`"adcq %%rdx,%%rdx \n"`

			`"pop %%rcx \n"`
			`"pop %%rbx \n"`

			`: "=d" (c)`
			`: "0" (c), "c" (b), "b" (p1)`
			`: "%rax", "cc", "memory" );`

			`#endif`


			`return c;`
			`}`


			`/*`
			`this method returns the number of the highest set bit in one 32-bit word`
			`if the 'x' is zero this method returns '-1'`
			`*/`
			`template<uint value_size>`
			`sint UInt<value_size>::FindLeadingBitInWord(uint x)`
			`{`
			`register sint result;`

			`#ifndef __GNUC__`

			`#error "another compiler than GCC is currently not supported in 64bit mode"`

			`__asm`
			`{`
			`}`
			`#endif`


			`#ifdef __GNUC__`
			`__asm__ __volatile__(`


			`"bsrq %%rbx, %%rax \n"`
			`"jnz 1f \n"`
			`"movq $-1, %%rax \n"`
			`"1: \n"`

			`: "=a" (result)`
			`: "b" (x)`
			`: "cc" );`

			`#endif`


			`return result;`
			`}`


			`/*!`
			`this method sets a special bit in the 'value'`
			`and returns the result`

			`bit is from <0,31>`

			`e.g.`
			`SetBitInWord(0,0) = 1`
			`SetBitInWord(0,2) = 4`
			`SetBitInWord(10, 8) = 266`
			`*/`
			`template<uint value_size>`
			`uint UInt<value_size>::SetBitInWord(uint value, uint bit)`
			`{`
			`#ifndef __GNUC__`

			`#error "another compiler than GCC is currently not supported in 64bit mode"`

			`__asm`
			`{`
			`}`
			`#endif`


			`#ifdef __GNUC__`
			`__asm__ __volatile__(`

			`"btsq %%rbx,%%rax \n"`

			`: "=a" (value)`
			`: "0" (value), "b" (bit)`
			`: "cc" );`

			`#endif`

			`return value;`
			`}`


			`/*!`
			`*`
			`* Multiplication`
			`*`
			`*`
			`*/`


			`/*!`
			`multiplication: result2:result1 = a * b`
			`result2 - higher word`
			`result1 - lower word of the result`

			`this methos never returns a carry`

			`it is an auxiliary method for version two of the multiplication algorithm`
			`*/`
			`template<uint value_size>`
			`void UInt<value_size>::MulTwoWords(uint a, uint b, uint * result2, uint * result1)`
			`{`
			`/*`
			`we must use these temporary variables in order to inform the compilator`
			`that value pointed with result1 and result2 has changed`

			`this has no effect in visual studio but it's usefull when`
			`using gcc and options like -O`
			`*/`
			`register uint result1_;`
			`register uint result2_;`

			`#ifndef __GNUC__`

			`#error "another compiler than GCC is currently not supported in 64bit mode"`

			`__asm`
			`{`
			`}`

			`#endif`


			`#ifdef __GNUC__`

			`asm __volatile__(`

			`"mulq %%rdx \n"`

			`: "=a" (result1_), "=d" (result2_)`
			`: "0" (a), "1" (b)`
			`: "cc" );`

			`#endif`


			`*result1 = result1_;`
			`*result2 = result2_;`
			`}`




			`/*!`
			`*`
			`* Division`
			`*`
			`*`
			`*/`


			`/*!`
			`this method calculates 64bits word a:b / 32bits c (a higher, b lower word)`
			`r = a:b / c and rest - remainder`

			`*`
			`* WARNING:`
			`* if r (one word) is too small for the result or c is equal zero`
			`* there'll be a hardware interruption (0)`
			`* and probably the end of your program`
			`*`
			`*/`
			`template<uint value_size>`
			`void UInt<value_size>::DivTwoWords(uint a,uint b, uint c, uint * r, uint * rest)`
			`{`
			`register uint r_;`
			`register uint rest_;`
			`/*`
			`these variables have similar meaning like those in`
			`the multiplication algorithm MulTwoWords`
			`*/`

			`#ifndef __GNUC__`

			`#error "another compiler than GCC is currently not supported in 64bit mode"`

			`__asm`
			`{`
			`}`
			`#endif`


			`#ifdef __GNUC__`

			`__asm__ __volatile__(`

			`"divq %%rcx \n"`

			`: "=a" (r_), "=d" (rest_)`
			`: "d" (a), "a" (b), "c" (c)`
			`: "cc" );`

			`#endif`


			`*r = r_;`
			`*rest = rest_;`
			`}`

			`#endif`

			`} //namespace`