mirror of
https://github.com/rn10950/RetroZilla.git
synced 2024-11-09 09:20:15 +01:00
142 lines
3.7 KiB
Plaintext
142 lines
3.7 KiB
Plaintext
!
|
|
! ***** BEGIN LICENSE BLOCK *****
|
|
! Version: MPL 1.1/GPL 2.0/LGPL 2.1
|
|
!
|
|
! The contents of this file are subject to the Mozilla Public License Version
|
|
! 1.1 (the "License"); you may not use this file except in compliance with
|
|
! the License. You may obtain a copy of the License at
|
|
! http://www.mozilla.org/MPL/
|
|
!
|
|
! Software distributed under the License is distributed on an "AS IS" basis,
|
|
! WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
|
|
! for the specific language governing rights and limitations under the
|
|
! License.
|
|
!
|
|
! The Original Code is inline macros for SPARC Montgomery multiply functions.
|
|
!
|
|
! The Initial Developer of the Original Code is
|
|
! Sun Microsystems Inc.
|
|
! Portions created by the Initial Developer are Copyright (C) 1999-2000
|
|
! the Initial Developer. All Rights Reserved.
|
|
!
|
|
! Contributor(s):
|
|
!
|
|
! Alternatively, the contents of this file may be used under the terms of
|
|
! either the GNU General Public License Version 2 or later (the "GPL"), or
|
|
! the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
|
|
! in which case the provisions of the GPL or the LGPL are applicable instead
|
|
! of those above. If you wish to allow use of your version of this file only
|
|
! under the terms of either the GPL or the LGPL, and not to allow others to
|
|
! use your version of this file under the terms of the MPL, indicate your
|
|
! decision by deleting the provisions above and replace them with the notice
|
|
! and other provisions required by the GPL or the LGPL. If you do not delete
|
|
! the provisions above, a recipient may use your version of this file under
|
|
! the terms of any one of the MPL, the GPL or the LGPL.
|
|
!
|
|
! ***** END LICENSE BLOCK *****
|
|
! $Id: montmulf.il,v 1.4 2004/04/27 23:04:36 gerv%gerv.net Exp $
|
|
|
|
!
|
|
! double upper32(double /*frs1*/);
|
|
!
|
|
.inline upper32,8
|
|
std %o0,[%sp+0x48]
|
|
ldd [%sp+0x48],%f10
|
|
|
|
fdtox %f10,%f10
|
|
fitod %f10,%f0
|
|
.end
|
|
|
|
!
|
|
! double lower32(double /*frs1*/, double /* Zero */);
|
|
!
|
|
.inline lower32,8
|
|
std %o0,[%sp+0x48]
|
|
ldd [%sp+0x48],%f10
|
|
std %o2,[%sp+0x48]
|
|
ldd [%sp+0x48],%f12
|
|
|
|
fdtox %f10,%f10
|
|
fmovs %f12,%f10
|
|
fxtod %f10,%f0
|
|
.end
|
|
|
|
!
|
|
! double mod(double /*x*/, double /*1/m*/, double /*m*/);
|
|
!
|
|
.inline mod,12
|
|
std %o0,[%sp+0x48]
|
|
ldd [%sp+0x48],%f2
|
|
std %o2,[%sp+0x48]
|
|
ldd [%sp+0x48],%f4
|
|
std %o4,[%sp+0x48]
|
|
ldd [%sp+0x48],%f6
|
|
|
|
fmuld %f2,%f4,%f4
|
|
fdtox %f4,%f4
|
|
fxtod %f4,%f4
|
|
fmuld %f4,%f6,%f4
|
|
fsubd %f2,%f4,%f0
|
|
.end
|
|
|
|
|
|
!
|
|
! void i16_to_d16_and_d32x4(double * /*1/(2^16)*/, double * /* 2^16*/,
|
|
! double * /* 0 */,
|
|
! double * /*result16*/, double * /* result32 */
|
|
! float * /*source - should be unsigned int*
|
|
! converted to float* */);
|
|
!
|
|
.inline i16_to_d16_and_d32x4,24
|
|
ldd [%o0],%f2 ! 1/(2^16)
|
|
ldd [%o1],%f4 ! 2^16
|
|
ldd [%o2],%f22
|
|
|
|
fmovd %f22,%f6
|
|
ld [%o5],%f7
|
|
fmovd %f22,%f10
|
|
ld [%o5+4],%f11
|
|
fmovd %f22,%f14
|
|
ld [%o5+8],%f15
|
|
fmovd %f22,%f18
|
|
ld [%o5+12],%f19
|
|
fxtod %f6,%f6
|
|
std %f6,[%o4]
|
|
fxtod %f10,%f10
|
|
std %f10,[%o4+8]
|
|
fxtod %f14,%f14
|
|
std %f14,[%o4+16]
|
|
fxtod %f18,%f18
|
|
std %f18,[%o4+24]
|
|
fmuld %f2,%f6,%f8
|
|
fmuld %f2,%f10,%f12
|
|
fmuld %f2,%f14,%f16
|
|
fmuld %f2,%f18,%f20
|
|
fdtox %f8,%f8
|
|
fdtox %f12,%f12
|
|
fdtox %f16,%f16
|
|
fdtox %f20,%f20
|
|
fxtod %f8,%f8
|
|
std %f8,[%o3+8]
|
|
fxtod %f12,%f12
|
|
std %f12,[%o3+24]
|
|
fxtod %f16,%f16
|
|
std %f16,[%o3+40]
|
|
fxtod %f20,%f20
|
|
std %f20,[%o3+56]
|
|
fmuld %f8,%f4,%f8
|
|
fmuld %f12,%f4,%f12
|
|
fmuld %f16,%f4,%f16
|
|
fmuld %f20,%f4,%f20
|
|
fsubd %f6,%f8,%f8
|
|
std %f8,[%o3]
|
|
fsubd %f10,%f12,%f12
|
|
std %f12,[%o3+16]
|
|
fsubd %f14,%f16,%f16
|
|
std %f16,[%o3+32]
|
|
fsubd %f18,%f20,%f20
|
|
std %f20,[%o3+48]
|
|
.end
|
|
|
|
|