Tizen 2.1 base
[external/gmp.git] / mpn / pa32 / hppa1_1 / pa7100 / lshift.asm
1 dnl  HP-PA  mpn_lshift -- Shift a number left.
2 dnl  Optimized for the PA7100, where is runs at 3.25 cycles/limb.
3
4 dnl  Copyright 1992, 1994, 2000, 2001, 2002, 2003 Free Software Foundation,
5 dnl  Inc.
6
7 dnl  This file is part of the GNU MP Library.
8
9 dnl  The GNU MP Library is free software; you can redistribute it and/or modify
10 dnl  it under the terms of the GNU Lesser General Public License as published
11 dnl  by the Free Software Foundation; either version 3 of the License, or (at
12 dnl  your option) any later version.
13
14 dnl  The GNU MP Library is distributed in the hope that it will be useful, but
15 dnl  WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
16 dnl  or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
17 dnl  License for more details.
18
19 dnl  You should have received a copy of the GNU Lesser General Public License
20 dnl  along with the GNU MP Library.  If not, see http://www.gnu.org/licenses/.
21
22 include(`../config.m4')
23
24 C INPUT PARAMETERS
25 C res_ptr       r26
26 C s_ptr         r25
27 C size          r24
28 C cnt           r23
29
30 ASM_START()
31 PROLOGUE(mpn_lshift)
32         sh2add          %r24,%r25,%r25
33         sh2add          %r24,%r26,%r26
34         ldws,mb         -4(0,%r25),%r22
35         subi            32,%r23,%r1
36         mtsar           %r1
37         addib,=         -1,%r24,L(0004)
38         vshd            %r0,%r22,%r28           C compute carry out limb
39         ldws,mb         -4(0,%r25),%r29
40         addib,<=        -5,%r24,L(rest)
41         vshd            %r22,%r29,%r20
42
43 LDEF(loop)
44         ldws,mb         -4(0,%r25),%r22
45         stws,mb         %r20,-4(0,%r26)
46         vshd            %r29,%r22,%r20
47         ldws,mb         -4(0,%r25),%r29
48         stws,mb         %r20,-4(0,%r26)
49         vshd            %r22,%r29,%r20
50         ldws,mb         -4(0,%r25),%r22
51         stws,mb         %r20,-4(0,%r26)
52         vshd            %r29,%r22,%r20
53         ldws,mb         -4(0,%r25),%r29
54         stws,mb         %r20,-4(0,%r26)
55         addib,>         -4,%r24,L(loop)
56         vshd            %r22,%r29,%r20
57
58 LDEF(rest)
59         addib,=         4,%r24,L(end1)
60         nop
61
62 LDEF(eloop)
63         ldws,mb         -4(0,%r25),%r22
64         stws,mb         %r20,-4(0,%r26)
65         addib,<=        -1,%r24,L(end2)
66         vshd            %r29,%r22,%r20
67         ldws,mb         -4(0,%r25),%r29
68         stws,mb         %r20,-4(0,%r26)
69         addib,>         -1,%r24,L(eloop)
70         vshd            %r22,%r29,%r20
71
72 LDEF(end1)
73         stws,mb         %r20,-4(0,%r26)
74         vshd            %r29,%r0,%r20
75         bv              0(%r2)
76         stw             %r20,-4(0,%r26)
77
78 LDEF(end2)
79         stws,mb         %r20,-4(0,%r26)
80
81 LDEF(0004)
82         vshd            %r22,%r0,%r20
83         bv              0(%r2)
84         stw             %r20,-4(0,%r26)
85 EPILOGUE()