~ [ source navigation ] ~ [ diff markup ] ~ [ identifier search ] ~

TOMOYO Linux Cross Reference
Linux/arch/alpha/lib/memset.S

Version: ~ [ linux-6.12-rc7 ] ~ [ linux-6.11.7 ] ~ [ linux-6.10.14 ] ~ [ linux-6.9.12 ] ~ [ linux-6.8.12 ] ~ [ linux-6.7.12 ] ~ [ linux-6.6.60 ] ~ [ linux-6.5.13 ] ~ [ linux-6.4.16 ] ~ [ linux-6.3.13 ] ~ [ linux-6.2.16 ] ~ [ linux-6.1.116 ] ~ [ linux-6.0.19 ] ~ [ linux-5.19.17 ] ~ [ linux-5.18.19 ] ~ [ linux-5.17.15 ] ~ [ linux-5.16.20 ] ~ [ linux-5.15.171 ] ~ [ linux-5.14.21 ] ~ [ linux-5.13.19 ] ~ [ linux-5.12.19 ] ~ [ linux-5.11.22 ] ~ [ linux-5.10.229 ] ~ [ linux-5.9.16 ] ~ [ linux-5.8.18 ] ~ [ linux-5.7.19 ] ~ [ linux-5.6.19 ] ~ [ linux-5.5.19 ] ~ [ linux-5.4.285 ] ~ [ linux-5.3.18 ] ~ [ linux-5.2.21 ] ~ [ linux-5.1.21 ] ~ [ linux-5.0.21 ] ~ [ linux-4.20.17 ] ~ [ linux-4.19.323 ] ~ [ linux-4.18.20 ] ~ [ linux-4.17.19 ] ~ [ linux-4.16.18 ] ~ [ linux-4.15.18 ] ~ [ linux-4.14.336 ] ~ [ linux-4.13.16 ] ~ [ linux-4.12.14 ] ~ [ linux-4.11.12 ] ~ [ linux-4.10.17 ] ~ [ linux-4.9.337 ] ~ [ linux-4.4.302 ] ~ [ linux-3.10.108 ] ~ [ linux-2.6.32.71 ] ~ [ linux-2.6.0 ] ~ [ linux-2.4.37.11 ] ~ [ unix-v6-master ] ~ [ ccs-tools-1.8.12 ] ~ [ policy-sample ] ~
Architecture: ~ [ i386 ] ~ [ alpha ] ~ [ m68k ] ~ [ mips ] ~ [ ppc ] ~ [ sparc ] ~ [ sparc64 ] ~

Diff markup

Differences between /arch/alpha/lib/memset.S (Version linux-6.12-rc7) and /arch/sparc/lib/memset.S (Version linux-4.20.17)


  1 /* SPDX-License-Identifier: GPL-2.0 */              1 /* SPDX-License-Identifier: GPL-2.0 */
  2 /*                                             !!   2 /* linux/arch/sparc/lib/memset.S: Sparc optimized memset, bzero and clear_user code
  3  * linux/arch/alpha/lib/memset.S               !!   3  * Copyright (C) 1991,1996 Free Software Foundation
                                                   >>   4  * Copyright (C) 1996,1997 Jakub Jelinek (jj@sunsite.mff.cuni.cz)
                                                   >>   5  * Copyright (C) 1996 David S. Miller (davem@caip.rutgers.edu)
  4  *                                                  6  *
  5  * This is an efficient (and small) implementa !!   7  * Calls to memset return the initial %o0. Calls to bzero return 0 if ok, and
  6  * function for the alpha.                     !!   8  * number of bytes not yet set if exception occurs and we were called as
  7  *                                             !!   9  * clear_user.
  8  *      (C) Copyright 1996 Linus Torvalds      << 
  9  *                                             << 
 10  * This routine is "moral-ware": you are free  << 
 11  * the only obligation I put on you is a moral << 
 12  * to the routine, please send me your improve << 
 13  *                                             << 
 14  * The scheduling comments are according to th << 
 15  * hand, so they might well be incorrect, plea << 
 16  */                                                10  */
 17 #include <linux/export.h>                      << 
 18         .set noat                              << 
 19         .set noreorder                         << 
 20 .text                                          << 
 21         .globl memset                          << 
 22         .globl __memset                        << 
 23         .globl ___memset                       << 
 24         .globl __memset16                      << 
 25         .globl __constant_c_memset             << 
 26                                                << 
 27         .ent ___memset                         << 
 28 .align 5                                       << 
 29 ___memset:                                     << 
 30         .frame $30,0,$26,0                     << 
 31         .prologue 0                            << 
 32                                                << 
 33         and $17,255,$1          /* E1 */       << 
 34         insbl $17,1,$17         /* .. E0 */    << 
 35         bis $17,$1,$17          /* E0 (p-c lat << 
 36         sll $17,16,$1           /* E1 (p-c lat << 
 37                                                << 
 38         bis $17,$1,$17          /* E0 (p-c lat << 
 39         sll $17,32,$1           /* E1 (p-c lat << 
 40         bis $17,$1,$17          /* E0 (p-c lat << 
 41         ldq_u $31,0($30)        /* .. E1 */    << 
 42                                                << 
 43 .align 5                                       << 
 44 __constant_c_memset:                           << 
 45         addq $18,$16,$6         /* E0 */       << 
 46         bis $16,$16,$0          /* .. E1 */    << 
 47         xor $16,$6,$1           /* E0 */       << 
 48         ble $18,end             /* .. E1 */    << 
 49                                                << 
 50         bic $1,7,$1             /* E0 */       << 
 51         beq $1,within_one_quad  /* .. E1 (note << 
 52         and $16,7,$3            /* E0 */       << 
 53         beq $3,aligned          /* .. E1 (note << 
 54                                                << 
 55         ldq_u $4,0($16)         /* E0 */       << 
 56         bis $16,$16,$5          /* .. E1 */    << 
 57         insql $17,$16,$2        /* E0 */       << 
 58         subq $3,8,$3            /* .. E1 */    << 
 59                                                << 
 60         addq $18,$3,$18         /* E0   $18 is << 
 61         mskql $4,$16,$4         /* .. E1 (and  << 
 62         subq $16,$3,$16         /* E0   $16 is << 
 63         bis $2,$4,$1            /* .. E1 */    << 
 64                                                << 
 65         bis $31,$31,$31         /* E0 */       << 
 66         ldq_u $31,0($30)        /* .. E1 */    << 
 67         stq_u $1,0($5)          /* E0 */       << 
 68         bis $31,$31,$31         /* .. E1 */    << 
 69                                                << 
 70 .align 4                                       << 
 71 aligned:                                       << 
 72         sra $18,3,$3            /* E0 */       << 
 73         and $18,7,$18           /* .. E1 */    << 
 74         bis $16,$16,$5          /* E0 */       << 
 75         beq $3,no_quad          /* .. E1 */    << 
 76                                                << 
 77 .align 3                                       << 
 78 loop:                                          << 
 79         stq $17,0($5)           /* E0 */       << 
 80         subq $3,1,$3            /* .. E1 */    << 
 81         addq $5,8,$5            /* E0 */       << 
 82         bne $3,loop             /* .. E1 */    << 
 83                                                << 
 84 no_quad:                                       << 
 85         bis $31,$31,$31         /* E0 */       << 
 86         beq $18,end             /* .. E1 */    << 
 87         ldq $7,0($5)            /* E0 */       << 
 88         mskqh $7,$6,$2          /* .. E1 (and  << 
 89                                                << 
 90         insqh $17,$6,$4         /* E0 */       << 
 91         bis $2,$4,$1            /* .. E1 */    << 
 92         stq $1,0($5)            /* E0 */       << 
 93         ret $31,($26),1         /* .. E1 */    << 
 94                                                << 
 95 .align 3                                       << 
 96 within_one_quad:                               << 
 97         ldq_u $1,0($16)         /* E0 */       << 
 98         insql $17,$16,$2        /* E1 */       << 
 99         mskql $1,$16,$4         /* E0 (after l << 
100         bis $2,$4,$2            /* E0 */       << 
101                                                << 
102         mskql $2,$6,$4          /* E0 */       << 
103         mskqh $1,$6,$2          /* .. E1 */    << 
104         bis $2,$4,$1            /* E0 */       << 
105         stq_u $1,0($16)         /* E0 */       << 
106                                                << 
107 end:                                           << 
108         ret $31,($26),1         /* E1 */       << 
109         .end ___memset                         << 
110 EXPORT_SYMBOL(___memset)                       << 
111 EXPORT_SYMBOL(__constant_c_memset)             << 
112                                                << 
113         .align 5                               << 
114         .ent __memset16                        << 
115 __memset16:                                    << 
116         .prologue 0                            << 
117                                                << 
118         inswl $17,0,$1          /* E0 */       << 
119         inswl $17,2,$2          /* E0 */       << 
120         inswl $17,4,$3          /* E0 */       << 
121         or $1,$2,$1             /* .. E1 */    << 
122         inswl $17,6,$4          /* E0 */       << 
123         or $1,$3,$1             /* .. E1 */    << 
124         or $1,$4,$17            /* E0 */       << 
125         br __constant_c_memset  /* .. E1 */    << 
126                                                    11 
127         .end __memset16                        !!  12 #include <asm/ptrace.h>
128 EXPORT_SYMBOL(__memset16)                      !!  13 #include <asm/export.h>
129                                                    14 
130 memset = ___memset                             !!  15 /* Work around cpp -rob */
131 __memset = ___memset                           !!  16 #define ALLOC #alloc
                                                   >>  17 #define EXECINSTR #execinstr
                                                   >>  18 #define EX(x,y,a,b)                             \
                                                   >>  19 98:     x,y;                                    \
                                                   >>  20         .section .fixup,ALLOC,EXECINSTR;        \
                                                   >>  21         .align  4;                              \
                                                   >>  22 99:     ba 30f;                                 \
                                                   >>  23          a, b, %o0;                             \
                                                   >>  24         .section __ex_table,ALLOC;              \
                                                   >>  25         .align  4;                              \
                                                   >>  26         .word   98b, 99b;                       \
                                                   >>  27         .text;                                  \
                                                   >>  28         .align  4
                                                   >>  29 
                                                   >>  30 #define EXT(start,end,handler)                  \
                                                   >>  31         .section __ex_table,ALLOC;              \
                                                   >>  32         .align  4;                              \
                                                   >>  33         .word   start, 0, end, handler;         \
                                                   >>  34         .text;                                  \
                                                   >>  35         .align  4
                                                   >>  36 
                                                   >>  37 /* Please don't change these macros, unless you change the logic
                                                   >>  38  * in the .fixup section below as well.
                                                   >>  39  * Store 64 bytes at (BASE + OFFSET) using value SOURCE. */
                                                   >>  40 #define ZERO_BIG_BLOCK(base, offset, source)    \
                                                   >>  41         std     source, [base + offset + 0x00]; \
                                                   >>  42         std     source, [base + offset + 0x08]; \
                                                   >>  43         std     source, [base + offset + 0x10]; \
                                                   >>  44         std     source, [base + offset + 0x18]; \
                                                   >>  45         std     source, [base + offset + 0x20]; \
                                                   >>  46         std     source, [base + offset + 0x28]; \
                                                   >>  47         std     source, [base + offset + 0x30]; \
                                                   >>  48         std     source, [base + offset + 0x38];
                                                   >>  49 
                                                   >>  50 #define ZERO_LAST_BLOCKS(base, offset, source)  \
                                                   >>  51         std     source, [base - offset - 0x38]; \
                                                   >>  52         std     source, [base - offset - 0x30]; \
                                                   >>  53         std     source, [base - offset - 0x28]; \
                                                   >>  54         std     source, [base - offset - 0x20]; \
                                                   >>  55         std     source, [base - offset - 0x18]; \
                                                   >>  56         std     source, [base - offset - 0x10]; \
                                                   >>  57         std     source, [base - offset - 0x08]; \
                                                   >>  58         std     source, [base - offset - 0x00];
                                                   >>  59 
                                                   >>  60         .text
                                                   >>  61         .align 4
                                                   >>  62 
                                                   >>  63         .globl  __bzero_begin
                                                   >>  64 __bzero_begin:
                                                   >>  65 
                                                   >>  66         .globl  __bzero
                                                   >>  67         .type   __bzero,#function
                                                   >>  68         .globl  memset
                                                   >>  69         EXPORT_SYMBOL(__bzero)
132         EXPORT_SYMBOL(memset)                      70         EXPORT_SYMBOL(memset)
133         EXPORT_SYMBOL(__memset)                !!  71         .globl  __memset_start, __memset_end
                                                   >>  72 __memset_start:
                                                   >>  73 memset:
                                                   >>  74         mov     %o0, %g1
                                                   >>  75         mov     1, %g4
                                                   >>  76         and     %o1, 0xff, %g3
                                                   >>  77         sll     %g3, 8, %g2
                                                   >>  78         or      %g3, %g2, %g3
                                                   >>  79         sll     %g3, 16, %g2
                                                   >>  80         or      %g3, %g2, %g3
                                                   >>  81         b       1f
                                                   >>  82          mov    %o2, %o1
                                                   >>  83 3:
                                                   >>  84         cmp     %o2, 3
                                                   >>  85         be      2f
                                                   >>  86          EX(stb %g3, [%o0], sub %o1, 0)
                                                   >>  87 
                                                   >>  88         cmp     %o2, 2
                                                   >>  89         be      2f
                                                   >>  90          EX(stb %g3, [%o0 + 0x01], sub %o1, 1)
                                                   >>  91 
                                                   >>  92         EX(stb  %g3, [%o0 + 0x02], sub %o1, 2)
                                                   >>  93 2:
                                                   >>  94         sub     %o2, 4, %o2
                                                   >>  95         add     %o1, %o2, %o1
                                                   >>  96         b       4f
                                                   >>  97          sub    %o0, %o2, %o0
                                                   >>  98 
                                                   >>  99 __bzero:
                                                   >> 100         clr     %g4
                                                   >> 101         mov     %g0, %g3
                                                   >> 102 1:
                                                   >> 103         cmp     %o1, 7
                                                   >> 104         bleu    7f
                                                   >> 105          andcc  %o0, 3, %o2
                                                   >> 106 
                                                   >> 107         bne     3b
                                                   >> 108 4:
                                                   >> 109          andcc  %o0, 4, %g0
                                                   >> 110 
                                                   >> 111         be      2f
                                                   >> 112          mov    %g3, %g2
                                                   >> 113 
                                                   >> 114         EX(st   %g3, [%o0], sub %o1, 0)
                                                   >> 115         sub     %o1, 4, %o1
                                                   >> 116         add     %o0, 4, %o0
                                                   >> 117 2:
                                                   >> 118         andcc   %o1, 0xffffff80, %o3    ! Now everything is 8 aligned and o1 is len to run
                                                   >> 119         be      9f
                                                   >> 120          andcc  %o1, 0x78, %o2
                                                   >> 121 10:
                                                   >> 122         ZERO_BIG_BLOCK(%o0, 0x00, %g2)
                                                   >> 123         subcc   %o3, 128, %o3
                                                   >> 124         ZERO_BIG_BLOCK(%o0, 0x40, %g2)
                                                   >> 125 11:
                                                   >> 126         EXT(10b, 11b, 20f)
                                                   >> 127         bne     10b
                                                   >> 128          add    %o0, 128, %o0
                                                   >> 129 
                                                   >> 130         orcc    %o2, %g0, %g0
                                                   >> 131 9:
                                                   >> 132         be      13f
                                                   >> 133          andcc  %o1, 7, %o1
                                                   >> 134 
                                                   >> 135         srl     %o2, 1, %o3
                                                   >> 136         set     13f, %o4
                                                   >> 137         sub     %o4, %o3, %o4
                                                   >> 138         jmp     %o4
                                                   >> 139          add    %o0, %o2, %o0
                                                   >> 140 
                                                   >> 141 12:
                                                   >> 142         ZERO_LAST_BLOCKS(%o0, 0x48, %g2)
                                                   >> 143         ZERO_LAST_BLOCKS(%o0, 0x08, %g2)
                                                   >> 144 13:
                                                   >> 145         be      8f
                                                   >> 146          andcc  %o1, 4, %g0
                                                   >> 147 
                                                   >> 148         be      1f
                                                   >> 149          andcc  %o1, 2, %g0
                                                   >> 150 
                                                   >> 151         EX(st   %g3, [%o0], and %o1, 7)
                                                   >> 152         add     %o0, 4, %o0
                                                   >> 153 1:
                                                   >> 154         be      1f
                                                   >> 155          andcc  %o1, 1, %g0
                                                   >> 156 
                                                   >> 157         EX(sth  %g3, [%o0], and %o1, 3)
                                                   >> 158         add     %o0, 2, %o0
                                                   >> 159 1:
                                                   >> 160         bne,a   8f
                                                   >> 161          EX(stb %g3, [%o0], and %o1, 1)
                                                   >> 162 8:
                                                   >> 163         b       0f
                                                   >> 164          nop
                                                   >> 165 7:
                                                   >> 166         be      13b
                                                   >> 167          orcc   %o1, 0, %g0
                                                   >> 168 
                                                   >> 169         be      0f
                                                   >> 170 8:
                                                   >> 171          add    %o0, 1, %o0
                                                   >> 172         subcc   %o1, 1, %o1
                                                   >> 173         bne     8b
                                                   >> 174          EX(stb %g3, [%o0 - 1], add %o1, 1)
                                                   >> 175 0:
                                                   >> 176         andcc   %g4, 1, %g0
                                                   >> 177         be      5f
                                                   >> 178          nop
                                                   >> 179         retl
                                                   >> 180          mov    %g1, %o0
                                                   >> 181 5:
                                                   >> 182         retl
                                                   >> 183          clr    %o0
                                                   >> 184 __memset_end:
                                                   >> 185 
                                                   >> 186         .section .fixup,#alloc,#execinstr
                                                   >> 187         .align  4
                                                   >> 188 20:
                                                   >> 189         cmp     %g2, 8
                                                   >> 190         bleu    1f
                                                   >> 191          and    %o1, 0x7f, %o1
                                                   >> 192         sub     %g2, 9, %g2
                                                   >> 193         add     %o3, 64, %o3
                                                   >> 194 1:
                                                   >> 195         sll     %g2, 3, %g2
                                                   >> 196         add     %o3, %o1, %o0
                                                   >> 197         b 30f
                                                   >> 198          sub    %o0, %g2, %o0
                                                   >> 199 21:
                                                   >> 200         mov     8, %o0
                                                   >> 201         and     %o1, 7, %o1
                                                   >> 202         sub     %o0, %g2, %o0
                                                   >> 203         sll     %o0, 3, %o0
                                                   >> 204         b 30f
                                                   >> 205          add    %o0, %o1, %o0
                                                   >> 206 30:
                                                   >> 207 /* %o4 is faulting address, %o5 is %pc where fault occurred */
                                                   >> 208         save    %sp, -104, %sp
                                                   >> 209         mov     %i5, %o0
                                                   >> 210         mov     %i7, %o1
                                                   >> 211         call    lookup_fault
                                                   >> 212          mov    %i4, %o2
                                                   >> 213         ret
                                                   >> 214          restore
                                                   >> 215 
                                                   >> 216         .globl __bzero_end
                                                   >> 217 __bzero_end:
                                                      

~ [ source navigation ] ~ [ diff markup ] ~ [ identifier search ] ~

kernel.org | git.kernel.org | LWN.net | Project Home | SVN repository | Mail admin

Linux® is a registered trademark of Linus Torvalds in the United States and other countries.
TOMOYO® is a registered trademark of NTT DATA CORPORATION.

sflogo.php