~ [ source navigation ] ~ [ diff markup ] ~ [ identifier search ] ~

TOMOYO Linux Cross Reference
Linux/arch/powerpc/crypto/sha1-spe-asm.S

Version: ~ [ linux-6.12-rc7 ] ~ [ linux-6.11.7 ] ~ [ linux-6.10.14 ] ~ [ linux-6.9.12 ] ~ [ linux-6.8.12 ] ~ [ linux-6.7.12 ] ~ [ linux-6.6.60 ] ~ [ linux-6.5.13 ] ~ [ linux-6.4.16 ] ~ [ linux-6.3.13 ] ~ [ linux-6.2.16 ] ~ [ linux-6.1.116 ] ~ [ linux-6.0.19 ] ~ [ linux-5.19.17 ] ~ [ linux-5.18.19 ] ~ [ linux-5.17.15 ] ~ [ linux-5.16.20 ] ~ [ linux-5.15.171 ] ~ [ linux-5.14.21 ] ~ [ linux-5.13.19 ] ~ [ linux-5.12.19 ] ~ [ linux-5.11.22 ] ~ [ linux-5.10.229 ] ~ [ linux-5.9.16 ] ~ [ linux-5.8.18 ] ~ [ linux-5.7.19 ] ~ [ linux-5.6.19 ] ~ [ linux-5.5.19 ] ~ [ linux-5.4.285 ] ~ [ linux-5.3.18 ] ~ [ linux-5.2.21 ] ~ [ linux-5.1.21 ] ~ [ linux-5.0.21 ] ~ [ linux-4.20.17 ] ~ [ linux-4.19.323 ] ~ [ linux-4.18.20 ] ~ [ linux-4.17.19 ] ~ [ linux-4.16.18 ] ~ [ linux-4.15.18 ] ~ [ linux-4.14.336 ] ~ [ linux-4.13.16 ] ~ [ linux-4.12.14 ] ~ [ linux-4.11.12 ] ~ [ linux-4.10.17 ] ~ [ linux-4.9.337 ] ~ [ linux-4.4.302 ] ~ [ linux-3.10.108 ] ~ [ linux-2.6.32.71 ] ~ [ linux-2.6.0 ] ~ [ linux-2.4.37.11 ] ~ [ unix-v6-master ] ~ [ ccs-tools-1.8.12 ] ~ [ policy-sample ] ~
Architecture: ~ [ i386 ] ~ [ alpha ] ~ [ m68k ] ~ [ mips ] ~ [ ppc ] ~ [ sparc ] ~ [ sparc64 ] ~

Diff markup

Differences between /arch/powerpc/crypto/sha1-spe-asm.S (Version linux-6.12-rc7) and /arch/i386/crypto/sha1-spe-asm.S (Version linux-5.9.16)


  1 /* SPDX-License-Identifier: GPL-2.0-or-later */
  2 /*                                                
  3  * Fast SHA-1 implementation for SPE instruction set (PPC)
  4  *                                                
  5  * This code makes use of the SPE SIMD instruction set as defined in
  6  * http://cache.freescale.com/files/32bit/doc/ref_manual/SPEPIM.pdf
  7  * Implementation is based on optimization guide notes from
  8  * http://cache.freescale.com/files/32bit/doc/app_note/AN2665.pdf
  9  *                                                
 10  * Copyright (c) 2015 Markus Stockhausen <stock    
 11  */                                               
 12                                                   
 13 #include <asm/ppc_asm.h>                          
 14 #include <asm/asm-offsets.h>                      
 15                                                   
 16 #define rHP     r3      /* pointer to hash val    
 17 #define rWP     r4      /* pointer to input       
 18 #define rKP     r5      /* pointer to constant    
 19                                                   
 20 #define rW0     r14     /* 64 bit round words     
 21 #define rW1     r15                               
 22 #define rW2     r16                               
 23 #define rW3     r17                               
 24 #define rW4     r18                               
 25 #define rW5     r19                               
 26 #define rW6     r20                               
 27 #define rW7     r21                               
 28                                                   
 29 #define rH0     r6      /* 32 bit hash values     
 30 #define rH1     r7                                
 31 #define rH2     r8                                
 32 #define rH3     r9                                
 33 #define rH4     r10                               
 34                                                   
 35 #define rT0     r22     /* 64 bit temporary       
 36 #define rT1     r0      /* 32 bit temporaries     
 37 #define rT2     r11                               
 38 #define rT3     r12                               
 39                                                   
 40 #define rK      r23     /* 64 bit constant in     
 41                                                   
 42 #define LOAD_K01                                  
 43                                                   
 44 #define LOAD_K11 \                                
 45         evlwwsplat      rK,0(rKP);                
 46                                                   
 47 #define LOAD_K21 \                                
 48         evlwwsplat      rK,4(rKP);                
 49                                                   
 50 #define LOAD_K31 \                                
 51         evlwwsplat      rK,8(rKP);                
 52                                                   
 53 #define LOAD_K41 \                                
 54         evlwwsplat      rK,12(rKP);               
 55                                                   
 56 #define INITIALIZE \                              
 57         stwu            r1,-128(r1);    /* cre    
 58         evstdw          r14,8(r1);      /* We     
 59         evstdw          r15,16(r1);     /* reg    
 60         evstdw          r16,24(r1);     /* and    
 61         evstdw          r17,32(r1);               
 62         evstdw          r18,40(r1);               
 63         evstdw          r19,48(r1);               
 64         evstdw          r20,56(r1);               
 65         evstdw          r21,64(r1);               
 66         evstdw          r22,72(r1);               
 67         evstdw          r23,80(r1);               
 68                                                   
 69                                                   
 70 #define FINALIZE \                                
 71         evldw           r14,8(r1);      /* res    
 72         evldw           r15,16(r1);               
 73         evldw           r16,24(r1);               
 74         evldw           r17,32(r1);               
 75         evldw           r18,40(r1);               
 76         evldw           r19,48(r1);               
 77         evldw           r20,56(r1);               
 78         evldw           r21,64(r1);               
 79         evldw           r22,72(r1);               
 80         evldw           r23,80(r1);               
 81         xor             r0,r0,r0;                 
 82         stw             r0,8(r1);       /* Del    
 83         stw             r0,16(r1);      /* tha    
 84         stw             r0,24(r1);      /* fro    
 85         stw             r0,32(r1);      /* the    
 86         stw             r0,40(r1);      /* the    
 87         stw             r0,48(r1);      /* wer    
 88         stw             r0,56(r1);      /* the    
 89         stw             r0,64(r1);                
 90         stw             r0,72(r1);                
 91         stw             r0,80(r1);                
 92         addi            r1,r1,128;      /* cle    
 93                                                   
 94 #ifdef __BIG_ENDIAN__                             
 95 #define LOAD_DATA(reg, off) \                     
 96         lwz             reg,off(rWP);   /* loa    
 97 #define NEXT_BLOCK \                              
 98         addi            rWP,rWP,64;     /* inc    
 99 #else                                             
100 #define LOAD_DATA(reg, off) \                     
101         lwbrx           reg,0,rWP;      /* loa    
102         addi            rWP,rWP,4;      /* inc    
103 #define NEXT_BLOCK                      /* not    
104 #endif                                            
105                                                   
106 #define R_00_15(a, b, c, d, e, w0, w1, k, off)    
107         LOAD_DATA(w0, off)              /* 1:     
108         and             rT2,b,c;        /* 1:     
109         LOAD_K##k##1                              
110         andc            rT1,d,b;        /* 1:     
111         rotrwi          rT0,a,27;       /* 1:     
112         or              rT2,rT2,rT1;    /* 1:     
113         add             e,e,rT0;        /* 1:     
114         rotrwi          b,b,2;          /* 1:     
115         add             e,e,w0;         /* 1:     
116         LOAD_DATA(w1, off+4)            /* 2:     
117         add             e,e,rT2;        /* 1:     
118         and             rT1,a,b;        /* 2:     
119         add             e,e,rK;         /* 1:     
120         andc            rT2,c,a;        /* 2:     
121         add             d,d,rK;         /* 2:     
122         or              rT2,rT2,rT1;    /* 2:     
123         rotrwi          rT0,e,27;       /* 2:     
124         add             d,d,w1;         /* 2:     
125         rotrwi          a,a,2;          /* 2:     
126         add             d,d,rT0;        /* 2:     
127         evmergelo       w1,w1,w0;       /*        
128         add             d,d,rT2         /* 2:     
129                                                   
130 #define R_16_19(a, b, c, d, e, w0, w1, w4, w6,    
131         and             rT2,b,c;        /* 1:     
132         evmergelohi     rT0,w7,w6;      /*        
133         andc            rT1,d,b;        /* 1:     
134         evxor           w0,w0,rT0;      /*        
135         or              rT1,rT1,rT2;    /* 1:     
136         evxor           w0,w0,w4;       /*        
137         add             e,e,rT1;        /* 1:     
138         evxor           w0,w0,w1;       /*        
139         rotrwi          rT2,a,27;       /* 1:     
140         evrlwi          w0,w0,1;        /*        
141         add             e,e,rT2;        /* 1:     
142         evaddw          rT0,w0,rK;      /*        
143         rotrwi          b,b,2;          /* 1:     
144         LOAD_K##k##1                              
145         evmergehi       rT1,rT1,rT0;    /*        
146         add             e,e,rT0;        /* 1:     
147         add             d,d,rT1;        /* 2:     
148         and             rT2,a,b;        /* 2:     
149         andc            rT1,c,a;        /* 2:     
150         rotrwi          rT0,e,27;       /* 2:     
151         or              rT1,rT1,rT2;    /* 2:     
152         add             d,d,rT0;        /* 2:     
153         rotrwi          a,a,2;          /* 2:     
154         add             d,d,rT1         /* 2:     
155                                                   
156 #define R_20_39(a, b, c, d, e, w0, w1, w4, w6,    
157         evmergelohi     rT0,w7,w6;      /*        
158         xor             rT2,b,c;        /* 1:     
159         evxor           w0,w0,rT0;      /*        
160         xor             rT2,rT2,d;      /* 1:     
161         evxor           w0,w0,w4;       /*        
162         add             e,e,rT2;        /* 1:     
163         evxor           w0,w0,w1;       /*        
164         rotrwi          rT2,a,27;       /* 1:     
165         evrlwi          w0,w0,1;        /*        
166         add             e,e,rT2;        /* 1:     
167         evaddw          rT0,w0,rK;      /*        
168         rotrwi          b,b,2;          /* 1:     
169         LOAD_K##k##1                              
170         evmergehi       rT1,rT1,rT0;    /*        
171         add             e,e,rT0;        /* 1:     
172         xor             rT2,a,b;        /* 2:     
173         add             d,d,rT1;        /* 2:     
174         xor             rT2,rT2,c;      /* 2:     
175         rotrwi          rT0,e,27;       /* 2:     
176         add             d,d,rT2;        /* 2:     
177         rotrwi          a,a,2;          /* 2:     
178         add             d,d,rT0         /* 2:     
179                                                   
180 #define R_40_59(a, b, c, d, e, w0, w1, w4, w6,    
181         and             rT2,b,c;        /* 1:     
182         evmergelohi     rT0,w7,w6;      /*        
183         or              rT1,b,c;        /* 1:     
184         evxor           w0,w0,rT0;      /*        
185         and             rT1,d,rT1;      /* 1:     
186         evxor           w0,w0,w4;       /*        
187         or              rT2,rT2,rT1;    /* 1:     
188         evxor           w0,w0,w1;       /*        
189         add             e,e,rT2;        /* 1:     
190         evrlwi          w0,w0,1;        /*        
191         rotrwi          rT2,a,27;       /* 1:     
192         evaddw          rT0,w0,rK;      /*        
193         add             e,e,rT2;        /* 1:     
194         LOAD_K##k##1                              
195         evmergehi       rT1,rT1,rT0;    /*        
196         rotrwi          b,b,2;          /* 1:     
197         add             e,e,rT0;        /* 1:     
198         and             rT2,a,b;        /* 2:     
199         or              rT0,a,b;        /* 2:     
200         add             d,d,rT1;        /* 2:     
201         and             rT0,c,rT0;      /* 2:     
202         rotrwi          a,a,2;          /* 2:     
203         or              rT2,rT2,rT0;    /* 2:     
204         rotrwi          rT0,e,27;       /* 2:     
205         add             d,d,rT2;        /* 2:     
206         add             d,d,rT0         /* 2:     
207                                                   
208 #define R_60_79(a, b, c, d, e, w0, w1, w4, w6,    
209         R_20_39(a, b, c, d, e, w0, w1, w4, w6,    
210                                                   
211 _GLOBAL(ppc_spe_sha1_transform)                   
212         INITIALIZE                                
213                                                   
214         lwz             rH0,0(rHP)                
215         lwz             rH1,4(rHP)                
216         mtctr           r5                        
217         lwz             rH2,8(rHP)                
218         lis             rKP,PPC_SPE_SHA1_K@h      
219         lwz             rH3,12(rHP)               
220         ori             rKP,rKP,PPC_SPE_SHA1_K    
221         lwz             rH4,16(rHP)               
222                                                   
223 ppc_spe_sha1_main:                                
224         R_00_15(rH0, rH1, rH2, rH3, rH4, rW1,     
225         R_00_15(rH3, rH4, rH0, rH1, rH2, rW2,     
226         R_00_15(rH1, rH2, rH3, rH4, rH0, rW3,     
227         R_00_15(rH4, rH0, rH1, rH2, rH3, rW4,     
228         R_00_15(rH2, rH3, rH4, rH0, rH1, rW5,     
229         R_00_15(rH0, rH1, rH2, rH3, rH4, rW6,     
230         R_00_15(rH3, rH4, rH0, rH1, rH2, rT3,     
231         R_00_15(rH1, rH2, rH3, rH4, rH0, rT3,     
232                                                   
233         R_16_19(rH4, rH0, rH1, rH2, rH3, rW0,     
234         R_16_19(rH2, rH3, rH4, rH0, rH1, rW1,     
235                                                   
236         R_20_39(rH0, rH1, rH2, rH3, rH4, rW2,     
237         R_20_39(rH3, rH4, rH0, rH1, rH2, rW3,     
238         R_20_39(rH1, rH2, rH3, rH4, rH0, rW4,     
239         R_20_39(rH4, rH0, rH1, rH2, rH3, rW5,     
240         R_20_39(rH2, rH3, rH4, rH0, rH1, rW6,     
241         R_20_39(rH0, rH1, rH2, rH3, rH4, rW7,     
242         R_20_39(rH3, rH4, rH0, rH1, rH2, rW0,     
243         R_20_39(rH1, rH2, rH3, rH4, rH0, rW1,     
244         R_20_39(rH4, rH0, rH1, rH2, rH3, rW2,     
245         R_20_39(rH2, rH3, rH4, rH0, rH1, rW3,     
246                                                   
247         R_40_59(rH0, rH1, rH2, rH3, rH4, rW4,     
248         R_40_59(rH3, rH4, rH0, rH1, rH2, rW5,     
249         R_40_59(rH1, rH2, rH3, rH4, rH0, rW6,     
250         R_40_59(rH4, rH0, rH1, rH2, rH3, rW7,     
251         R_40_59(rH2, rH3, rH4, rH0, rH1, rW0,     
252         R_40_59(rH0, rH1, rH2, rH3, rH4, rW1,     
253         R_40_59(rH3, rH4, rH0, rH1, rH2, rW2,     
254         R_40_59(rH1, rH2, rH3, rH4, rH0, rW3,     
255         R_40_59(rH4, rH0, rH1, rH2, rH3, rW4,     
256         R_40_59(rH2, rH3, rH4, rH0, rH1, rW5,     
257                                                   
258         R_60_79(rH0, rH1, rH2, rH3, rH4, rW6,     
259         R_60_79(rH3, rH4, rH0, rH1, rH2, rW7,     
260         R_60_79(rH1, rH2, rH3, rH4, rH0, rW0,     
261         R_60_79(rH4, rH0, rH1, rH2, rH3, rW1,     
262         R_60_79(rH2, rH3, rH4, rH0, rH1, rW2,     
263         R_60_79(rH0, rH1, rH2, rH3, rH4, rW3,     
264         R_60_79(rH3, rH4, rH0, rH1, rH2, rW4,     
265         lwz             rT3,0(rHP)                
266         R_60_79(rH1, rH2, rH3, rH4, rH0, rW5,     
267         lwz             rW1,4(rHP)                
268         R_60_79(rH4, rH0, rH1, rH2, rH3, rW6,     
269         lwz             rW2,8(rHP)                
270         R_60_79(rH2, rH3, rH4, rH0, rH1, rW7,     
271         lwz             rW3,12(rHP)               
272         NEXT_BLOCK                                
273         lwz             rW4,16(rHP)               
274                                                   
275         add             rH0,rH0,rT3               
276         stw             rH0,0(rHP)                
277         add             rH1,rH1,rW1               
278         stw             rH1,4(rHP)                
279         add             rH2,rH2,rW2               
280         stw             rH2,8(rHP)                
281         add             rH3,rH3,rW3               
282         stw             rH3,12(rHP)               
283         add             rH4,rH4,rW4               
284         stw             rH4,16(rHP)               
285                                                   
286         bdnz            ppc_spe_sha1_main         
287                                                   
288         FINALIZE                                  
289         blr                                       
290                                                   
291 .data                                             
292 .align 4                                          
293 PPC_SPE_SHA1_K:                                   
294         .long 0x5A827999,0x6ED9EBA1,0x8F1BBCDC    
                                                      

~ [ source navigation ] ~ [ diff markup ] ~ [ identifier search ] ~

kernel.org | git.kernel.org | LWN.net | Project Home | SVN repository | Mail admin

Linux® is a registered trademark of Linus Torvalds in the United States and other countries.
TOMOYO® is a registered trademark of NTT DATA CORPORATION.

sflogo.php