~ [ source navigation ] ~ [ diff markup ] ~ [ identifier search ] ~

TOMOYO Linux Cross Reference
Linux/arch/x86/crypto/nh-sse2-x86_64.S

Version: ~ [ linux-6.12-rc7 ] ~ [ linux-6.11.7 ] ~ [ linux-6.10.14 ] ~ [ linux-6.9.12 ] ~ [ linux-6.8.12 ] ~ [ linux-6.7.12 ] ~ [ linux-6.6.60 ] ~ [ linux-6.5.13 ] ~ [ linux-6.4.16 ] ~ [ linux-6.3.13 ] ~ [ linux-6.2.16 ] ~ [ linux-6.1.116 ] ~ [ linux-6.0.19 ] ~ [ linux-5.19.17 ] ~ [ linux-5.18.19 ] ~ [ linux-5.17.15 ] ~ [ linux-5.16.20 ] ~ [ linux-5.15.171 ] ~ [ linux-5.14.21 ] ~ [ linux-5.13.19 ] ~ [ linux-5.12.19 ] ~ [ linux-5.11.22 ] ~ [ linux-5.10.229 ] ~ [ linux-5.9.16 ] ~ [ linux-5.8.18 ] ~ [ linux-5.7.19 ] ~ [ linux-5.6.19 ] ~ [ linux-5.5.19 ] ~ [ linux-5.4.285 ] ~ [ linux-5.3.18 ] ~ [ linux-5.2.21 ] ~ [ linux-5.1.21 ] ~ [ linux-5.0.21 ] ~ [ linux-4.20.17 ] ~ [ linux-4.19.323 ] ~ [ linux-4.18.20 ] ~ [ linux-4.17.19 ] ~ [ linux-4.16.18 ] ~ [ linux-4.15.18 ] ~ [ linux-4.14.336 ] ~ [ linux-4.13.16 ] ~ [ linux-4.12.14 ] ~ [ linux-4.11.12 ] ~ [ linux-4.10.17 ] ~ [ linux-4.9.337 ] ~ [ linux-4.4.302 ] ~ [ linux-3.10.108 ] ~ [ linux-2.6.32.71 ] ~ [ linux-2.6.0 ] ~ [ linux-2.4.37.11 ] ~ [ unix-v6-master ] ~ [ ccs-tools-1.8.12 ] ~ [ policy-sample ] ~
Architecture: ~ [ i386 ] ~ [ alpha ] ~ [ m68k ] ~ [ mips ] ~ [ ppc ] ~ [ sparc ] ~ [ sparc64 ] ~

Diff markup

Differences between /arch/x86/crypto/nh-sse2-x86_64.S (Version linux-6.12-rc7) and /arch/i386/crypto/nh-sse2-x86_64.S (Version linux-6.2.16)


  1 /* SPDX-License-Identifier: GPL-2.0 */            
  2 /*                                                
  3  * NH - ε-almost-universal hash function, x86    
  4  *                                                
  5  * Copyright 2018 Google LLC                      
  6  *                                                
  7  * Author: Eric Biggers <ebiggers@google.com>      
  8  */                                               
  9                                                   
 10 #include <linux/linkage.h>                        
 11 #include <linux/cfi_types.h>                      
 12                                                   
 13 #define         PASS0_SUMS      %xmm0             
 14 #define         PASS1_SUMS      %xmm1             
 15 #define         PASS2_SUMS      %xmm2             
 16 #define         PASS3_SUMS      %xmm3             
 17 #define         K0              %xmm4             
 18 #define         K1              %xmm5             
 19 #define         K2              %xmm6             
 20 #define         K3              %xmm7             
 21 #define         T0              %xmm8             
 22 #define         T1              %xmm9             
 23 #define         T2              %xmm10            
 24 #define         T3              %xmm11            
 25 #define         T4              %xmm12            
 26 #define         T5              %xmm13            
 27 #define         T6              %xmm14            
 28 #define         T7              %xmm15            
 29 #define         KEY             %rdi              
 30 #define         MESSAGE         %rsi              
 31 #define         MESSAGE_LEN     %rdx              
 32 #define         HASH            %rcx              
 33                                                   
 34 .macro _nh_stride       k0, k1, k2, k3, offset    
 35                                                   
 36         // Load next message stride               
 37         movdqu          \offset(MESSAGE), T1      
 38                                                   
 39         // Load next key stride                   
 40         movdqu          \offset(KEY), \k3         
 41                                                   
 42         // Add message words to key words         
 43         movdqa          T1, T2                    
 44         movdqa          T1, T3                    
 45         paddd           T1, \k0    // reuse k0    
 46         paddd           \k1, T1                   
 47         paddd           \k2, T2                   
 48         paddd           \k3, T3                   
 49                                                   
 50         // Multiply 32x32 => 64 and accumulate    
 51         pshufd          $0x10, \k0, T4            
 52         pshufd          $0x32, \k0, \k0           
 53         pshufd          $0x10, T1, T5             
 54         pshufd          $0x32, T1, T1             
 55         pshufd          $0x10, T2, T6             
 56         pshufd          $0x32, T2, T2             
 57         pshufd          $0x10, T3, T7             
 58         pshufd          $0x32, T3, T3             
 59         pmuludq         T4, \k0                   
 60         pmuludq         T5, T1                    
 61         pmuludq         T6, T2                    
 62         pmuludq         T7, T3                    
 63         paddq           \k0, PASS0_SUMS           
 64         paddq           T1, PASS1_SUMS            
 65         paddq           T2, PASS2_SUMS            
 66         paddq           T3, PASS3_SUMS            
 67 .endm                                             
 68                                                   
 69 /*                                                
 70  * void nh_sse2(const u32 *key, const u8 *mess    
 71  *              __le64 hash[NH_NUM_PASSES])       
 72  *                                                
 73  * It's guaranteed that message_len % 16 == 0.    
 74  */                                               
 75 SYM_TYPED_FUNC_START(nh_sse2)                     
 76                                                   
 77         movdqu          0x00(KEY), K0             
 78         movdqu          0x10(KEY), K1             
 79         movdqu          0x20(KEY), K2             
 80         add             $0x30, KEY                
 81         pxor            PASS0_SUMS, PASS0_SUMS    
 82         pxor            PASS1_SUMS, PASS1_SUMS    
 83         pxor            PASS2_SUMS, PASS2_SUMS    
 84         pxor            PASS3_SUMS, PASS3_SUMS    
 85                                                   
 86         sub             $0x40, MESSAGE_LEN        
 87         jl              .Lloop4_done              
 88 .Lloop4:                                          
 89         _nh_stride      K0, K1, K2, K3, 0x00      
 90         _nh_stride      K1, K2, K3, K0, 0x10      
 91         _nh_stride      K2, K3, K0, K1, 0x20      
 92         _nh_stride      K3, K0, K1, K2, 0x30      
 93         add             $0x40, KEY                
 94         add             $0x40, MESSAGE            
 95         sub             $0x40, MESSAGE_LEN        
 96         jge             .Lloop4                   
 97                                                   
 98 .Lloop4_done:                                     
 99         and             $0x3f, MESSAGE_LEN        
100         jz              .Ldone                    
101         _nh_stride      K0, K1, K2, K3, 0x00      
102                                                   
103         sub             $0x10, MESSAGE_LEN        
104         jz              .Ldone                    
105         _nh_stride      K1, K2, K3, K0, 0x10      
106                                                   
107         sub             $0x10, MESSAGE_LEN        
108         jz              .Ldone                    
109         _nh_stride      K2, K3, K0, K1, 0x20      
110                                                   
111 .Ldone:                                           
112         // Sum the accumulators for each pass,    
113         movdqa          PASS0_SUMS, T0            
114         movdqa          PASS2_SUMS, T1            
115         punpcklqdq      PASS1_SUMS, T0            
116         punpcklqdq      PASS3_SUMS, T1            
117         punpckhqdq      PASS1_SUMS, PASS0_SUMS    
118         punpckhqdq      PASS3_SUMS, PASS2_SUMS    
119         paddq           PASS0_SUMS, T0            
120         paddq           PASS2_SUMS, T1            
121         movdqu          T0, 0x00(HASH)            
122         movdqu          T1, 0x10(HASH)            
123         RET                                       
124 SYM_FUNC_END(nh_sse2)                             
                                                      

~ [ source navigation ] ~ [ diff markup ] ~ [ identifier search ] ~

kernel.org | git.kernel.org | LWN.net | Project Home | SVN repository | Mail admin

Linux® is a registered trademark of Linus Torvalds in the United States and other countries.
TOMOYO® is a registered trademark of NTT DATA CORPORATION.

sflogo.php