~ [ source navigation ] ~ [ diff markup ] ~ [ identifier search ] ~

TOMOYO Linux Cross Reference
Linux/kernel/rcu/refscale.c

Version: ~ [ linux-6.12-rc7 ] ~ [ linux-6.11.7 ] ~ [ linux-6.10.14 ] ~ [ linux-6.9.12 ] ~ [ linux-6.8.12 ] ~ [ linux-6.7.12 ] ~ [ linux-6.6.60 ] ~ [ linux-6.5.13 ] ~ [ linux-6.4.16 ] ~ [ linux-6.3.13 ] ~ [ linux-6.2.16 ] ~ [ linux-6.1.116 ] ~ [ linux-6.0.19 ] ~ [ linux-5.19.17 ] ~ [ linux-5.18.19 ] ~ [ linux-5.17.15 ] ~ [ linux-5.16.20 ] ~ [ linux-5.15.171 ] ~ [ linux-5.14.21 ] ~ [ linux-5.13.19 ] ~ [ linux-5.12.19 ] ~ [ linux-5.11.22 ] ~ [ linux-5.10.229 ] ~ [ linux-5.9.16 ] ~ [ linux-5.8.18 ] ~ [ linux-5.7.19 ] ~ [ linux-5.6.19 ] ~ [ linux-5.5.19 ] ~ [ linux-5.4.285 ] ~ [ linux-5.3.18 ] ~ [ linux-5.2.21 ] ~ [ linux-5.1.21 ] ~ [ linux-5.0.21 ] ~ [ linux-4.20.17 ] ~ [ linux-4.19.323 ] ~ [ linux-4.18.20 ] ~ [ linux-4.17.19 ] ~ [ linux-4.16.18 ] ~ [ linux-4.15.18 ] ~ [ linux-4.14.336 ] ~ [ linux-4.13.16 ] ~ [ linux-4.12.14 ] ~ [ linux-4.11.12 ] ~ [ linux-4.10.17 ] ~ [ linux-4.9.337 ] ~ [ linux-4.4.302 ] ~ [ linux-3.10.108 ] ~ [ linux-2.6.32.71 ] ~ [ linux-2.6.0 ] ~ [ linux-2.4.37.11 ] ~ [ unix-v6-master ] ~ [ ccs-tools-1.8.12 ] ~ [ policy-sample ] ~
Architecture: ~ [ i386 ] ~ [ alpha ] ~ [ m68k ] ~ [ mips ] ~ [ ppc ] ~ [ sparc ] ~ [ sparc64 ] ~

Diff markup

Differences between /kernel/rcu/refscale.c (Version linux-6.12-rc7) and /kernel/rcu/refscale.c (Version linux-5.4.285)


  1 // SPDX-License-Identifier: GPL-2.0+                1 
  2 //                                                
  3 // Scalability test comparing RCU vs other mec    
  4 // for acquiring references on objects.           
  5 //                                                
  6 // Copyright (C) Google, 2020.                    
  7 //                                                
  8 // Author: Joel Fernandes <joel@joelfernandes.    
  9                                                   
 10 #define pr_fmt(fmt) fmt                           
 11                                                   
 12 #include <linux/atomic.h>                         
 13 #include <linux/bitops.h>                         
 14 #include <linux/completion.h>                     
 15 #include <linux/cpu.h>                            
 16 #include <linux/delay.h>                          
 17 #include <linux/err.h>                            
 18 #include <linux/init.h>                           
 19 #include <linux/interrupt.h>                      
 20 #include <linux/kthread.h>                        
 21 #include <linux/kernel.h>                         
 22 #include <linux/mm.h>                             
 23 #include <linux/module.h>                         
 24 #include <linux/moduleparam.h>                    
 25 #include <linux/notifier.h>                       
 26 #include <linux/percpu.h>                         
 27 #include <linux/rcupdate.h>                       
 28 #include <linux/rcupdate_trace.h>                 
 29 #include <linux/reboot.h>                         
 30 #include <linux/sched.h>                          
 31 #include <linux/seq_buf.h>                        
 32 #include <linux/spinlock.h>                       
 33 #include <linux/smp.h>                            
 34 #include <linux/stat.h>                           
 35 #include <linux/srcu.h>                           
 36 #include <linux/slab.h>                           
 37 #include <linux/torture.h>                        
 38 #include <linux/types.h>                          
 39                                                   
 40 #include "rcu.h"                                  
 41                                                   
 42 #define SCALE_FLAG "-ref-scale: "                 
 43                                                   
 44 #define SCALEOUT(s, x...) \                       
 45         pr_alert("%s" SCALE_FLAG s, scale_type    
 46                                                   
 47 #define VERBOSE_SCALEOUT(s, x...) \               
 48         do { \                                    
 49                 if (verbose) \                    
 50                         pr_alert("%s" SCALE_FL    
 51         } while (0)                               
 52                                                   
 53 static atomic_t verbose_batch_ctr;                
 54                                                   
 55 #define VERBOSE_SCALEOUT_BATCH(s, x...)           
 56 do {                                              
 57         if (verbose &&                            
 58             (verbose_batched <= 0 ||              
 59              !(atomic_inc_return(&verbose_batc    
 60                 schedule_timeout_uninterruptib    
 61                 pr_alert("%s" SCALE_FLAG s "\n    
 62         }                                         
 63 } while (0)                                       
 64                                                   
 65 #define SCALEOUT_ERRSTRING(s, x...) pr_alert("    
 66                                                   
 67 MODULE_DESCRIPTION("Scalability test for objec    
 68 MODULE_LICENSE("GPL");                            
 69 MODULE_AUTHOR("Joel Fernandes (Google) <joel@j    
 70                                                   
 71 static char *scale_type = "rcu";                  
 72 module_param(scale_type, charp, 0444);            
 73 MODULE_PARM_DESC(scale_type, "Type of test (rc    
 74                                                   
 75 torture_param(int, verbose, 0, "Enable verbose    
 76 torture_param(int, verbose_batched, 0, "Batch     
 77                                                   
 78 // Wait until there are multiple CPUs before s    
 79 torture_param(int, holdoff, IS_BUILTIN(CONFIG_    
 80               "Holdoff time before test start     
 81 // Number of typesafe_lookup structures, that     
 82 torture_param(long, lookup_instances, 0, "Numb    
 83 // Number of loops per experiment, all readers    
 84 torture_param(long, loops, 10000, "Number of l    
 85 // Number of readers, with -1 defaulting to ab    
 86 torture_param(int, nreaders, -1, "Number of re    
 87 // Number of runs.                                
 88 torture_param(int, nruns, 30, "Number of exper    
 89 // Reader delay in nanoseconds, 0 for no delay    
 90 torture_param(int, readdelay, 0, "Read-side de    
 91                                                   
 92 #ifdef MODULE                                     
 93 # define REFSCALE_SHUTDOWN 0                      
 94 #else                                             
 95 # define REFSCALE_SHUTDOWN 1                      
 96 #endif                                            
 97                                                   
 98 torture_param(bool, shutdown, REFSCALE_SHUTDOW    
 99               "Shutdown at end of scalability     
100                                                   
101 struct reader_task {                              
102         struct task_struct *task;                 
103         int start_reader;                         
104         wait_queue_head_t wq;                     
105         u64 last_duration_ns;                     
106 };                                                
107                                                   
108 static struct task_struct *shutdown_task;         
109 static wait_queue_head_t shutdown_wq;             
110                                                   
111 static struct task_struct *main_task;             
112 static wait_queue_head_t main_wq;                 
113 static int shutdown_start;                        
114                                                   
115 static struct reader_task *reader_tasks;          
116                                                   
117 // Number of readers that are part of the curr    
118 static atomic_t nreaders_exp;                     
119                                                   
120 // Use to wait for all threads to start.          
121 static atomic_t n_init;                           
122 static atomic_t n_started;                        
123 static atomic_t n_warmedup;                       
124 static atomic_t n_cooleddown;                     
125                                                   
126 // Track which experiment is currently running    
127 static int exp_idx;                               
128                                                   
129 // Operations vector for selecting different t    
130 struct ref_scale_ops {                            
131         bool (*init)(void);                       
132         void (*cleanup)(void);                    
133         void (*readsection)(const int nloops);    
134         void (*delaysection)(const int nloops,    
135         const char *name;                         
136 };                                                
137                                                   
138 static const struct ref_scale_ops *cur_ops;       
139                                                   
140 static void un_delay(const int udl, const int     
141 {                                                 
142         if (udl)                                  
143                 udelay(udl);                      
144         if (ndl)                                  
145                 ndelay(ndl);                      
146 }                                                 
147                                                   
// Read-side loop for the "rcu" ops: every pass enters and immediately
// leaves an empty RCU read-side critical section.
//
// @nloops: loop bound.  The counter runs from nloops down to 0 inclusive,
//          so the lock/unlock pair executes nloops + 1 times when
//          nloops >= 0 and not at all when it is negative.
static void ref_rcu_read_section(const int nloops)
{
	int i;

	for (i = nloops; i >= 0; i--) {
		rcu_read_lock();
		rcu_read_unlock();
	}
}
157                                                   
158 static void ref_rcu_delay_section(const int nl    
159 {                                                 
160         int i;                                    
161                                                   
162         for (i = nloops; i >= 0; i--) {           
163                 rcu_read_lock();                  
164                 un_delay(udl, ndl);               
165                 rcu_read_unlock();                
166         }                                         
167 }                                                 
168                                                   
// Init hook for test types that need no setup: does nothing and always
// reports success.  Installed as .init by the rcu, srcu, rcu-tasks,
// rcu-trace and refcnt ops tables.
//
// Returns true unconditionally.
static bool rcu_sync_scale_init(void)
{
	return true;
}
173                                                   
174 static const struct ref_scale_ops rcu_ops = {     
175         .init           = rcu_sync_scale_init,    
176         .readsection    = ref_rcu_read_section    
177         .delaysection   = ref_rcu_delay_sectio    
178         .name           = "rcu"                   
179 };                                                
180                                                   
181 // Definitions for SRCU ref scale testing.        
182 DEFINE_STATIC_SRCU(srcu_refctl_scale);            
183 static struct srcu_struct *srcu_ctlp = &srcu_r    
184                                                   
185 static void srcu_ref_scale_read_section(const     
186 {                                                 
187         int i;                                    
188         int idx;                                  
189                                                   
190         for (i = nloops; i >= 0; i--) {           
191                 idx = srcu_read_lock(srcu_ctlp    
192                 srcu_read_unlock(srcu_ctlp, id    
193         }                                         
194 }                                                 
195                                                   
196 static void srcu_ref_scale_delay_section(const    
197 {                                                 
198         int i;                                    
199         int idx;                                  
200                                                   
201         for (i = nloops; i >= 0; i--) {           
202                 idx = srcu_read_lock(srcu_ctlp    
203                 un_delay(udl, ndl);               
204                 srcu_read_unlock(srcu_ctlp, id    
205         }                                         
206 }                                                 
207                                                   
208 static const struct ref_scale_ops srcu_ops = {    
209         .init           = rcu_sync_scale_init,    
210         .readsection    = srcu_ref_scale_read_    
211         .delaysection   = srcu_ref_scale_delay    
212         .name           = "srcu"                  
213 };                                                
214                                                   
215 #ifdef CONFIG_TASKS_RCU                           
216                                                   
217 // Definitions for RCU Tasks ref scale testing    
218 // These definitions also work for RCU Rude re    
219 static void rcu_tasks_ref_scale_read_section(c    
220 {                                                 
221         int i;                                    
222                                                   
223         for (i = nloops; i >= 0; i--)             
224                 continue;                         
225 }                                                 
226                                                   
227 static void rcu_tasks_ref_scale_delay_section(    
228 {                                                 
229         int i;                                    
230                                                   
231         for (i = nloops; i >= 0; i--)             
232                 un_delay(udl, ndl);               
233 }                                                 
234                                                   
235 static const struct ref_scale_ops rcu_tasks_op    
236         .init           = rcu_sync_scale_init,    
237         .readsection    = rcu_tasks_ref_scale_    
238         .delaysection   = rcu_tasks_ref_scale_    
239         .name           = "rcu-tasks"             
240 };                                                
241                                                   
242 #define RCU_TASKS_OPS &rcu_tasks_ops,             
243                                                   
244 #else // #ifdef CONFIG_TASKS_RCU                  
245                                                   
246 #define RCU_TASKS_OPS                             
247                                                   
248 #endif // #else // #ifdef CONFIG_TASKS_RCU        
249                                                   
250 #ifdef CONFIG_TASKS_TRACE_RCU                     
251                                                   
252 // Definitions for RCU Tasks Trace ref scale t    
253 static void rcu_trace_ref_scale_read_section(c    
254 {                                                 
255         int i;                                    
256                                                   
257         for (i = nloops; i >= 0; i--) {           
258                 rcu_read_lock_trace();            
259                 rcu_read_unlock_trace();          
260         }                                         
261 }                                                 
262                                                   
263 static void rcu_trace_ref_scale_delay_section(    
264 {                                                 
265         int i;                                    
266                                                   
267         for (i = nloops; i >= 0; i--) {           
268                 rcu_read_lock_trace();            
269                 un_delay(udl, ndl);               
270                 rcu_read_unlock_trace();          
271         }                                         
272 }                                                 
273                                                   
274 static const struct ref_scale_ops rcu_trace_op    
275         .init           = rcu_sync_scale_init,    
276         .readsection    = rcu_trace_ref_scale_    
277         .delaysection   = rcu_trace_ref_scale_    
278         .name           = "rcu-trace"             
279 };                                                
280                                                   
281 #define RCU_TRACE_OPS &rcu_trace_ops,             
282                                                   
283 #else // #ifdef CONFIG_TASKS_TRACE_RCU            
284                                                   
285 #define RCU_TRACE_OPS                             
286                                                   
287 #endif // #else // #ifdef CONFIG_TASKS_TRACE_R    
288                                                   
289 // Definitions for reference count                
290 static atomic_t refcnt;                           
291                                                   
292 static void ref_refcnt_section(const int nloop    
293 {                                                 
294         int i;                                    
295                                                   
296         for (i = nloops; i >= 0; i--) {           
297                 atomic_inc(&refcnt);              
298                 atomic_dec(&refcnt);              
299         }                                         
300 }                                                 
301                                                   
302 static void ref_refcnt_delay_section(const int    
303 {                                                 
304         int i;                                    
305                                                   
306         for (i = nloops; i >= 0; i--) {           
307                 atomic_inc(&refcnt);              
308                 un_delay(udl, ndl);               
309                 atomic_dec(&refcnt);              
310         }                                         
311 }                                                 
312                                                   
313 static const struct ref_scale_ops refcnt_ops =    
314         .init           = rcu_sync_scale_init,    
315         .readsection    = ref_refcnt_section,     
316         .delaysection   = ref_refcnt_delay_sec    
317         .name           = "refcnt"                
318 };                                                
319                                                   
320 // Definitions for rwlock                         
321 static rwlock_t test_rwlock;                      
322                                                   
323 static bool ref_rwlock_init(void)                 
324 {                                                 
325         rwlock_init(&test_rwlock);                
326         return true;                              
327 }                                                 
328                                                   
329 static void ref_rwlock_section(const int nloop    
330 {                                                 
331         int i;                                    
332                                                   
333         for (i = nloops; i >= 0; i--) {           
334                 read_lock(&test_rwlock);          
335                 read_unlock(&test_rwlock);        
336         }                                         
337 }                                                 
338                                                   
339 static void ref_rwlock_delay_section(const int    
340 {                                                 
341         int i;                                    
342                                                   
343         for (i = nloops; i >= 0; i--) {           
344                 read_lock(&test_rwlock);          
345                 un_delay(udl, ndl);               
346                 read_unlock(&test_rwlock);        
347         }                                         
348 }                                                 
349                                                   
350 static const struct ref_scale_ops rwlock_ops =    
351         .init           = ref_rwlock_init,        
352         .readsection    = ref_rwlock_section,     
353         .delaysection   = ref_rwlock_delay_sec    
354         .name           = "rwlock"                
355 };                                                
356                                                   
357 // Definitions for rwsem                          
358 static struct rw_semaphore test_rwsem;            
359                                                   
360 static bool ref_rwsem_init(void)                  
361 {                                                 
362         init_rwsem(&test_rwsem);                  
363         return true;                              
364 }                                                 
365                                                   
366 static void ref_rwsem_section(const int nloops    
367 {                                                 
368         int i;                                    
369                                                   
370         for (i = nloops; i >= 0; i--) {           
371                 down_read(&test_rwsem);           
372                 up_read(&test_rwsem);             
373         }                                         
374 }                                                 
375                                                   
376 static void ref_rwsem_delay_section(const int     
377 {                                                 
378         int i;                                    
379                                                   
380         for (i = nloops; i >= 0; i--) {           
381                 down_read(&test_rwsem);           
382                 un_delay(udl, ndl);               
383                 up_read(&test_rwsem);             
384         }                                         
385 }                                                 
386                                                   
387 static const struct ref_scale_ops rwsem_ops =     
388         .init           = ref_rwsem_init,         
389         .readsection    = ref_rwsem_section,      
390         .delaysection   = ref_rwsem_delay_sect    
391         .name           = "rwsem"                 
392 };                                                
393                                                   
394 // Definitions for global spinlock                
395 static DEFINE_RAW_SPINLOCK(test_lock);            
396                                                   
397 static void ref_lock_section(const int nloops)    
398 {                                                 
399         int i;                                    
400                                                   
401         preempt_disable();                        
402         for (i = nloops; i >= 0; i--) {           
403                 raw_spin_lock(&test_lock);        
404                 raw_spin_unlock(&test_lock);      
405         }                                         
406         preempt_enable();                         
407 }                                                 
408                                                   
409 static void ref_lock_delay_section(const int n    
410 {                                                 
411         int i;                                    
412                                                   
413         preempt_disable();                        
414         for (i = nloops; i >= 0; i--) {           
415                 raw_spin_lock(&test_lock);        
416                 un_delay(udl, ndl);               
417                 raw_spin_unlock(&test_lock);      
418         }                                         
419         preempt_enable();                         
420 }                                                 
421                                                   
422 static const struct ref_scale_ops lock_ops = {    
423         .readsection    = ref_lock_section,       
424         .delaysection   = ref_lock_delay_secti    
425         .name           = "lock"                  
426 };                                                
427                                                   
428 // Definitions for global irq-save spinlock       
429                                                   
430 static void ref_lock_irq_section(const int nlo    
431 {                                                 
432         unsigned long flags;                      
433         int i;                                    
434                                                   
435         preempt_disable();                        
436         for (i = nloops; i >= 0; i--) {           
437                 raw_spin_lock_irqsave(&test_lo    
438                 raw_spin_unlock_irqrestore(&te    
439         }                                         
440         preempt_enable();                         
441 }                                                 
442                                                   
443 static void ref_lock_irq_delay_section(const i    
444 {                                                 
445         unsigned long flags;                      
446         int i;                                    
447                                                   
448         preempt_disable();                        
449         for (i = nloops; i >= 0; i--) {           
450                 raw_spin_lock_irqsave(&test_lo    
451                 un_delay(udl, ndl);               
452                 raw_spin_unlock_irqrestore(&te    
453         }                                         
454         preempt_enable();                         
455 }                                                 
456                                                   
457 static const struct ref_scale_ops lock_irq_ops    
458         .readsection    = ref_lock_irq_section    
459         .delaysection   = ref_lock_irq_delay_s    
460         .name           = "lock-irq"              
461 };                                                
462                                                   
463 // Definitions acquire-release.                   
464 static DEFINE_PER_CPU(unsigned long, test_acqr    
465                                                   
466 static void ref_acqrel_section(const int nloop    
467 {                                                 
468         unsigned long x;                          
469         int i;                                    
470                                                   
471         preempt_disable();                        
472         for (i = nloops; i >= 0; i--) {           
473                 x = smp_load_acquire(this_cpu_    
474                 smp_store_release(this_cpu_ptr    
475         }                                         
476         preempt_enable();                         
477 }                                                 
478                                                   
479 static void ref_acqrel_delay_section(const int    
480 {                                                 
481         unsigned long x;                          
482         int i;                                    
483                                                   
484         preempt_disable();                        
485         for (i = nloops; i >= 0; i--) {           
486                 x = smp_load_acquire(this_cpu_    
487                 un_delay(udl, ndl);               
488                 smp_store_release(this_cpu_ptr    
489         }                                         
490         preempt_enable();                         
491 }                                                 
492                                                   
493 static const struct ref_scale_ops acqrel_ops =    
494         .readsection    = ref_acqrel_section,     
495         .delaysection   = ref_acqrel_delay_sec    
496         .name           = "acqrel"                
497 };                                                
498                                                   
499 static volatile u64 stopopts;                     
500                                                   
501 static void ref_clock_section(const int nloops    
502 {                                                 
503         u64 x = 0;                                
504         int i;                                    
505                                                   
506         preempt_disable();                        
507         for (i = nloops; i >= 0; i--)             
508                 x += ktime_get_real_fast_ns();    
509         preempt_enable();                         
510         stopopts = x;                             
511 }                                                 
512                                                   
513 static void ref_clock_delay_section(const int     
514 {                                                 
515         u64 x = 0;                                
516         int i;                                    
517                                                   
518         preempt_disable();                        
519         for (i = nloops; i >= 0; i--) {           
520                 x += ktime_get_real_fast_ns();    
521                 un_delay(udl, ndl);               
522         }                                         
523         preempt_enable();                         
524         stopopts = x;                             
525 }                                                 
526                                                   
527 static const struct ref_scale_ops clock_ops =     
528         .readsection    = ref_clock_section,      
529         .delaysection   = ref_clock_delay_sect    
530         .name           = "clock"                 
531 };                                                
532                                                   
533 static void ref_jiffies_section(const int nloo    
534 {                                                 
535         u64 x = 0;                                
536         int i;                                    
537                                                   
538         preempt_disable();                        
539         for (i = nloops; i >= 0; i--)             
540                 x += jiffies;                     
541         preempt_enable();                         
542         stopopts = x;                             
543 }                                                 
544                                                   
545 static void ref_jiffies_delay_section(const in    
546 {                                                 
547         u64 x = 0;                                
548         int i;                                    
549                                                   
550         preempt_disable();                        
551         for (i = nloops; i >= 0; i--) {           
552                 x += jiffies;                     
553                 un_delay(udl, ndl);               
554         }                                         
555         preempt_enable();                         
556         stopopts = x;                             
557 }                                                 
558                                                   
559 static const struct ref_scale_ops jiffies_ops     
560         .readsection    = ref_jiffies_section,    
561         .delaysection   = ref_jiffies_delay_se    
562         .name           = "jiffies"               
563 };                                                
564                                                   
565 //////////////////////////////////////////////    
566 //                                                
567 // Methods leveraging SLAB_TYPESAFE_BY_RCU.       
568 //                                                
569                                                   
570 // Item to look up in a typesafe manner.  Arra    
571 struct refscale_typesafe {                        
572         atomic_t rts_refctr;  // Used by all f    
573         spinlock_t rts_lock;                      
574         seqlock_t rts_seqlock;                    
575         unsigned int a;                           
576         unsigned int b;                           
577 };                                                
578                                                   
579 static struct kmem_cache *typesafe_kmem_cachep    
580 static struct refscale_typesafe **rtsarray;       
581 static long rtsarray_size;                        
582 static DEFINE_TORTURE_RANDOM_PERCPU(refscale_r    
583 static bool (*rts_acquire)(struct refscale_typ    
584 static bool (*rts_release)(struct refscale_typ    
585                                                   
586 // Conditionally acquire an explicit in-struct    
587 static bool typesafe_ref_acquire(struct refsca    
588 {                                                 
589         return atomic_inc_not_zero(&rtsp->rts_    
590 }                                                 
591                                                   
592 // Unconditionally release an explicit in-stru    
593 static bool typesafe_ref_release(struct refsca    
594 {                                                 
595         if (!atomic_dec_return(&rtsp->rts_refc    
596                 WRITE_ONCE(rtsp->a, rtsp->a +     
597                 kmem_cache_free(typesafe_kmem_    
598         }                                         
599         return true;                              
600 }                                                 
601                                                   
602 // Unconditionally acquire an explicit in-stru    
603 static bool typesafe_lock_acquire(struct refsc    
604 {                                                 
605         spin_lock(&rtsp->rts_lock);               
606         return true;                              
607 }                                                 
608                                                   
609 // Unconditionally release an explicit in-stru    
610 static bool typesafe_lock_release(struct refsc    
611 {                                                 
612         spin_unlock(&rtsp->rts_lock);             
613         return true;                              
614 }                                                 
615                                                   
616 // Unconditionally acquire an explicit in-stru    
617 static bool typesafe_seqlock_acquire(struct re    
618 {                                                 
619         *start = read_seqbegin(&rtsp->rts_seql    
620         return true;                              
621 }                                                 
622                                                   
623 // Conditionally release an explicit in-struct    
624 // true if this release was successful, that i    
625 static bool typesafe_seqlock_release(struct re    
626 {                                                 
627         return !read_seqretry(&rtsp->rts_seqlo    
628 }                                                 
629                                                   
630 // Do a read-side critical section with the sp    
631 // microseconds and nanoseconds inserted so as    
632 // of failure.                                    
633 static void typesafe_delay_section(const int n    
634 {                                                 
635         unsigned int a;                           
636         unsigned int b;                           
637         int i;                                    
638         long idx;                                 
639         struct refscale_typesafe *rtsp;           
640         unsigned int start;                       
641                                                   
642         for (i = nloops; i >= 0; i--) {           
643                 preempt_disable();                
644                 idx = torture_random(this_cpu_    
645                 preempt_enable();                 
646 retry:                                            
647                 rcu_read_lock();                  
648                 rtsp = rcu_dereference(rtsarra    
649                 a = READ_ONCE(rtsp->a);           
650                 if (!rts_acquire(rtsp, &start)    
651                         rcu_read_unlock();        
652                         goto retry;               
653                 }                                 
654                 if (a != READ_ONCE(rtsp->a)) {    
655                         (void)rts_release(rtsp    
656                         rcu_read_unlock();        
657                         goto retry;               
658                 }                                 
659                 un_delay(udl, ndl);               
660                 b = READ_ONCE(rtsp->a);           
661                 // Remember, seqlock read-side    
662                 if (!rts_release(rtsp, start))    
663                         rcu_read_unlock();        
664                         goto retry;               
665                 }                                 
666                 WARN_ONCE(a != b, "Re-read of     
667                 b = rtsp->b;                      
668                 rcu_read_unlock();                
669                 WARN_ON_ONCE(a * a != b);         
670         }                                         
671 }                                                 
672                                                   
673 // Because the acquisition and release methods    
674 // is no point in optimizing away the un_delay    
675 // Thus simply define typesafe_read_section()     
676 // typesafe_delay_section().                      
677 static void typesafe_read_section(const int nl    
678 {                                                 
679         typesafe_delay_section(nloops, 0, 0);     
680 }                                                 
681                                                   
682 // Allocate and initialize one refscale_typesa    
683 static struct refscale_typesafe *typesafe_allo    
684 {                                                 
685         struct refscale_typesafe *rtsp;           
686                                                   
687         rtsp = kmem_cache_alloc(typesafe_kmem_    
688         if (!rtsp)                                
689                 return NULL;                      
690         atomic_set(&rtsp->rts_refctr, 1);         
691         WRITE_ONCE(rtsp->a, rtsp->a + 1);         
692         WRITE_ONCE(rtsp->b, rtsp->a * rtsp->a)    
693         return rtsp;                              
694 }                                                 
695                                                   
696 // Slab-allocator constructor for refscale_typ    
697 // out of a new slab of system memory.            
698 static void refscale_typesafe_ctor(void *rtsp_    
699 {                                                 
700         struct refscale_typesafe *rtsp = rtsp_    
701                                                   
702         spin_lock_init(&rtsp->rts_lock);          
703         seqlock_init(&rtsp->rts_seqlock);         
704         preempt_disable();                        
705         rtsp->a = torture_random(this_cpu_ptr(    
706         preempt_enable();                         
707 }                                                 
708                                                   
709 static const struct ref_scale_ops typesafe_ref    
710 static const struct ref_scale_ops typesafe_loc    
711 static const struct ref_scale_ops typesafe_seq    
712                                                   
713 // Initialize for a typesafe test.                
714 static bool typesafe_init(void)                   
715 {                                                 
716         long idx;                                 
717         long si = lookup_instances;               
718                                                   
719         typesafe_kmem_cachep = kmem_cache_crea    
720                                                   
721                                                   
722         if (!typesafe_kmem_cachep)                
723                 return false;                     
724         if (si < 0)                               
725                 si = -si * nr_cpu_ids;            
726         else if (si == 0)                         
727                 si = nr_cpu_ids;                  
728         rtsarray_size = si;                       
729         rtsarray = kcalloc(si, sizeof(*rtsarra    
730         if (!rtsarray)                            
731                 return false;                     
732         for (idx = 0; idx < rtsarray_size; idx    
733                 rtsarray[idx] = typesafe_alloc    
734                 if (!rtsarray[idx])               
735                         return false;             
736         }                                         
737         if (cur_ops == &typesafe_ref_ops) {       
738                 rts_acquire = typesafe_ref_acq    
739                 rts_release = typesafe_ref_rel    
740         } else if (cur_ops == &typesafe_lock_o    
741                 rts_acquire = typesafe_lock_ac    
742                 rts_release = typesafe_lock_re    
743         } else if (cur_ops == &typesafe_seqloc    
744                 rts_acquire = typesafe_seqlock    
745                 rts_release = typesafe_seqlock    
746         } else {                                  
747                 WARN_ON_ONCE(1);                  
748                 return false;                     
749         }                                         
750         return true;                              
751 }                                                 
752                                                   
753 // Clean up after a typesafe test.                
754 static void typesafe_cleanup(void)                
755 {                                                 
756         long idx;                                 
757                                                   
758         if (rtsarray) {                           
759                 for (idx = 0; idx < rtsarray_s    
760                         kmem_cache_free(typesa    
761                 kfree(rtsarray);                  
762                 rtsarray = NULL;                  
763                 rtsarray_size = 0;                
764         }                                         
765         kmem_cache_destroy(typesafe_kmem_cache    
766         typesafe_kmem_cachep = NULL;              
767         rts_acquire = NULL;                       
768         rts_release = NULL;                       
769 }                                                 
770                                                   
771 // The typesafe_init() function distinguishes     
772 static const struct ref_scale_ops typesafe_ref    
773         .init           = typesafe_init,          
774         .cleanup        = typesafe_cleanup,       
775         .readsection    = typesafe_read_sectio    
776         .delaysection   = typesafe_delay_secti    
777         .name           = "typesafe_ref"          
778 };                                                
779                                                   
780 static const struct ref_scale_ops typesafe_loc    
781         .init           = typesafe_init,          
782         .cleanup        = typesafe_cleanup,       
783         .readsection    = typesafe_read_sectio    
784         .delaysection   = typesafe_delay_secti    
785         .name           = "typesafe_lock"         
786 };                                                
787                                                   
788 static const struct ref_scale_ops typesafe_seq    
789         .init           = typesafe_init,          
790         .cleanup        = typesafe_cleanup,       
791         .readsection    = typesafe_read_sectio    
792         .delaysection   = typesafe_delay_secti    
793         .name           = "typesafe_seqlock"      
794 };                                                
795                                                   
796 static void rcu_scale_one_reader(void)            
797 {                                                 
798         if (readdelay <= 0)                       
799                 cur_ops->readsection(loops);      
800         else                                      
801                 cur_ops->delaysection(loops, r    
802 }                                                 
803                                                   
804 // Reader kthread.  Repeatedly does empty RCU     
805 // critical section, minimizing update-side in    
806 static int                                        
807 ref_scale_reader(void *arg)                       
808 {                                                 
809         unsigned long flags;                      
810         long me = (long)arg;                      
811         struct reader_task *rt = &(reader_task    
812         u64 start;                                
813         s64 duration;                             
814                                                   
815         VERBOSE_SCALEOUT_BATCH("ref_scale_read    
816         WARN_ON_ONCE(set_cpus_allowed_ptr(curr    
817         set_user_nice(current, MAX_NICE);         
818         atomic_inc(&n_init);                      
819         if (holdoff)                              
820                 schedule_timeout_interruptible    
821 repeat:                                           
822         VERBOSE_SCALEOUT_BATCH("ref_scale_read    
823                                                   
824         // Wait for signal that this reader ca    
825         wait_event(rt->wq, (atomic_read(&nread    
826                            torture_must_stop()    
827                                                   
828         if (torture_must_stop())                  
829                 goto end;                         
830                                                   
831         // Make sure that the CPU is affinitiz    
832         WARN_ON_ONCE(raw_smp_processor_id() !=    
833                                                   
834         WRITE_ONCE(rt->start_reader, 0);          
835         if (!atomic_dec_return(&n_started))       
836                 while (atomic_read_acquire(&n_    
837                         cpu_relax();              
838                                                   
839         VERBOSE_SCALEOUT_BATCH("ref_scale_read    
840                                                   
841                                                   
842         // To reduce noise, do an initial cach    
843         // in, and then keep warming until eve    
844         rcu_scale_one_reader();                   
845         if (!atomic_dec_return(&n_warmedup))      
846                 while (atomic_read_acquire(&n_    
847                         rcu_scale_one_reader()    
848         // Also keep interrupts disabled.  Thi    
849         // of preventing entries into slow pat    
850         local_irq_save(flags);                    
851         start = ktime_get_mono_fast_ns();         
852                                                   
853         rcu_scale_one_reader();                   
854                                                   
855         duration = ktime_get_mono_fast_ns() -     
856         local_irq_restore(flags);                 
857                                                   
858         rt->last_duration_ns = WARN_ON_ONCE(du    
859         // To reduce runtime-skew noise, do ma    
860         // everyone is done.                      
861         if (!atomic_dec_return(&n_cooleddown))    
862                 while (atomic_read_acquire(&n_    
863                         rcu_scale_one_reader()    
864                                                   
865         if (atomic_dec_and_test(&nreaders_exp)    
866                 wake_up(&main_wq);                
867                                                   
868         VERBOSE_SCALEOUT_BATCH("ref_scale_read    
869                                 me, exp_idx, a    
870                                                   
871         if (!torture_must_stop())                 
872                 goto repeat;                      
873 end:                                              
874         torture_kthread_stopping("ref_scale_re    
875         return 0;                                 
876 }                                                 
877                                                   
878 static void reset_readers(void)                   
879 {                                                 
880         int i;                                    
881         struct reader_task *rt;                   
882                                                   
883         for (i = 0; i < nreaders; i++) {          
884                 rt = &(reader_tasks[i]);          
885                                                   
886                 rt->last_duration_ns = 0;         
887         }                                         
888 }                                                 
889                                                   
890 // Print the results of each reader and return    
891 static u64 process_durations(int n)               
892 {                                                 
893         int i;                                    
894         struct reader_task *rt;                   
895         struct seq_buf s;                         
896         char *buf;                                
897         u64 sum = 0;                              
898                                                   
899         buf = kmalloc(800 + 64, GFP_KERNEL);      
900         if (!buf)                                 
901                 return 0;                         
902         seq_buf_init(&s, buf, 800 + 64);          
903                                                   
904         seq_buf_printf(&s, "Experiment #%d (Fo    
905                        exp_idx);                  
906                                                   
907         for (i = 0; i < n && !torture_must_sto    
908                 rt = &(reader_tasks[i]);          
909                                                   
910                 if (i % 5 == 0)                   
911                         seq_buf_putc(&s, '\n')    
912                                                   
913                 if (seq_buf_used(&s) >= 800) {    
914                         pr_alert("%s", seq_buf    
915                         seq_buf_clear(&s);        
916                 }                                 
917                                                   
918                 seq_buf_printf(&s, "%d: %llu\t    
919                                                   
920                 sum += rt->last_duration_ns;      
921         }                                         
922         pr_alert("%s\n", seq_buf_str(&s));        
923                                                   
924         kfree(buf);                               
925         return sum;                               
926 }                                                 
927                                                   
928 // The main_func is the main orchestrator, it     
929 // experiments.  For every experiment, it orde    
930 // involved to start and waits for them to fin    
931 // then reads their timestamps and starts the     
932 // experiment progresses from 1 concurrent rea    
933 // point all the timestamps are printed.          
934 static int main_func(void *arg)                   
935 {                                                 
936         int exp, r;                               
937         char buf1[64];                            
938         char *buf;                                
939         u64 *result_avg;                          
940                                                   
941         set_cpus_allowed_ptr(current, cpumask_    
942         set_user_nice(current, MAX_NICE);         
943                                                   
944         VERBOSE_SCALEOUT("main_func task start    
945         result_avg = kzalloc(nruns * sizeof(*r    
946         buf = kzalloc(800 + 64, GFP_KERNEL);      
947         if (!result_avg || !buf) {                
948                 SCALEOUT_ERRSTRING("out of mem    
949                 goto oom_exit;                    
950         }                                         
951         if (holdoff)                              
952                 schedule_timeout_interruptible    
953                                                   
954         // Wait for all threads to start.         
955         atomic_inc(&n_init);                      
956         while (atomic_read(&n_init) < nreaders    
957                 schedule_timeout_uninterruptib    
958                                                   
959         // Start exp readers up per experiment    
960         for (exp = 0; exp < nruns && !torture_    
961                 if (torture_must_stop())          
962                         goto end;                 
963                                                   
964                 reset_readers();                  
965                 atomic_set(&nreaders_exp, nrea    
966                 atomic_set(&n_started, nreader    
967                 atomic_set(&n_warmedup, nreade    
968                 atomic_set(&n_cooleddown, nrea    
969                                                   
970                 exp_idx = exp;                    
971                                                   
972                 for (r = 0; r < nreaders; r++)    
973                         smp_store_release(&rea    
974                         wake_up(&reader_tasks[    
975                 }                                 
976                                                   
977                 VERBOSE_SCALEOUT("main_func: e    
978                                 nreaders);        
979                                                   
980                 wait_event(main_wq,               
981                            !atomic_read(&nread    
982                                                   
983                 VERBOSE_SCALEOUT("main_func: e    
984                                                   
985                 if (torture_must_stop())          
986                         goto end;                 
987                                                   
988                 result_avg[exp] = div_u64(1000    
989         }                                         
990                                                   
991         // Print the average of all experiment    
992         SCALEOUT("END OF TEST. Calculating ave    
993                                                   
994         pr_alert("Runs\tTime(ns)\n");             
995         for (exp = 0; exp < nruns; exp++) {       
996                 u64 avg;                          
997                 u32 rem;                          
998                                                   
999                 avg = div_u64_rem(result_avg[e    
1000                 sprintf(buf1, "%d\t%llu.%03u\    
1001                 strcat(buf, buf1);               
1002                 if (strlen(buf) >= 800) {        
1003                         pr_alert("%s", buf);     
1004                         buf[0] = 0;              
1005                 }                                
1006         }                                        
1007                                                  
1008         pr_alert("%s", buf);                     
1009                                                  
1010 oom_exit:                                        
1011         // This will shutdown everything incl    
1012         if (shutdown) {                          
1013                 shutdown_start = 1;              
1014                 wake_up(&shutdown_wq);           
1015         }                                        
1016                                                  
1017         // Wait for torture to stop us           
1018         while (!torture_must_stop())             
1019                 schedule_timeout_uninterrupti    
1020                                                  
1021 end:                                             
1022         torture_kthread_stopping("main_func")    
1023         kfree(result_avg);                       
1024         kfree(buf);                              
1025         return 0;                                
1026 }                                                
1027                                                  
1028 static void                                      
1029 ref_scale_print_module_parms(const struct ref    
1030 {                                                
1031         pr_alert("%s" SCALE_FLAG                 
1032                  "--- %s:  verbose=%d verbose    
1033                  verbose, verbose_batched, sh    
1034 }                                                
1035                                                  
1036 static void                                      
1037 ref_scale_cleanup(void)                          
1038 {                                                
1039         int i;                                   
1040                                                  
1041         if (torture_cleanup_begin())             
1042                 return;                          
1043                                                  
1044         if (!cur_ops) {                          
1045                 torture_cleanup_end();           
1046                 return;                          
1047         }                                        
1048                                                  
1049         if (reader_tasks) {                      
1050                 for (i = 0; i < nreaders; i++    
1051                         torture_stop_kthread(    
1052                                                  
1053         }                                        
1054         kfree(reader_tasks);                     
1055                                                  
1056         torture_stop_kthread("main_task", mai    
1057         kfree(main_task);                        
1058                                                  
1059         // Do scale-type-specific cleanup ope    
1060         if (cur_ops->cleanup != NULL)            
1061                 cur_ops->cleanup();              
1062                                                  
1063         torture_cleanup_end();                   
1064 }                                                
1065                                                  
1066 // Shutdown kthread.  Just waits to be awaken    
1067 static int                                       
1068 ref_scale_shutdown(void *arg)                    
1069 {                                                
1070         wait_event_idle(shutdown_wq, shutdown    
1071                                                  
1072         smp_mb(); // Wake before output.         
1073         ref_scale_cleanup();                     
1074         kernel_power_off();                      
1075                                                  
1076         return -EINVAL;                          
1077 }                                                
1078                                                  
1079 static int __init                                
1080 ref_scale_init(void)                             
1081 {                                                
1082         long i;                                  
1083         int firsterr = 0;                        
1084         static const struct ref_scale_ops *sc    
1085                 &rcu_ops, &srcu_ops, RCU_TRAC    
1086                 &rwsem_ops, &lock_ops, &lock_    
1087                 &typesafe_ref_ops, &typesafe_    
1088         };                                       
1089                                                  
1090         if (!torture_init_begin(scale_type, v    
1091                 return -EBUSY;                   
1092                                                  
1093         for (i = 0; i < ARRAY_SIZE(scale_ops)    
1094                 cur_ops = scale_ops[i];          
1095                 if (strcmp(scale_type, cur_op    
1096                         break;                   
1097         }                                        
1098         if (i == ARRAY_SIZE(scale_ops)) {        
1099                 pr_alert("rcu-scale: invalid     
1100                 pr_alert("rcu-scale types:");    
1101                 for (i = 0; i < ARRAY_SIZE(sc    
1102                         pr_cont(" %s", scale_    
1103                 pr_cont("\n");                   
1104                 firsterr = -EINVAL;              
1105                 cur_ops = NULL;                  
1106                 goto unwind;                     
1107         }                                        
1108         if (cur_ops->init)                       
1109                 if (!cur_ops->init()) {          
1110                         firsterr = -EUCLEAN;     
1111                         goto unwind;             
1112                 }                                
1113                                                  
1114         ref_scale_print_module_parms(cur_ops,    
1115                                                  
1116         // Shutdown task                         
1117         if (shutdown) {                          
1118                 init_waitqueue_head(&shutdown    
1119                 firsterr = torture_create_kth    
1120                                                  
1121                 if (torture_init_error(firste    
1122                         goto unwind;             
1123                 schedule_timeout_uninterrupti    
1124         }                                        
1125                                                  
1126         // Reader tasks (default to ~75% of o    
1127         if (nreaders < 0)                        
1128                 nreaders = (num_online_cpus()    
1129         if (WARN_ONCE(loops <= 0, "%s: loops     
1130                 loops = 1;                       
1131         if (WARN_ONCE(nreaders <= 0, "%s: nre    
1132                 nreaders = 1;                    
1133         if (WARN_ONCE(nruns <= 0, "%s: nruns     
1134                 nruns = 1;                       
1135         reader_tasks = kcalloc(nreaders, size    
1136                                GFP_KERNEL);      
1137         if (!reader_tasks) {                     
1138                 SCALEOUT_ERRSTRING("out of me    
1139                 firsterr = -ENOMEM;              
1140                 goto unwind;                     
1141         }                                        
1142                                                  
1143         VERBOSE_SCALEOUT("Starting %d reader     
1144                                                  
1145         for (i = 0; i < nreaders; i++) {         
1146                 init_waitqueue_head(&reader_t    
1147                 firsterr = torture_create_kth    
1148                                                  
1149                 if (torture_init_error(firste    
1150                         goto unwind;             
1151         }                                        
1152                                                  
1153         // Main Task                             
1154         init_waitqueue_head(&main_wq);           
1155         firsterr = torture_create_kthread(mai    
1156         if (torture_init_error(firsterr))        
1157                 goto unwind;                     
1158                                                  
1159         torture_init_end();                      
1160         return 0;                                
1161                                                  
1162 unwind:                                          
1163         torture_init_end();                      
1164         ref_scale_cleanup();                     
1165         if (shutdown) {                          
1166                 WARN_ON(!IS_MODULE(CONFIG_RCU    
1167                 kernel_power_off();              
1168         }                                        
1169         return firsterr;                         
1170 }                                                
1171                                                  
1172 module_init(ref_scale_init);                     
1173 module_exit(ref_scale_cleanup);                  
1174                                                  

~ [ source navigation ] ~ [ diff markup ] ~ [ identifier search ] ~

kernel.org | git.kernel.org | LWN.net | Project Home | SVN repository | Mail admin

Linux® is a registered trademark of Linus Torvalds in the United States and other countries.
TOMOYO® is a registered trademark of NTT DATA CORPORATION.

sflogo.php