  * for each kernfs_node with one or more open files.
  *
  * kernfs_node->attr.open points to kernfs_open_node.  attr.open is
- * protected by kernfs_open_node_lock.
+ * RCU protected.
  *
  * filp->private_data points to seq_file whose ->private points to
  * kernfs_open_file.  kernfs_open_files are chained at
  * kernfs_open_node->files, which is protected by kernfs_open_file_mutex.
  */
-static DEFINE_SPINLOCK(kernfs_open_node_lock);
 static DEFINE_MUTEX(kernfs_open_file_mutex);
 
 struct kernfs_open_node {
+	struct rcu_head		rcu_head;
 	atomic_t		event;
 	wait_queue_head_t	poll;
 	struct list_head	files; /* goes through kernfs_open_file.list */
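The added rcu_head is what later lets kernfs_unlink_open_file() retire a kernfs_open_node with kfree_rcu(). For reference, the publish/read/retire lifecycle that ->attr.open adopts looks like the following in isolation. This is a minimal kernel-style sketch built around a hypothetical cfg object; none of these names exist in kernfs:

#include <linux/errno.h>
#include <linux/mutex.h>
#include <linux/rcupdate.h>
#include <linux/slab.h>

struct cfg {
	int value;
	struct rcu_head rcu_head;	/* storage for kfree_rcu() */
};

static struct cfg __rcu *active_cfg;	/* the RCU-protected pointer */
static DEFINE_MUTEX(cfg_mutex);		/* serializes all updaters */

static int cfg_publish(int value)
{
	struct cfg *new = kmalloc(sizeof(*new), GFP_KERNEL);

	if (!new)
		return -ENOMEM;
	new->value = value;			/* initialize fully ... */

	mutex_lock(&cfg_mutex);
	rcu_assign_pointer(active_cfg, new);	/* ... then publish */
	mutex_unlock(&cfg_mutex);
	return 0;
}

static int cfg_read(void)
{
	struct cfg *c;
	int v = -1;

	rcu_read_lock();			/* lockless reader */
	c = rcu_dereference(active_cfg);
	if (c)
		v = c->value;
	rcu_read_unlock();
	return v;
}

static void cfg_retire(void)
{
	struct cfg *old;

	mutex_lock(&cfg_mutex);
	old = rcu_dereference_protected(active_cfg,
					lockdep_is_held(&cfg_mutex));
	rcu_assign_pointer(active_cfg, NULL);
	mutex_unlock(&cfg_mutex);
	if (old)
		kfree_rcu(old, rcu_head);	/* freed after a grace period */
}

The invariant: updaters serialize on the mutex, readers pay only rcu_read_lock(), and the object is freed no earlier than one grace period after it becomes unreachable.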
@@ -51,6 +51,52 @@ struct kernfs_open_node {
 static DEFINE_SPINLOCK(kernfs_notify_lock);
 static struct kernfs_node *kernfs_notify_list = KERNFS_NOTIFY_EOL;
 
+/**
+ * kernfs_deref_open_node - Get kernfs_open_node corresponding to @kn.
+ *
+ * @of: associated kernfs_open_file instance.
+ * @kn: target kernfs_node.
+ *
+ * Fetch and return ->attr.open of @kn if @of->list is non-empty.
+ * If @of->list is non-empty we can safely assume that @of is on the
+ * @kn->attr.open->files list and this guarantees that @kn->attr.open
+ * will not vanish, i.e. dereferencing outside the RCU read-side
+ * critical section is safe here.
+ *
+ * The caller needs to make sure that @of->list is not empty.
+ */
+static struct kernfs_open_node *
+kernfs_deref_open_node(struct kernfs_open_file *of, struct kernfs_node *kn)
+{
+	struct kernfs_open_node *on;
+
+	on = rcu_dereference_check(kn->attr.open, !list_empty(&of->list));
+
+	return on;
+}
+
+/**
+ * kernfs_deref_open_node_protected - Get kernfs_open_node corresponding to @kn
+ *
+ * @kn: target kernfs_node.
+ *
+ * Fetch and return ->attr.open of @kn when the caller holds
+ * kernfs_open_file_mutex.
+ *
+ * Update of ->attr.open happens under kernfs_open_file_mutex. So when
+ * the caller guarantees that this mutex is held, other updaters can't
+ * change ->attr.open and this means that we can safely deref ->attr.open
+ * outside the RCU read-side critical section.
+ *
+ * The caller needs to make sure that kernfs_open_file_mutex is held.
+ */
+static struct kernfs_open_node *
+kernfs_deref_open_node_protected(struct kernfs_node *kn)
+{
+	return rcu_dereference_protected(kn->attr.open,
+					 lockdep_is_held(&kernfs_open_file_mutex));
+}
+
 static struct kernfs_open_file *kernfs_of(struct file *file)
 {
 	return ((struct seq_file *)file->private_data)->private;
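A note on these two helpers: rcu_dereference_check() accepts any condition the caller can vouch for, not only a held lock, and CONFIG_PROVE_RCU splats when the pointer is fetched with the condition false outside an RCU read-side section. A hedged sketch of the same list-membership argument, using hypothetical owner/waiter names rather than kernfs ones:

#include <linux/list.h>
#include <linux/rcupdate.h>

struct item { struct list_head waiters; };
struct owner { struct item __rcu *item; };
struct waiter { struct list_head list; struct owner *owner; };

static struct item *waiter_item(struct waiter *w)
{
	/*
	 * While @w stays linked on the item's waiter list the item cannot
	 * be retired, so no rcu_read_lock() is needed; the second argument
	 * records that claim for CONFIG_PROVE_RCU to verify.
	 */
	return rcu_dereference_check(w->owner->item, !list_empty(&w->list));
}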
@@ -156,8 +202,12 @@ static void kernfs_seq_stop(struct seq_file *sf, void *v)
 static int kernfs_seq_show(struct seq_file *sf, void *v)
 {
 	struct kernfs_open_file *of = sf->private;
+	struct kernfs_open_node *on = kernfs_deref_open_node(of, of->kn);
 
-	of->event = atomic_read(&of->kn->attr.open->event);
+	if (!on)
+		return -EINVAL;
+
+	of->event = atomic_read(&on->event);
 
 	return of->kn->attr.ops->seq_show(sf, v);
 }
@@ -180,6 +230,7 @@ static ssize_t kernfs_file_read_iter(struct kiocb *iocb, struct iov_iter *iter)
 	struct kernfs_open_file *of = kernfs_of(iocb->ki_filp);
 	ssize_t len = min_t(size_t, iov_iter_count(iter), PAGE_SIZE);
 	const struct kernfs_ops *ops;
+	struct kernfs_open_node *on;
 	char *buf;
 
 	buf = of->prealloc_buf;
@@ -201,7 +252,15 @@ static ssize_t kernfs_file_read_iter(struct kiocb *iocb, struct iov_iter *iter)
 		goto out_free;
 	}
 
-	of->event = atomic_read(&of->kn->attr.open->event);
+	on = kernfs_deref_open_node(of, of->kn);
+	if (!on) {
+		len = -EINVAL;
+		mutex_unlock(&of->mutex);
+		goto out_free;
+	}
+
+	of->event = atomic_read(&on->event);
+
 	ops = kernfs_ops(of->kn);
 	if (ops->read)
 		len = ops->read(of, buf, len, iocb->ki_pos);
@@ -518,36 +577,29 @@ static int kernfs_get_open_node(struct kernfs_node *kn,
 {
 	struct kernfs_open_node *on, *new_on = NULL;
 
- retry:
 	mutex_lock(&kernfs_open_file_mutex);
-	spin_lock_irq(&kernfs_open_node_lock);
-
-	if (!kn->attr.open && new_on) {
-		kn->attr.open = new_on;
-		new_on = NULL;
-	}
-
-	on = kn->attr.open;
-	if (on)
-		list_add_tail(&of->list, &on->files);
-
-	spin_unlock_irq(&kernfs_open_node_lock);
-	mutex_unlock(&kernfs_open_file_mutex);
+	on = kernfs_deref_open_node_protected(kn);
 
 	if (on) {
-		kfree(new_on);
+		list_add_tail(&of->list, &on->files);
+		mutex_unlock(&kernfs_open_file_mutex);
 		return 0;
+	} else {
+		/* not there, initialize a new one */
+		new_on = kmalloc(sizeof(*new_on), GFP_KERNEL);
+		if (!new_on) {
+			mutex_unlock(&kernfs_open_file_mutex);
+			return -ENOMEM;
+		}
+		atomic_set(&new_on->event, 1);
+		init_waitqueue_head(&new_on->poll);
+		INIT_LIST_HEAD(&new_on->files);
+		list_add_tail(&of->list, &new_on->files);
+		rcu_assign_pointer(kn->attr.open, new_on);
 	}
+	mutex_unlock(&kernfs_open_file_mutex);
 
-	/* not there, initialize a new one and retry */
-	new_on = kmalloc(sizeof(*new_on), GFP_KERNEL);
-	if (!new_on)
-		return -ENOMEM;
-
-	atomic_set(&new_on->event, 1);
-	init_waitqueue_head(&new_on->poll);
-	INIT_LIST_HEAD(&new_on->files);
-	goto retry;
+	return 0;
 }
 
 /**
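The retry loop could go away because the allocation now happens with kernfs_open_file_mutex already held, so no other opener can race in a competing publish. The remaining subtlety is store ordering, which rcu_assign_pointer() provides. An illustrative sketch, with a hypothetical node type, of why a plain store would not do:

#include <linux/rcupdate.h>

struct node { int a; };
static struct node __rcu *gp;

static void publish(struct node *n)
{
	n->a = 1;
	/*
	 * rcu_assign_pointer() is a release store: the write to n->a above
	 * is ordered before the pointer becomes visible.  With a plain
	 * "gp = n" a concurrent rcu_dereference(gp) could observe the
	 * pointer yet still read uninitialized fields.
	 */
	rcu_assign_pointer(gp, n);
}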
@@ -566,24 +618,25 @@ static int kernfs_get_open_node(struct kernfs_node *kn,
 static void kernfs_unlink_open_file(struct kernfs_node *kn,
 				    struct kernfs_open_file *of)
 {
-	struct kernfs_open_node *on = kn->attr.open;
-	unsigned long flags;
+	struct kernfs_open_node *on;
 
 	mutex_lock(&kernfs_open_file_mutex);
-	spin_lock_irqsave(&kernfs_open_node_lock, flags);
+
+	on = kernfs_deref_open_node_protected(kn);
+	if (!on) {
+		mutex_unlock(&kernfs_open_file_mutex);
+		return;
+	}
 
 	if (of)
 		list_del(&of->list);
 
-	if (list_empty(&on->files))
-		kn->attr.open = NULL;
-	else
-		on = NULL;
+	if (list_empty(&on->files)) {
+		rcu_assign_pointer(kn->attr.open, NULL);
+		kfree_rcu(on, rcu_head);
+	}
 
-	spin_unlock_irqrestore(&kernfs_open_node_lock, flags);
 	mutex_unlock(&kernfs_open_file_mutex);
-
-	kfree(on);
 }
 
 static int kernfs_fop_open(struct inode *inode, struct file *file)
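kfree_rcu(on, rcu_head) is why struct kernfs_open_node gained an rcu_head: the second argument names that member, and the call behaves roughly like queueing a call_rcu() callback that frees the enclosing object once a grace period has elapsed. A hedged spelled-out equivalent, using a hypothetical blob type:

#include <linux/kernel.h>
#include <linux/rcupdate.h>
#include <linux/slab.h>

struct blob {
	int data;
	struct rcu_head rcu_head;
};

/* Runs from RCU callback context once all pre-existing readers are done. */
static void blob_free_cb(struct rcu_head *head)
{
	kfree(container_of(head, struct blob, rcu_head));
}

static void blob_retire(struct blob *b)
{
	call_rcu(&b->rcu_head, blob_free_cb);	/* ~ kfree_rcu(b, rcu_head) */
}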
@@ -773,17 +826,16 @@ void kernfs_drain_open_files(struct kernfs_node *kn)
 	 * check under kernfs_open_file_mutex will ensure bailing out if
 	 * ->attr.open became NULL while waiting for the mutex.
 	 */
-	if (!kn->attr.open)
+	if (!rcu_access_pointer(kn->attr.open))
 		return;
 
 	mutex_lock(&kernfs_open_file_mutex);
-	if (!kn->attr.open) {
+	on = kernfs_deref_open_node_protected(kn);
+	if (!on) {
 		mutex_unlock(&kernfs_open_file_mutex);
 		return;
 	}
 
-	on = kn->attr.open;
-
 	list_for_each_entry(of, &on->files, list) {
 		struct inode *inode = file_inode(of->file);
 
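The lockless fast path uses rcu_access_pointer() rather than rcu_dereference() because it only tests the pointer's value and never touches the pointee, so it needs neither rcu_read_lock() nor the mutex. A one-function sketch with hypothetical names:

#include <linux/rcupdate.h>
#include <linux/types.h>

struct thing;
struct holder { struct thing __rcu *thing; };

static bool holder_busy(struct holder *h)
{
	/* Value test only; the result must never be dereferenced. */
	return rcu_access_pointer(h->thing) != NULL;
}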
@@ -814,7 +866,10 @@ void kernfs_drain_open_files(struct kernfs_node *kn)
 __poll_t kernfs_generic_poll(struct kernfs_open_file *of, poll_table *wait)
 {
 	struct kernfs_node *kn = kernfs_dentry_node(of->file->f_path.dentry);
-	struct kernfs_open_node *on = kn->attr.open;
+	struct kernfs_open_node *on = kernfs_deref_open_node(of, kn);
+
+	if (!on)
+		return EPOLLERR;
 
 	poll_wait(of->file, &on->poll, wait);
 
@@ -921,13 +976,13 @@ void kernfs_notify(struct kernfs_node *kn)
 		return;
 
 	/* kick poll immediately */
-	spin_lock_irqsave(&kernfs_open_node_lock, flags);
-	on = kn->attr.open;
+	rcu_read_lock();
+	on = rcu_dereference(kn->attr.open);
 	if (on) {
 		atomic_inc(&on->event);
 		wake_up_interruptible(&on->poll);
 	}
-	spin_unlock_irqrestore(&kernfs_open_node_lock, flags);
+	rcu_read_unlock();
 
 	/* schedule work to kick fsnotify */
 	spin_lock_irqsave(&kernfs_notify_lock, flags);
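This reader is the payoff of the conversion: the irq-disabling spinlock and its flags bookkeeping become a plain read-side critical section that never blocks updaters, and the section pins @on so the kfree_rcu() issued by kernfs_unlink_open_file() cannot complete until rcu_read_unlock(). A minimal sketch of the same reader shape, around a hypothetical counter object:

#include <linux/atomic.h>
#include <linux/rcupdate.h>

struct counter {
	atomic_t hits;
	struct rcu_head rcu_head;	/* freed elsewhere via kfree_rcu() */
};

static struct counter __rcu *gcnt;

/* May race with an updater that retires gcnt; never blocks, never frees. */
static void counter_bump(void)
{
	struct counter *c;

	rcu_read_lock();
	c = rcu_dereference(gcnt);
	if (c)
		atomic_inc(&c->hits);	/* @c stays valid until unlock */
	rcu_read_unlock();
}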