LCOV - code coverage report
Current view: top level - fs - dcache.c (source / functions) Hit Total Coverage
Test: fstests of 6.5.0-rc3-djwx @ Mon Jul 31 20:08:22 PDT 2023 Lines: 1192 1448 82.3 %
Date: 2023-07-31 20:08:22 Functions: 96 111 86.5 %

          Line data    Source code
       1             : // SPDX-License-Identifier: GPL-2.0-only
       2             : /*
       3             :  * fs/dcache.c
       4             :  *
       5             :  * Complete reimplementation
       6             :  * (C) 1997 Thomas Schoebel-Theuer,
       7             :  * with heavy changes by Linus Torvalds
       8             :  */
       9             : 
      10             : /*
      11             :  * Notes on the allocation strategy:
      12             :  *
      13             :  * The dcache is a master of the icache - whenever a dcache entry
      14             :  * exists, the inode will always exist. "iput()" is done either when
      15             :  * the dcache entry is deleted or garbage collected.
      16             :  */
      17             : 
      18             : #include <linux/ratelimit.h>
      19             : #include <linux/string.h>
      20             : #include <linux/mm.h>
      21             : #include <linux/fs.h>
      22             : #include <linux/fscrypt.h>
      23             : #include <linux/fsnotify.h>
      24             : #include <linux/slab.h>
      25             : #include <linux/init.h>
      26             : #include <linux/hash.h>
      27             : #include <linux/cache.h>
      28             : #include <linux/export.h>
      29             : #include <linux/security.h>
      30             : #include <linux/seqlock.h>
      31             : #include <linux/memblock.h>
      32             : #include <linux/bit_spinlock.h>
      33             : #include <linux/rculist_bl.h>
      34             : #include <linux/list_lru.h>
      35             : #include "internal.h"
      36             : #include "mount.h"
      37             : 
      38             : /*
      39             :  * Usage:
      40             :  * dcache->d_inode->i_lock protects:
      41             :  *   - i_dentry, d_u.d_alias, d_inode of aliases
      42             :  * dcache_hash_bucket lock protects:
      43             :  *   - the dcache hash table
      44             :  * s_roots bl list spinlock protects:
      45             :  *   - the s_roots list (see __d_drop)
      46             :  * dentry->d_sb->s_dentry_lru_lock protects:
      47             :  *   - the dcache lru lists and counters
      48             :  * d_lock protects:
      49             :  *   - d_flags
      50             :  *   - d_name
      51             :  *   - d_lru
      52             :  *   - d_count
      53             :  *   - d_unhashed()
      54             :  *   - d_parent and d_subdirs
      55             :  *   - children's d_child and d_parent
      56             :  *   - d_u.d_alias, d_inode
      57             :  *
      58             :  * Ordering:
      59             :  * dentry->d_inode->i_lock
      60             :  *   dentry->d_lock
      61             :  *     dentry->d_sb->s_dentry_lru_lock
      62             :  *     dcache_hash_bucket lock
      63             :  *     s_roots lock
      64             :  *
      65             :  * If there is an ancestor relationship:
      66             :  * dentry->d_parent->...->d_parent->d_lock
      67             :  *   ...
      68             :  *     dentry->d_parent->d_lock
      69             :  *       dentry->d_lock
      70             :  *
      71             :  * If no ancestor relationship:
      72             :  * arbitrary, since it's serialized on rename_lock
      73             :  */
      74             : int sysctl_vfs_cache_pressure __read_mostly = 100;
      75             : EXPORT_SYMBOL_GPL(sysctl_vfs_cache_pressure);
      76             : 
      77             : __cacheline_aligned_in_smp DEFINE_SEQLOCK(rename_lock);
      78             : 
      79             : EXPORT_SYMBOL(rename_lock);
      80             : 
      81             : static struct kmem_cache *dentry_cache __read_mostly;
      82             : 
      83             : const struct qstr empty_name = QSTR_INIT("", 0);
      84             : EXPORT_SYMBOL(empty_name);
      85             : const struct qstr slash_name = QSTR_INIT("/", 1);
      86             : EXPORT_SYMBOL(slash_name);
      87             : const struct qstr dotdot_name = QSTR_INIT("..", 2);
      88             : EXPORT_SYMBOL(dotdot_name);
      89             : 
      90             : /*
      91             :  * This is the single most critical data structure when it comes
      92             :  * to the dcache: the hashtable for lookups. Somebody should try
      93             :  * to make this good - I've just made it work.
      94             :  *
      95             :  * This hash-function tries to avoid losing too many bits of hash
      96             :  * information, yet avoid using a prime hash-size or similar.
      97             :  */
      98             : 
      99             : static unsigned int d_hash_shift __read_mostly;
     100             : 
     101             : static struct hlist_bl_head *dentry_hashtable __read_mostly;
     102             : 
     103 41352253862 : static inline struct hlist_bl_head *d_hash(unsigned int hash)
     104             : {
     105 41352253862 :         return dentry_hashtable + (hash >> d_hash_shift);
     106             : }
     107             : 
     108             : #define IN_LOOKUP_SHIFT 10
     109             : static struct hlist_bl_head in_lookup_hashtable[1 << IN_LOOKUP_SHIFT];
     110             : 
     111             : static inline struct hlist_bl_head *in_lookup_hash(const struct dentry *parent,
     112             :                                         unsigned int hash)
     113             : {
     114  1671570144 :         hash += (unsigned long) parent / L1_CACHE_BYTES;
     115  1671570144 :         return in_lookup_hashtable + hash_32(hash, IN_LOOKUP_SHIFT);
     116             : }
     117             : 
     118             : struct dentry_stat_t {
     119             :         long nr_dentry;
     120             :         long nr_unused;
     121             :         long age_limit;         /* age in seconds */
     122             :         long want_pages;        /* pages requested by system */
     123             :         long nr_negative;       /* # of unused negative dentries */
     124             :         long dummy;             /* Reserved for future use */
     125             : };
     126             : 
     127             : static DEFINE_PER_CPU(long, nr_dentry);
     128             : static DEFINE_PER_CPU(long, nr_dentry_unused);
     129             : static DEFINE_PER_CPU(long, nr_dentry_negative);
     130             : 
     131             : #if defined(CONFIG_SYSCTL) && defined(CONFIG_PROC_FS)
     132             : /* Statistics gathering. */
     133             : static struct dentry_stat_t dentry_stat = {
     134             :         .age_limit = 45,
     135             : };
     136             : 
     137             : /*
     138             :  * Here we resort to our own counters instead of using generic per-cpu counters
     139             :  * for consistency with what the vfs inode code does. We are expected to harvest
     140             :  * better code and performance by having our own specialized counters.
     141             :  *
     142             :  * Please note that the loop is done over all possible CPUs, not over all online
     143             :  * CPUs. The reason for this is that we don't want to play games with CPUs going
     144             :  * on and off. If one of them goes off, we will just keep their counters.
     145             :  *
     146             :  * glommer: See cffbc8a for details, and if you ever intend to change this,
     147             :  * please update all vfs counters to match.
     148             :  */
     149         680 : static long get_nr_dentry(void)
     150             : {
     151         680 :         int i;
     152         680 :         long sum = 0;
     153        3400 :         for_each_possible_cpu(i)
     154        2720 :                 sum += per_cpu(nr_dentry, i);
     155         680 :         return sum < 0 ? 0 : sum;
     156             : }
     157             : 
     158         680 : static long get_nr_dentry_unused(void)
     159             : {
     160         680 :         int i;
     161         680 :         long sum = 0;
     162        3400 :         for_each_possible_cpu(i)
     163        2720 :                 sum += per_cpu(nr_dentry_unused, i);
     164         680 :         return sum < 0 ? 0 : sum;
     165             : }
     166             : 
     167         680 : static long get_nr_dentry_negative(void)
     168             : {
     169         680 :         int i;
     170         680 :         long sum = 0;
     171             : 
     172        3400 :         for_each_possible_cpu(i)
     173        2720 :                 sum += per_cpu(nr_dentry_negative, i);
     174         680 :         return sum < 0 ? 0 : sum;
     175             : }
     176             : 
     177         680 : static int proc_nr_dentry(struct ctl_table *table, int write, void *buffer,
     178             :                           size_t *lenp, loff_t *ppos)
     179             : {
     180         680 :         dentry_stat.nr_dentry = get_nr_dentry();
     181         680 :         dentry_stat.nr_unused = get_nr_dentry_unused();
     182         680 :         dentry_stat.nr_negative = get_nr_dentry_negative();
     183         680 :         return proc_doulongvec_minmax(table, write, buffer, lenp, ppos);
     184             : }
     185             : 
     186             : static struct ctl_table fs_dcache_sysctls[] = {
     187             :         {
     188             :                 .procname       = "dentry-state",
     189             :                 .data           = &dentry_stat,
     190             :                 .maxlen         = 6*sizeof(long),
     191             :                 .mode           = 0444,
     192             :                 .proc_handler   = proc_nr_dentry,
     193             :         },
     194             :         { }
     195             : };
     196             : 
     197           0 : static int __init init_fs_dcache_sysctls(void)
     198             : {
     199           0 :         register_sysctl_init("fs", fs_dcache_sysctls);
     200           0 :         return 0;
     201             : }
     202             : fs_initcall(init_fs_dcache_sysctls);
     203             : #endif
     204             : 
     205             : /*
     206             :  * Compare 2 name strings, return 0 if they match, otherwise non-zero.
     207             :  * The strings are both count bytes long, and count is non-zero.
     208             :  */
     209             : #ifdef CONFIG_DCACHE_WORD_ACCESS
     210             : 
     211             : #include <asm/word-at-a-time.h>
     212             : /*
     213             :  * NOTE! 'cs' and 'scount' come from a dentry, so it has an
     214             :  * aligned allocation for this particular component. We don't
     215             :  * strictly need the load_unaligned_zeropad() safety, but it
     216             :  * doesn't hurt either.
     217             :  *
     218             :  * In contrast, 'ct' and 'tcount' can be from a pathname, and do
     219             :  * need the careful unaligned handling.
     220             :  */
     221 37620498046 : static inline int dentry_string_cmp(const unsigned char *cs, const unsigned char *ct, unsigned tcount)
     222             : {
     223 39006098771 :         unsigned long a,b,mask;
     224             : 
     225 39006098771 :         for (;;) {
     226 39006098771 :                 a = read_word_at_a_time(cs);
     227 39006098771 :                 b = load_unaligned_zeropad(ct);
     228 39020946409 :                 if (tcount < sizeof(unsigned long))
     229             :                         break;
     230  1818729700 :                 if (unlikely(a != b))
     231             :                         return 1;
     232  1818729559 :                 cs += sizeof(unsigned long);
     233  1818729559 :                 ct += sizeof(unsigned long);
     234  1818729559 :                 tcount -= sizeof(unsigned long);
     235  1818729559 :                 if (!tcount)
     236             :                         return 0;
     237             :         }
     238 37202216709 :         mask = bytemask_from_count(tcount);
     239 37202216709 :         return unlikely(!!((a ^ b) & mask));
     240             : }
     241             : 
     242             : #else
     243             : 
     244             : static inline int dentry_string_cmp(const unsigned char *cs, const unsigned char *ct, unsigned tcount)
     245             : {
     246             :         do {
     247             :                 if (*cs != *ct)
     248             :                         return 1;
     249             :                 cs++;
     250             :                 ct++;
     251             :                 tcount--;
     252             :         } while (tcount);
     253             :         return 0;
     254             : }
     255             : 
     256             : #endif
     257             : 
     258             : static inline int dentry_cmp(const struct dentry *dentry, const unsigned char *ct, unsigned tcount)
     259             : {
     260             :         /*
     261             :          * Be careful about RCU walk racing with rename:
     262             :          * use 'READ_ONCE' to fetch the name pointer.
     263             :          *
     264             :          * NOTE! Even if a rename will mean that the length
     265             :          * was not loaded atomically, we don't care. The
     266             :          * RCU walk will check the sequence count eventually,
     267             :          * and catch it. And we won't overrun the buffer,
     268             :          * because we're reading the name pointer atomically,
     269             :          * and a dentry name is guaranteed to be properly
     270             :          * terminated with a NUL byte.
     271             :          *
     272             :          * End result: even if 'len' is wrong, we'll exit
     273             :          * early because the data cannot match (there can
     274             :          * be no NUL in the ct/tcount data)
     275             :          */
     276 37650401393 :         const unsigned char *cs = READ_ONCE(dentry->d_name.name);
     277             : 
     278 37650401393 :         return dentry_string_cmp(cs, ct, tcount);
     279             : }
     280             : 
     281             : struct external_name {
     282             :         union {
     283             :                 atomic_t count;
     284             :                 struct rcu_head head;
     285             :         } u;
     286             :         unsigned char name[];
     287             : };
     288             : 
     289             : static inline struct external_name *external_name(struct dentry *dentry)
     290             : {
     291     3882823 :         return container_of(dentry->d_name.name, struct external_name, name[0]);
     292             : }
     293             : 
     294   999954779 : static void __d_free(struct rcu_head *head)
     295             : {
     296  1029848128 :         struct dentry *dentry = container_of(head, struct dentry, d_u.d_rcu);
     297             : 
     298   999954779 :         kmem_cache_free(dentry_cache, dentry); 
     299    29895310 : }
     300             : 
     301     2746643 : static void __d_free_external(struct rcu_head *head)
     302             : {
     303     2746643 :         struct dentry *dentry = container_of(head, struct dentry, d_u.d_rcu);
     304     2746643 :         kfree(external_name(dentry));
     305     2746225 :         kmem_cache_free(dentry_cache, dentry);
     306     2746879 : }
     307             : 
     308             : static inline int dname_external(const struct dentry *dentry)
     309             : {
     310  1199066076 :         return dentry->d_name.name != dentry->d_iname;
     311             : }
     312             : 
     313    49557825 : void take_dentry_name_snapshot(struct name_snapshot *name, struct dentry *dentry)
     314             : {
     315    49557825 :         spin_lock(&dentry->d_lock);
     316    49558584 :         name->name = dentry->d_name;
     317    49558584 :         if (unlikely(dname_external(dentry))) {
     318     1137549 :                 atomic_inc(&external_name(dentry)->u.count);
     319             :         } else {
     320    96842070 :                 memcpy(name->inline_name, dentry->d_iname,
     321             :                        dentry->d_name.len + 1);
     322    48421035 :                 name->name.name = name->inline_name;
     323             :         }
     324    49558658 :         spin_unlock(&dentry->d_lock);
     325    49558358 : }
     326             : EXPORT_SYMBOL(take_dentry_name_snapshot);
     327             : 
     328    49559088 : void release_dentry_name_snapshot(struct name_snapshot *name)
     329             : {
     330    49559088 :         if (unlikely(name->name.name != name->inline_name)) {
     331     1137783 :                 struct external_name *p;
     332     1137783 :                 p = container_of(name->name.name, struct external_name, name[0]);
     333     1137783 :                 if (unlikely(atomic_dec_and_test(&p->u.count)))
     334     1136179 :                         kfree_rcu(p, u.head);
     335             :         }
     336    49559064 : }
     337             : EXPORT_SYMBOL(release_dentry_name_snapshot);
     338             : 
     339             : static inline void __d_set_inode_and_type(struct dentry *dentry,
     340             :                                           struct inode *inode,
     341             :                                           unsigned type_flags)
     342             : {
     343   244924370 :         unsigned flags;
     344             : 
     345   244924370 :         dentry->d_inode = inode;
     346   244924370 :         flags = READ_ONCE(dentry->d_flags);
     347   244924370 :         flags &= ~(DCACHE_ENTRY_TYPE | DCACHE_FALLTHRU);
     348   244924370 :         flags |= type_flags;
     349   489836961 :         smp_store_release(&dentry->d_flags, flags);
     350             : }
     351             : 
     352             : static inline void __d_clear_type_and_inode(struct dentry *dentry)
     353             : {
     354   245398548 :         unsigned flags = READ_ONCE(dentry->d_flags);
     355             : 
     356   245398548 :         flags &= ~(DCACHE_ENTRY_TYPE | DCACHE_FALLTHRU);
     357   245398548 :         WRITE_ONCE(dentry->d_flags, flags);
     358   245398548 :         dentry->d_inode = NULL;
     359   245398548 :         if (dentry->d_flags & DCACHE_LRU_LIST)
     360    50181593 :                 this_cpu_inc(nr_dentry_negative);
     361             : }
     362             : 
     363  1040476770 : static void dentry_free(struct dentry *dentry)
     364             : {
     365  1040476770 :         WARN_ON(!hlist_unhashed(&dentry->d_u.d_alias));
     366  1040476770 :         if (unlikely(dname_external(dentry))) {
     367     3810392 :                 struct external_name *p = external_name(dentry);
     368     3810392 :                 if (likely(atomic_dec_and_test(&p->u.count))) {
     369     2747596 :                         call_rcu(&dentry->d_u.d_rcu, __d_free_external);
     370     2747596 :                         return;
     371             :                 }
     372             :         }
     373             :         /* if dentry was never visible to RCU, immediate free is OK */
     374  1037729447 :         if (dentry->d_flags & DCACHE_NORCU)
     375    29893349 :                 __d_free(&dentry->d_u.d_rcu);
     376             :         else
     377  1007836098 :                 call_rcu(&dentry->d_u.d_rcu, __d_free);
     378             : }
     379             : 
     380             : /*
     381             :  * Release the dentry's inode, using the filesystem
     382             :  * d_iput() operation if defined.
     383             :  */
     384   245477817 : static void dentry_unlink_inode(struct dentry * dentry)
     385             :         __releases(dentry->d_lock)
     386             :         __releases(dentry->d_inode->i_lock)
     387             : {
     388   245477817 :         struct inode *inode = dentry->d_inode;
     389             : 
     390   245477817 :         raw_write_seqcount_begin(&dentry->d_seq);
     391   245398548 :         __d_clear_type_and_inode(dentry);
     392   245409565 :         hlist_del_init(&dentry->d_u.d_alias);
     393   245409565 :         raw_write_seqcount_end(&dentry->d_seq);
     394   245393160 :         spin_unlock(&dentry->d_lock);
     395   245618422 :         spin_unlock(&inode->i_lock);
     396   245637362 :         if (!inode->i_nlink)
     397    66118287 :                 fsnotify_inoderemove(inode);
     398   245598500 :         if (dentry->d_op && dentry->d_op->d_iput)
     399      799336 :                 dentry->d_op->d_iput(dentry, inode);
     400             :         else
     401   244799164 :                 iput(inode);
     402   245528919 : }
     403             : 
     404             : /*
     405             :  * The DCACHE_LRU_LIST bit is set whenever the 'd_lru' entry
     406             :  * is in use - which includes both the "real" per-superblock
     407             :  * LRU list _and_ the DCACHE_SHRINK_LIST use.
     408             :  *
     409             :  * The DCACHE_SHRINK_LIST bit is set whenever the dentry is
     410             :  * on the shrink list (ie not on the superblock LRU list).
     411             :  *
     412             :  * The per-cpu "nr_dentry_unused" counters are updated with
     413             :  * the DCACHE_LRU_LIST bit.
     414             :  *
     415             :  * The per-cpu "nr_dentry_negative" counters are only updated
     416             :  * when deleted from or added to the per-superblock LRU list, not
     417             :  * from/to the shrink list. That is to avoid an unneeded dec/inc
     418             :  * pair when moving from LRU to shrink list in select_collect().
     419             :  *
     420             :  * These helper functions make sure we always follow the
     421             :  * rules. d_lock must be held by the caller.
     422             :  */
     423             : #define D_FLAG_VERIFY(dentry,x) WARN_ON_ONCE(((dentry)->d_flags & (DCACHE_LRU_LIST | DCACHE_SHRINK_LIST)) != (x))
     424   145722629 : static void d_lru_add(struct dentry *dentry)
     425             : {
     426   145722629 :         D_FLAG_VERIFY(dentry, 0);
     427   145722629 :         dentry->d_flags |= DCACHE_LRU_LIST;
     428   145722629 :         this_cpu_inc(nr_dentry_unused);
     429   145622194 :         if (d_is_negative(dentry))
     430    37532481 :                 this_cpu_inc(nr_dentry_negative);
     431   145620273 :         WARN_ON_ONCE(!list_lru_add(&dentry->d_sb->s_dentry_lru, &dentry->d_lru));
     432   146469364 : }
     433             : 
     434   115862163 : static void d_lru_del(struct dentry *dentry)
     435             : {
     436   115862163 :         D_FLAG_VERIFY(dentry, DCACHE_LRU_LIST);
     437   115862163 :         dentry->d_flags &= ~DCACHE_LRU_LIST;
     438   115862163 :         this_cpu_dec(nr_dentry_unused);
     439   115862048 :         if (d_is_negative(dentry))
     440    63658788 :                 this_cpu_dec(nr_dentry_negative);
     441   115862036 :         WARN_ON_ONCE(!list_lru_del(&dentry->d_sb->s_dentry_lru, &dentry->d_lru));
     442   115863021 : }
     443             : 
     444   152970746 : static void d_shrink_del(struct dentry *dentry)
     445             : {
     446   152970746 :         D_FLAG_VERIFY(dentry, DCACHE_SHRINK_LIST | DCACHE_LRU_LIST);
     447   152970746 :         list_del_init(&dentry->d_lru);
     448   152969937 :         dentry->d_flags &= ~(DCACHE_SHRINK_LIST | DCACHE_LRU_LIST);
     449   152969937 :         this_cpu_dec(nr_dentry_unused);
     450   152969860 : }
     451             : 
     452   123130961 : static void d_shrink_add(struct dentry *dentry, struct list_head *list)
     453             : {
     454   123130961 :         D_FLAG_VERIFY(dentry, 0);
     455   123130961 :         list_add(&dentry->d_lru, list);
     456   123130888 :         dentry->d_flags |= DCACHE_SHRINK_LIST | DCACHE_LRU_LIST;
     457   123130888 :         this_cpu_inc(nr_dentry_unused);
     458   123130895 : }
     459             : 
     460             : /*
     461             :  * These can only be called under the global LRU lock, ie during the
     462             :  * callback for freeing the LRU list. "isolate" removes it from the
     463             :  * LRU lists entirely, while shrink_move moves it to the indicated
     464             :  * private list.
     465             :  */
     466      960736 : static void d_lru_isolate(struct list_lru_one *lru, struct dentry *dentry)
     467             : {
     468      960736 :         D_FLAG_VERIFY(dentry, DCACHE_LRU_LIST);
     469      960736 :         dentry->d_flags &= ~DCACHE_LRU_LIST;
     470      960736 :         this_cpu_dec(nr_dentry_unused);
     471      960736 :         if (d_is_negative(dentry))
     472           0 :                 this_cpu_dec(nr_dentry_negative);
     473      960736 :         list_lru_isolate(lru, &dentry->d_lru);
     474      960736 : }
     475             : 
     476    29841253 : static void d_lru_shrink_move(struct list_lru_one *lru, struct dentry *dentry,
     477             :                               struct list_head *list)
     478             : {
     479    29841253 :         D_FLAG_VERIFY(dentry, DCACHE_LRU_LIST);
     480    29841253 :         dentry->d_flags |= DCACHE_SHRINK_LIST;
     481    29841253 :         if (d_is_negative(dentry))
     482     2516367 :                 this_cpu_dec(nr_dentry_negative);
     483    29841253 :         list_lru_isolate_move(lru, &dentry->d_lru, list);
     484    29841253 : }
     485             : 
     486   998027901 : static void ___d_drop(struct dentry *dentry)
     487             : {
     488   998027901 :         struct hlist_bl_head *b;
     489             :         /*
     490             :          * Hashed dentries are normally on the dentry hashtable,
     491             :          * with the exception of those newly allocated by
     492             :          * d_obtain_root, which are always IS_ROOT:
     493             :          */
     494   998027901 :         if (unlikely(IS_ROOT(dentry)))
     495           0 :                 b = &dentry->d_sb->s_roots;
     496             :         else
     497   998027901 :                 b = d_hash(dentry->d_name.hash);
     498             : 
     499   998021904 :         hlist_bl_lock(b);
     500   998029521 :         __hlist_bl_del(&dentry->d_hash);
     501   998031013 :         hlist_bl_unlock(b);
     502   998026481 : }
     503             : 
     504  1052140376 : void __d_drop(struct dentry *dentry)
     505             : {
     506  1052140376 :         if (!d_unhashed(dentry)) {
     507   899096255 :                 ___d_drop(dentry);
     508   899091574 :                 dentry->d_hash.pprev = NULL;
     509   899091574 :                 write_seqcount_invalidate(&dentry->d_seq);
     510             :         }
     511  1052135709 : }
     512             : EXPORT_SYMBOL(__d_drop);
     513             : 
     514             : /**
     515             :  * d_drop - drop a dentry
     516             :  * @dentry: dentry to drop
     517             :  *
     518             :  * d_drop() unhashes the entry from the parent dentry hashes, so that it won't
     519             :  * be found through a VFS lookup any more. Note that this is different from
     520             :  * deleting the dentry - d_delete will try to mark the dentry negative if
     521             :  * possible, giving a successful _negative_ lookup, while d_drop will
     522             :  * just make the cache lookup fail.
     523             :  *
     524             :  * d_drop() is used mainly for stuff that wants to invalidate a dentry for some
     525             :  * reason (NFS timeouts or autofs deletes).
     526             :  *
     527             :  * __d_drop requires dentry->d_lock
     528             :  *
     529             :  * ___d_drop doesn't mark dentry as "unhashed"
     530             :  * (dentry->d_hash.pprev will be LIST_POISON2, not NULL).
     531             :  */
     532      162657 : void d_drop(struct dentry *dentry)
     533             : {
     534      162657 :         spin_lock(&dentry->d_lock);
     535      162658 :         __d_drop(dentry);
     536      162652 :         spin_unlock(&dentry->d_lock);
     537      162654 : }
     538             : EXPORT_SYMBOL(d_drop);
     539             : 
     540  1040208306 : static inline void dentry_unlist(struct dentry *dentry, struct dentry *parent)
     541             : {
     542  1040208306 :         struct dentry *next;
     543             :         /*
     544             :          * Inform d_walk() and shrink_dentry_list() that we are no longer
     545             :          * attached to the dentry tree
     546             :          */
     547  1040208306 :         dentry->d_flags |= DCACHE_DENTRY_KILLED;
     548  1040208306 :         if (unlikely(list_empty(&dentry->d_child)))
     549             :                 return;
     550   958263987 :         __list_del_entry(&dentry->d_child);
     551             :         /*
     552             :          * Cursors can move around the list of children.  While we'd been
     553             :          * a normal list member, it didn't matter - ->d_child.next would've
     554             :          * been updated.  However, from now on it won't be and for the
     555             :          * things like d_walk() it might end up with a nasty surprise.
     556             :          * Normally d_walk() doesn't care about cursors moving around -
     557             :          * ->d_lock on parent prevents that and since a cursor has no children
     558             :          * of its own, we get through it without ever unlocking the parent.
     559             :          * There is one exception, though - if we ascend from a child that
     560             :          * gets killed as soon as we unlock it, the next sibling is found
     561             :          * using the value left in its ->d_child.next.  And if _that_
     562             :          * pointed to a cursor, and cursor got moved (e.g. by lseek())
     563             :          * before d_walk() regains parent->d_lock, we'll end up skipping
     564             :          * everything the cursor had been moved past.
     565             :          *
     566             :          * Solution: make sure that the pointer left behind in ->d_child.next
     567             :          * points to something that won't be moving around.  I.e. skip the
     568             :          * cursors.
     569             :          */
     570   958263987 :         while (dentry->d_child.next != &parent->d_subdirs) {
     571   897797028 :                 next = list_entry(dentry->d_child.next, struct dentry, d_child);
     572   897797028 :                 if (likely(!(next->d_flags & DCACHE_DENTRY_CURSOR)))
     573             :                         break;
     574           0 :                 dentry->d_child.next = next->d_child.next;
     575             :         }
     576             : }
     577             : 
     578  1040418546 : static void __dentry_kill(struct dentry *dentry)
     579             : {
     580  1040418546 :         struct dentry *parent = NULL;
     581  1040418546 :         bool can_free = true;
     582  1040418546 :         if (!IS_ROOT(dentry))
     583   963941256 :                 parent = dentry->d_parent;
     584             : 
     585             :         /*
     586             :          * The dentry is now unrecoverably dead to the world.
     587             :          */
     588  1040418546 :         lockref_mark_dead(&dentry->d_lockref);
     589             : 
     590             :         /*
     591             :          * inform the fs via d_prune that this dentry is about to be
     592             :          * unhashed and destroyed.
     593             :          */
     594  1040405808 :         if (dentry->d_flags & DCACHE_OP_PRUNE)
     595        5018 :                 dentry->d_op->d_prune(dentry);
     596             : 
     597  1040405808 :         if (dentry->d_flags & DCACHE_LRU_LIST) {
     598     1780031 :                 if (!(dentry->d_flags & DCACHE_SHRINK_LIST))
     599     1780031 :                         d_lru_del(dentry);
     600             :         }
     601             :         /* if it was on the hash then remove it */
     602  1040405820 :         __d_drop(dentry);
     603  1040169648 :         dentry_unlist(dentry, parent);
     604  1040246263 :         if (parent)
     605   963921685 :                 spin_unlock(&parent->d_lock);
     606  1040269246 :         if (dentry->d_inode)
     607   186220041 :                 dentry_unlink_inode(dentry);
     608             :         else
     609   854049205 :                 spin_unlock(&dentry->d_lock);
     610  1040378975 :         this_cpu_dec(nr_dentry);
     611  1040348971 :         if (dentry->d_op && dentry->d_op->d_release)
     612     1357262 :                 dentry->d_op->d_release(dentry);
     613             : 
     614  1040348971 :         spin_lock(&dentry->d_lock);
     615  1040480024 :         if (dentry->d_flags & DCACHE_SHRINK_LIST) {
     616           0 :                 dentry->d_flags |= DCACHE_MAY_FREE;
     617           0 :                 can_free = false;
     618             :         }
     619  1040480024 :         spin_unlock(&dentry->d_lock);
     620  1040464681 :         if (likely(can_free))
     621  1040464681 :                 dentry_free(dentry);
     622  1040347022 :         cond_resched();
     623  1040391884 : }
     624             : 
     625     2753478 : static struct dentry *__lock_parent(struct dentry *dentry)
     626             : {
     627     2753478 :         struct dentry *parent;
     628     2753478 :         rcu_read_lock();
     629     2751911 :         spin_unlock(&dentry->d_lock);
     630     2759114 : again:
     631     2759114 :         parent = READ_ONCE(dentry->d_parent);
     632     2759114 :         spin_lock(&parent->d_lock);
     633             :         /*
     634             :          * We can't blindly lock dentry until we are sure
     635             :          * that we won't violate the locking order.
     636             :          * Any changes of dentry->d_parent must have
     637             :          * been done with parent->d_lock held, so
     638             :          * spin_lock() above is enough of a barrier
     639             :          * for checking if it's still our child.
     640             :          */
     641     2761891 :         if (unlikely(parent != dentry->d_parent)) {
     642           0 :                 spin_unlock(&parent->d_lock);
     643           0 :                 goto again;
     644             :         }
     645     2761891 :         rcu_read_unlock();
     646     2761891 :         if (parent != dentry)
     647     2761891 :                 spin_lock_nested(&dentry->d_lock, DENTRY_D_LOCK_NESTED);
     648             :         else
     649             :                 parent = NULL;
     650     2761891 :         return parent;
     651             : }
     652             : 
     653        8475 : static inline struct dentry *lock_parent(struct dentry *dentry)
     654             : {
     655        8475 :         struct dentry *parent = dentry->d_parent;
     656        8475 :         if (IS_ROOT(dentry))
     657             :                 return NULL;
     658           6 :         if (likely(spin_trylock(&parent->d_lock)))
     659             :                 return parent;
     660           0 :         return __lock_parent(dentry);
     661             : }
     662             : 
     663  2651405181 : static inline bool retain_dentry(struct dentry *dentry)
     664             : {
     665  2651405181 :         WARN_ON(d_in_lookup(dentry));
     666             : 
     667             :         /* Unreachable? Get rid of it */
     668  2651405181 :         if (unlikely(d_unhashed(dentry)))
     669             :                 return false;
     670             : 
     671  2498081784 :         if (unlikely(dentry->d_flags & DCACHE_DISCONNECTED))
     672             :                 return false;
     673             : 
     674  2498081784 :         if (unlikely(dentry->d_flags & DCACHE_OP_DELETE)) {
     675   958465046 :                 if (dentry->d_op->d_delete(dentry))
     676             :                         return false;
     677             :         }
     678             : 
     679  1760720506 :         if (unlikely(dentry->d_flags & DCACHE_DONTCACHE))
     680             :                 return false;
     681             : 
     682             :         /* retain; LRU fodder */
     683  1760720482 :         dentry->d_lockref.count--;
     684  1760720482 :         if (unlikely(!(dentry->d_flags & DCACHE_LRU_LIST)))
     685   145941966 :                 d_lru_add(dentry);
     686  1614778516 :         else if (unlikely(!(dentry->d_flags & DCACHE_REFERENCED)))
     687   109119127 :                 dentry->d_flags |= DCACHE_REFERENCED;
     688             :         return true;
     689             : }
     690             : 
     691   611061170 : void d_mark_dontcache(struct inode *inode)
     692             : {
     693   611061170 :         struct dentry *de;
     694             : 
     695   611061170 :         spin_lock(&inode->i_lock);
     696  1224018946 :         hlist_for_each_entry(de, &inode->i_dentry, d_u.d_alias) {
     697      199727 :                 spin_lock(&de->d_lock);
     698          24 :                 de->d_flags |= DCACHE_DONTCACHE;
     699          24 :                 spin_unlock(&de->d_lock);
     700             :         }
     701   611809758 :         inode->i_state |= I_DONTCACHE;
     702   611809758 :         spin_unlock(&inode->i_lock);
     703   611788319 : }
     704             : EXPORT_SYMBOL(d_mark_dontcache);
     705             : 
     706             : /*
     707             :  * Finish off a dentry we've decided to kill.
     708             :  * dentry->d_lock must be held, returns with it unlocked.
     709             :  * Returns dentry requiring refcount drop, or NULL if we're done.
     710             :  */
     711   887932970 : static struct dentry *dentry_kill(struct dentry *dentry)
     712             :         __releases(dentry->d_lock)
     713             : {
     714   887932970 :         struct inode *inode = dentry->d_inode;
     715   887932970 :         struct dentry *parent = NULL;
     716             : 
     717   987139908 :         if (inode && unlikely(!spin_trylock(&inode->i_lock)))
     718        8281 :                 goto slow_positive;
     719             : 
     720   888099038 :         if (!IS_ROOT(dentry)) {
     721   811597433 :                 parent = dentry->d_parent;
     722   811597433 :                 if (unlikely(!spin_trylock(&parent->d_lock))) {
     723     2754542 :                         parent = __lock_parent(dentry);
     724     2761891 :                         if (likely(inode || !dentry->d_inode))
     725     2761891 :                                 goto got_locks;
     726             :                         /* negative that became positive */
     727           0 :                         if (parent)
     728           0 :                                 spin_unlock(&parent->d_lock);
     729           0 :                         inode = dentry->d_inode;
     730           0 :                         goto slow_positive;
     731             :                 }
     732             :         }
     733   885504008 :         __dentry_kill(dentry);
     734   885504008 :         return parent;
     735             : 
     736        8281 : slow_positive:
     737        8281 :         spin_unlock(&dentry->d_lock);
     738        8241 :         spin_lock(&inode->i_lock);
     739        8475 :         spin_lock(&dentry->d_lock);
     740        8475 :         parent = lock_parent(dentry);
     741     2770366 : got_locks:
     742     2770366 :         if (unlikely(dentry->d_lockref.count != 1)) {
     743      286235 :                 dentry->d_lockref.count--;
     744     2484131 :         } else if (likely(!retain_dentry(dentry))) {
     745     2484131 :                 __dentry_kill(dentry);
     746     2484131 :                 return parent;
     747             :         }
     748             :         /* we are keeping it, after all */
     749      286235 :         if (inode)
     750           0 :                 spin_unlock(&inode->i_lock);
     751      286235 :         if (parent)
     752      286235 :                 spin_unlock(&parent->d_lock);
     753      286235 :         spin_unlock(&dentry->d_lock);
     754      286235 :         return NULL;
     755             : }
     756             : 
     757             : /*
     758             :  * Try to do a lockless dput(), and return whether that was successful.
     759             :  *
     760             :  * If unsuccessful, we return false, having already taken the dentry lock.
     761             :  *
     762             :  * The caller needs to hold the RCU read lock, so that the dentry is
     763             :  * guaranteed to stay around even if the refcount goes down to zero!
     764             :  */
     765 14013143547 : static inline bool fast_dput(struct dentry *dentry)
     766             : {
     767 14013143547 :         int ret;
     768 14013143547 :         unsigned int d_flags;
     769             : 
     770             :         /*
     771             :          * If we have a d_op->d_delete() operation, we should not
     772             :          * let the dentry count go to zero, so use "put_or_lock".
     773             :          */
     774 14013143547 :         if (unlikely(dentry->d_flags & DCACHE_OP_DELETE))
     775  7175446600 :                 return lockref_put_or_lock(&dentry->d_lockref);
     776             : 
     777             :         /*
     778             :          * .. otherwise, we can try to just decrement the
     779             :          * lockref optimistically.
     780             :          */
     781  6837696947 :         ret = lockref_put_return(&dentry->d_lockref);
     782             : 
     783             :         /*
     784             :          * If the lockref_put_return() failed due to the lock being held
     785             :          * by somebody else, the fast path has failed. We will need to
     786             :          * get the lock, and then check the count again.
     787             :          */
     788  6838105807 :         if (unlikely(ret < 0)) {
     789  6838105807 :                 spin_lock(&dentry->d_lock);
     790  6846445698 :                 if (dentry->d_lockref.count > 1) {
     791  5168317707 :                         dentry->d_lockref.count--;
     792  5168317707 :                         spin_unlock(&dentry->d_lock);
     793  5168317707 :                         return true;
     794             :                 }
     795             :                 return false;
     796             :         }
     797             : 
     798             :         /*
     799             :          * If we weren't the last ref, we're done.
     800             :          */
     801           0 :         if (ret)
     802             :                 return true;
     803             : 
     804             :         /*
     805             :          * Careful, careful. The reference count went down
     806             :          * to zero, but we don't hold the dentry lock, so
     807             :          * somebody else could get it again, and do another
     808             :          * dput(), and we need to not race with that.
     809             :          *
     810             :          * However, there is a very special and common case
     811             :          * where we don't care, because there is nothing to
     812             :          * do: the dentry is still hashed, it does not have
     813             :          * a 'delete' op, and it's referenced and already on
     814             :          * the LRU list.
     815             :          *
     816             :          * NOTE! Since we aren't locked, these values are
     817             :          * not "stable". However, it is sufficient that at
     818             :          * some point after we dropped the reference the
     819             :          * dentry was hashed and the flags had the proper
     820             :          * value. Other dentry users may have re-gotten
     821             :          * a reference to the dentry and changed that, but
     822             :          * our work is done - we can leave the dentry
     823             :          * around with a zero refcount.
     824             :          *
     825             :          * Nevertheless, there are two cases in which we should kill
     826             :          * the dentry anyway.
     827             :          * 1. free disconnected dentries as soon as their refcount
     828             :          *    reached zero.
     829             :          * 2. free dentries if they should not be cached.
     830             :          */
     831           0 :         smp_rmb();
     832           0 :         d_flags = READ_ONCE(dentry->d_flags);
     833           0 :         d_flags &= DCACHE_REFERENCED | DCACHE_LRU_LIST |
     834             :                         DCACHE_DISCONNECTED | DCACHE_DONTCACHE;
     835             : 
     836             :         /* Nothing to do? Dropping the reference was all we needed? */
     837           0 :         if (d_flags == (DCACHE_REFERENCED | DCACHE_LRU_LIST) && !d_unhashed(dentry))
     838             :                 return true;
     839             : 
     840             :         /*
     841             :          * Not the fast normal case? Get the lock. We've already decremented
     842             :          * the refcount, but we'll need to re-check the situation after
     843             :          * getting the lock.
     844             :          */
     845           0 :         spin_lock(&dentry->d_lock);
     846             : 
     847             :         /*
     848             :          * Did somebody else grab a reference to it in the meantime, and
     849             :          * we're no longer the last user after all? Alternatively, somebody
     850             :          * else could have killed it and marked it dead. Either way, we
     851             :          * don't need to do anything else.
     852             :          */
     853           0 :         if (dentry->d_lockref.count) {
     854           0 :                 spin_unlock(&dentry->d_lock);
     855           0 :                 return true;
     856             :         }
     857             : 
     858             :         /*
     859             :          * Re-get the reference we optimistically dropped. We hold the
     860             :          * lock, and we just tested that it was zero, so we can just
     861             :          * set it to 1.
     862             :          */
     863           0 :         dentry->d_lockref.count = 1;
     864           0 :         return false;
     865             : }
     866             : 
     867             : 
     868             : /* 
     869             :  * This is dput
     870             :  *
     871             :  * This is complicated by the fact that we do not want to put
     872             :  * dentries that are no longer on any hash chain on the unused
     873             :  * list: we'd much rather just get rid of them immediately.
     874             :  *
     875             :  * However, that implies that we have to traverse the dentry
     876             :  * tree upwards to the parents which might _also_ now be
     877             :  * scheduled for deletion (it may have been only waiting for
     878             :  * its last child to go away).
     879             :  *
     880             :  * This tail recursion is done by hand as we don't want to depend
     881             :  * on the compiler to always get this right (gcc generally doesn't).
     882             :  * Real recursion would eat up our stack space.
     883             :  */
     884             : 
     885             : /*
     886             :  * dput - release a dentry
     887             :  * @dentry: dentry to release 
     888             :  *
     889             :  * Release a dentry. This will drop the usage count and if appropriate
     890             :  * call the dentry unlink method as well as removing it from the queues and
     891             :  * releasing its resources. If the parent dentries were scheduled for release
     892             :  * they too may now get deleted.
     893             :  */
     894 18702385807 : void dput(struct dentry *dentry)
     895             : {
     896 19590557261 :         while (dentry) {
     897 14001746516 :                 might_sleep();
     898             : 
     899 14012832039 :                 rcu_read_lock();
     900 14003937411 :                 if (likely(fast_dput(dentry))) {
     901 11376298838 :                         rcu_read_unlock();
     902 11376298838 :                         return;
     903             :                 }
     904             : 
     905             :                 /* Slow case: now with the dentry lock held */
     906  2648620615 :                 rcu_read_unlock();
     907             : 
     908  2648731297 :                 if (likely(retain_dentry(dentry))) {
     909  1760101642 :                         spin_unlock(&dentry->d_lock);
     910  1760101642 :                         return;
     911             :                 }
     912             : 
     913   887825187 :                 dentry = dentry_kill(dentry);
     914             :         }
     915             : }
     916             : EXPORT_SYMBOL(dput);
     917             : 
     918   152393422 : static void __dput_to_list(struct dentry *dentry, struct list_head *list)
     919             : __must_hold(&dentry->d_lock)
     920             : {
     921   152393422 :         if (dentry->d_flags & DCACHE_SHRINK_LIST) {
     922             :                 /* let the owner of the list it's on deal with it */
     923       61814 :                 --dentry->d_lockref.count;
     924             :         } else {
     925   152331608 :                 if (dentry->d_flags & DCACHE_LRU_LIST)
     926      607645 :                         d_lru_del(dentry);
     927   152331758 :                 if (!--dentry->d_lockref.count)
     928    14114156 :                         d_shrink_add(dentry, list);
     929             :         }
     930   152393567 : }
     931             : 
     932      327677 : void dput_to_list(struct dentry *dentry, struct list_head *list)
     933             : {
     934      327677 :         rcu_read_lock();
     935      327677 :         if (likely(fast_dput(dentry))) {
     936      253826 :                 rcu_read_unlock();
     937      253826 :                 return;
     938             :         }
     939       73851 :         rcu_read_unlock();
     940       73851 :         if (!retain_dentry(dentry))
     941           0 :                 __dput_to_list(dentry, list);
     942       73851 :         spin_unlock(&dentry->d_lock);
     943             : }
     944             : 
     945             : /* This must be called with d_lock held */
     946             : static inline void __dget_dlock(struct dentry *dentry)
     947             : {
     948   952287050 :         dentry->d_lockref.count++;
     949             : }
     950             : 
     951             : static inline void __dget(struct dentry *dentry)
     952             : {
     953   194917063 :         lockref_get(&dentry->d_lockref);
     954             : }
     955             : 
     956   758540121 : struct dentry *dget_parent(struct dentry *dentry)
     957             : {
     958   758540121 :         int gotref;
     959   758540121 :         struct dentry *ret;
     960   758540121 :         unsigned seq;
     961             : 
     962             :         /*
     963             :          * Do optimistic parent lookup without any
     964             :          * locking.
     965             :          */
     966   758540121 :         rcu_read_lock();
     967   758109665 :         seq = raw_seqcount_begin(&dentry->d_seq);
     968   758100942 :         ret = READ_ONCE(dentry->d_parent);
     969   758100942 :         gotref = lockref_get_not_zero(&ret->d_lockref);
     970   759198688 :         rcu_read_unlock();
     971   759143151 :         if (likely(gotref)) {
     972   759143151 :                 if (!read_seqcount_retry(&dentry->d_seq, seq))
     973             :                         return ret;
     974          52 :                 dput(ret);
     975             :         }
     976             : 
     977           0 : repeat:
     978             :         /*
     979             :          * Don't need rcu_dereference because we re-check it was correct under
     980             :          * the lock.
     981             :          */
     982          52 :         rcu_read_lock();
     983          52 :         ret = dentry->d_parent;
     984          52 :         spin_lock(&ret->d_lock);
     985          52 :         if (unlikely(ret != dentry->d_parent)) {
     986           0 :                 spin_unlock(&ret->d_lock);
     987           0 :                 rcu_read_unlock();
     988           0 :                 goto repeat;
     989             :         }
     990          52 :         rcu_read_unlock();
     991          52 :         BUG_ON(!ret->d_lockref.count);
     992          52 :         ret->d_lockref.count++;
     993          52 :         spin_unlock(&ret->d_lock);
     994          52 :         return ret;
     995             : }
     996             : EXPORT_SYMBOL(dget_parent);
     997             : 
     998             : static struct dentry * __d_find_any_alias(struct inode *inode)
     999             : {
    1000   316294586 :         struct dentry *alias;
    1001             : 
    1002   316294586 :         if (hlist_empty(&inode->i_dentry))
    1003             :                 return NULL;
    1004   194917063 :         alias = hlist_entry(inode->i_dentry.first, struct dentry, d_u.d_alias);
    1005         813 :         __dget(alias);
    1006   194916250 :         return alias;
    1007             : }
    1008             : 
    1009             : /**
    1010             :  * d_find_any_alias - find any alias for a given inode
    1011             :  * @inode: inode to find an alias for
    1012             :  *
    1013             :  * If any aliases exist for the given inode, take and return a
    1014             :  * reference for one of them.  If no aliases exist, return %NULL.
    1015             :  */
    1016   238838133 : struct dentry *d_find_any_alias(struct inode *inode)
    1017             : {
    1018   238838133 :         struct dentry *de;
    1019             : 
    1020   238838133 :         spin_lock(&inode->i_lock);
    1021   241433629 :         de = __d_find_any_alias(inode);
    1022   240921375 :         spin_unlock(&inode->i_lock);
    1023   241413688 :         return de;
    1024             : }
    1025             : EXPORT_SYMBOL(d_find_any_alias);
    1026             : 
    1027       61549 : static struct dentry *__d_find_alias(struct inode *inode)
    1028             : {
    1029       61549 :         struct dentry *alias;
    1030             : 
    1031       61549 :         if (S_ISDIR(inode->i_mode))
    1032           0 :                 return __d_find_any_alias(inode);
    1033             : 
    1034      123098 :         hlist_for_each_entry(alias, &inode->i_dentry, d_u.d_alias) {
    1035       61549 :                 spin_lock(&alias->d_lock);
    1036       61557 :                 if (!d_unhashed(alias)) {
    1037       61557 :                         __dget_dlock(alias);
    1038       61557 :                         spin_unlock(&alias->d_lock);
    1039       61557 :                         return alias;
    1040             :                 }
    1041           0 :                 spin_unlock(&alias->d_lock);
    1042             :         }
    1043             :         return NULL;
    1044             : }
    1045             : 
    1046             : /**
    1047             :  * d_find_alias - grab a hashed alias of inode
    1048             :  * @inode: inode in question
    1049             :  *
    1050             :  * If inode has a hashed alias, or is a directory and has any alias,
    1051             :  * acquire the reference to alias and return it. Otherwise return NULL.
    1052             :  * Notice that if inode is a directory there can be only one alias and
    1053             :  * it can be unhashed only if it has no children, or if it is the root
    1054             :  * of a filesystem, or if the directory was renamed and d_revalidate
    1055             :  * was the first vfs operation to notice.
    1056             :  *
    1057             :  * If the inode has an IS_ROOT, DCACHE_DISCONNECTED alias, then prefer
    1058             :  * any other hashed alias over that one.
    1059             :  */
    1060       61548 : struct dentry *d_find_alias(struct inode *inode)
    1061             : {
    1062       61548 :         struct dentry *de = NULL;
    1063             : 
    1064       61548 :         if (!hlist_empty(&inode->i_dentry)) {
    1065       61539 :                 spin_lock(&inode->i_lock);
    1066       61553 :                 de = __d_find_alias(inode);
    1067       61556 :                 spin_unlock(&inode->i_lock);
    1068             :         }
    1069       61557 :         return de;
    1070             : }
    1071             : EXPORT_SYMBOL(d_find_alias);
    1072             : 
    1073             : /*
    1074             :  *  Caller MUST be holding rcu_read_lock() and be guaranteed
    1075             :  *  that inode won't get freed until rcu_read_unlock().
    1076             :  */
    1077           0 : struct dentry *d_find_alias_rcu(struct inode *inode)
    1078             : {
    1079           0 :         struct hlist_head *l = &inode->i_dentry;
    1080           0 :         struct dentry *de = NULL;
    1081             : 
    1082           0 :         spin_lock(&inode->i_lock);
    1083             :         // ->i_dentry and ->i_rcu are colocated, but the latter won't be
    1084             :         // used without having I_FREEING set, which means no aliases left
    1085           0 :         if (likely(!(inode->i_state & I_FREEING) && !hlist_empty(l))) {
    1086           0 :                 if (S_ISDIR(inode->i_mode)) {
    1087           0 :                         de = hlist_entry(l->first, struct dentry, d_u.d_alias);
    1088             :                 } else {
    1089           0 :                         hlist_for_each_entry(de, l, d_u.d_alias)
    1090           0 :                                 if (!d_unhashed(de))
    1091             :                                         break;
    1092             :                 }
    1093             :         }
    1094           0 :         spin_unlock(&inode->i_lock);
    1095           0 :         return de;
    1096             : }
    1097             : 
    1098             : /*
    1099             :  *      Try to kill dentries associated with this inode.
    1100             :  * WARNING: you must own a reference to inode.
    1101             :  */
    1102         170 : void d_prune_aliases(struct inode *inode)
    1103             : {
    1104         170 :         struct dentry *dentry;
    1105         170 : restart:
    1106         170 :         spin_lock(&inode->i_lock);
    1107         510 :         hlist_for_each_entry(dentry, &inode->i_dentry, d_u.d_alias) {
    1108         170 :                 spin_lock(&dentry->d_lock);
    1109         170 :                 if (!dentry->d_lockref.count) {
    1110           0 :                         struct dentry *parent = lock_parent(dentry);
    1111           0 :                         if (likely(!dentry->d_lockref.count)) {
    1112           0 :                                 __dentry_kill(dentry);
    1113           0 :                                 dput(parent);
    1114           0 :                                 goto restart;
    1115             :                         }
    1116           0 :                         if (parent)
    1117           0 :                                 spin_unlock(&parent->d_lock);
    1118             :                 }
    1119         170 :                 spin_unlock(&dentry->d_lock);
    1120             :         }
    1121         170 :         spin_unlock(&inode->i_lock);
    1122         170 : }
    1123             : EXPORT_SYMBOL(d_prune_aliases);
    1124             : 
    1125             : /*
    1126             :  * Lock a dentry from shrink list.
    1127             :  * Called under rcu_read_lock() and dentry->d_lock; the former
    1128             :  * guarantees that nothing we access will be freed under us.
    1129             :  * Note that dentry is *not* protected from concurrent dentry_kill(),
    1130             :  * d_delete(), etc.
    1131             :  *
    1132             :  * Return false if dentry has been disrupted or grabbed, leaving
    1133             :  * the caller to kick it off-list.  Otherwise, return true and have
    1134             :  * that dentry's inode and parent both locked.
    1135             :  */
    1136   152971602 : static bool shrink_lock_dentry(struct dentry *dentry)
    1137             : {
    1138   152971602 :         struct inode *inode;
    1139   152971602 :         struct dentry *parent;
    1140             : 
    1141   152971602 :         if (dentry->d_lockref.count)
    1142             :                 return false;
    1143             : 
    1144   152395556 :         inode = dentry->d_inode;
    1145   239619517 :         if (inode && unlikely(!spin_trylock(&inode->i_lock))) {
    1146          15 :                 spin_unlock(&dentry->d_lock);
    1147          15 :                 spin_lock(&inode->i_lock);
    1148          15 :                 spin_lock(&dentry->d_lock);
    1149          15 :                 if (unlikely(dentry->d_lockref.count))
    1150           1 :                         goto out;
    1151             :                 /* changed inode means that somebody had grabbed it */
    1152          14 :                 if (unlikely(inode != dentry->d_inode))
    1153           0 :                         goto out;
    1154             :         }
    1155             : 
    1156   152395820 :         parent = dentry->d_parent;
    1157   304791922 :         if (IS_ROOT(dentry) || likely(spin_trylock(&parent->d_lock)))
    1158   152395300 :                 return true;
    1159             : 
    1160         802 :         spin_unlock(&dentry->d_lock);
    1161         802 :         spin_lock(&parent->d_lock);
    1162         802 :         if (unlikely(parent != dentry->d_parent)) {
    1163           0 :                 spin_unlock(&parent->d_lock);
    1164           0 :                 spin_lock(&dentry->d_lock);
    1165           0 :                 goto out;
    1166             :         }
    1167         802 :         spin_lock_nested(&dentry->d_lock, DENTRY_D_LOCK_NESTED);
    1168         802 :         if (likely(!dentry->d_lockref.count))
    1169             :                 return true;
    1170           0 :         spin_unlock(&parent->d_lock);
    1171           1 : out:
    1172           1 :         if (inode)
    1173           1 :                 spin_unlock(&inode->i_lock);
    1174             :         return false;
    1175             : }
    1176             : 
    1177    14178538 : void shrink_dentry_list(struct list_head *list)
    1178             : {
    1179   167147402 :         while (!list_empty(list)) {
    1180   152971558 :                 struct dentry *dentry, *parent;
    1181             : 
    1182   152971558 :                 dentry = list_entry(list->prev, struct dentry, d_lru);
    1183   152971558 :                 spin_lock(&dentry->d_lock);
    1184   152971956 :                 rcu_read_lock();
    1185   152971883 :                 if (!shrink_lock_dentry(dentry)) {
    1186      576047 :                         bool can_free = false;
    1187      576047 :                         rcu_read_unlock();
    1188      576047 :                         d_shrink_del(dentry);
    1189      576047 :                         if (dentry->d_lockref.count < 0)
    1190           0 :                                 can_free = dentry->d_flags & DCACHE_MAY_FREE;
    1191      576047 :                         spin_unlock(&dentry->d_lock);
    1192      576047 :                         if (can_free)
    1193           0 :                                 dentry_free(dentry);
    1194      576047 :                         continue;
    1195             :                 }
    1196   152395679 :                 rcu_read_unlock();
    1197   152395200 :                 d_shrink_del(dentry);
    1198   152393762 :                 parent = dentry->d_parent;
    1199   152393762 :                 if (parent != dentry)
    1200   152393762 :                         __dput_to_list(parent, list);
    1201   152393493 :                 __dentry_kill(dentry);
    1202             :         }
    1203    14175844 : }
    1204             : 
    1205    61376847 : static enum lru_status dentry_lru_isolate(struct list_head *item,
    1206             :                 struct list_lru_one *lru, spinlock_t *lru_lock, void *arg)
    1207             : {
    1208    61376847 :         struct list_head *freeable = arg;
    1209    61376847 :         struct dentry   *dentry = container_of(item, struct dentry, d_lru);
    1210             : 
    1211             : 
    1212             :         /*
    1213             :          * we are inverting the lru lock/dentry->d_lock here,
    1214             :          * so use a trylock. If we fail to get the lock, just skip
    1215             :          * it
    1216             :          */
    1217    61376847 :         if (!spin_trylock(&dentry->d_lock))
    1218             :                 return LRU_SKIP;
    1219             : 
    1220             :         /*
    1221             :          * Referenced dentries are still in use. If they have active
    1222             :          * counts, just remove them from the LRU. Otherwise give them
    1223             :          * another pass through the LRU.
    1224             :          */
    1225    61376845 :         if (dentry->d_lockref.count) {
    1226      960736 :                 d_lru_isolate(lru, dentry);
    1227      960736 :                 spin_unlock(&dentry->d_lock);
    1228      960736 :                 return LRU_REMOVED;
    1229             :         }
    1230             : 
    1231    60416109 :         if (dentry->d_flags & DCACHE_REFERENCED) {
    1232    33394432 :                 dentry->d_flags &= ~DCACHE_REFERENCED;
    1233    33394432 :                 spin_unlock(&dentry->d_lock);
    1234             : 
    1235             :                 /*
    1236             :                  * The list move itself will be made by the common LRU code. At
    1237             :                  * this point, we've dropped the dentry->d_lock but keep the
    1238             :                  * lru lock. This is safe to do, since every list movement is
    1239             :                  * protected by the lru lock even if both locks are held.
    1240             :                  *
    1241             :                  * This is guaranteed by the fact that all LRU management
    1242             :                  * functions are intermediated by the LRU API calls like
    1243             :                  * list_lru_add and list_lru_del. List movement in this file
    1244             :                  * only ever occur through this functions or through callbacks
    1245             :                  * like this one, that are called from the LRU API.
    1246             :                  *
    1247             :                  * The only exceptions to this are functions like
    1248             :                  * shrink_dentry_list, and code that first checks for the
    1249             :                  * DCACHE_SHRINK_LIST flag.  Those are guaranteed to be
    1250             :                  * operating only with stack provided lists after they are
    1251             :                  * properly isolated from the main list.  It is thus, always a
    1252             :                  * local access.
    1253             :                  */
    1254    33394432 :                 return LRU_ROTATE;
    1255             :         }
    1256             : 
    1257    27021677 :         d_lru_shrink_move(lru, dentry, freeable);
    1258    27021677 :         spin_unlock(&dentry->d_lock);
    1259             : 
    1260    27021677 :         return LRU_REMOVED;
    1261             : }
    1262             : 
    1263             : /**
    1264             :  * prune_dcache_sb - shrink the dcache
    1265             :  * @sb: superblock
    1266             :  * @sc: shrink control, passed to list_lru_shrink_walk()
    1267             :  *
    1268             :  * Attempt to shrink the superblock dcache LRU by @sc->nr_to_scan entries. This
    1269             :  * is done when we need more memory and called from the superblock shrinker
    1270             :  * function.
    1271             :  *
    1272             :  * This function may fail to free any resources if all the dentries are in
    1273             :  * use.
    1274             :  */
    1275      268256 : long prune_dcache_sb(struct super_block *sb, struct shrink_control *sc)
    1276             : {
    1277      268256 :         LIST_HEAD(dispose);
    1278      268256 :         long freed;
    1279             : 
    1280      268256 :         freed = list_lru_shrink_walk(&sb->s_dentry_lru, sc,
    1281             :                                      dentry_lru_isolate, &dispose);
    1282      268256 :         shrink_dentry_list(&dispose);
    1283      268256 :         return freed;
    1284             : }
    1285             : 
    1286     2819576 : static enum lru_status dentry_lru_isolate_shrink(struct list_head *item,
    1287             :                 struct list_lru_one *lru, spinlock_t *lru_lock, void *arg)
    1288             : {
    1289     2819576 :         struct list_head *freeable = arg;
    1290     2819576 :         struct dentry   *dentry = container_of(item, struct dentry, d_lru);
    1291             : 
    1292             :         /*
    1293             :          * we are inverting the lru lock/dentry->d_lock here,
    1294             :          * so use a trylock. If we fail to get the lock, just skip
    1295             :          * it
    1296             :          */
    1297     2819576 :         if (!spin_trylock(&dentry->d_lock))
    1298             :                 return LRU_SKIP;
    1299             : 
    1300     2819576 :         d_lru_shrink_move(lru, dentry, freeable);
    1301     2819576 :         spin_unlock(&dentry->d_lock);
    1302             : 
    1303     2819576 :         return LRU_REMOVED;
    1304             : }
    1305             : 
    1306             : 
    1307             : /**
    1308             :  * shrink_dcache_sb - shrink dcache for a superblock
    1309             :  * @sb: superblock
    1310             :  *
    1311             :  * Shrink the dcache for the specified super block. This is used to free
    1312             :  * the dcache before unmounting a file system.
    1313             :  */
    1314        3383 : void shrink_dcache_sb(struct super_block *sb)
    1315             : {
    1316        5836 :         do {
    1317        5836 :                 LIST_HEAD(dispose);
    1318             : 
    1319        5836 :                 list_lru_walk(&sb->s_dentry_lru,
    1320             :                         dentry_lru_isolate_shrink, &dispose, 1024);
    1321        5836 :                 shrink_dentry_list(&dispose);
    1322        5836 :         } while (list_lru_count(&sb->s_dentry_lru) > 0);
    1323        3383 : }
    1324             : EXPORT_SYMBOL(shrink_dcache_sb);
    1325             : 
    1326             : /**
    1327             :  * enum d_walk_ret - action to talke during tree walk
    1328             :  * @D_WALK_CONTINUE:    contrinue walk
    1329             :  * @D_WALK_QUIT:        quit walk
    1330             :  * @D_WALK_NORETRY:     quit when retry is needed
    1331             :  * @D_WALK_SKIP:        skip this dentry and its children
    1332             :  */
    1333             : enum d_walk_ret {
    1334             :         D_WALK_CONTINUE,
    1335             :         D_WALK_QUIT,
    1336             :         D_WALK_NORETRY,
    1337             :         D_WALK_SKIP,
    1338             : };
    1339             : 
    1340             : /**
    1341             :  * d_walk - walk the dentry tree
    1342             :  * @parent:     start of walk
    1343             :  * @data:       data passed to @enter() and @finish()
    1344             :  * @enter:      callback when first entering the dentry
    1345             :  *
    1346             :  * The @enter() callbacks are called with d_lock held.
    1347             :  */
    1348    32729501 : static void d_walk(struct dentry *parent, void *data,
    1349             :                    enum d_walk_ret (*enter)(void *, struct dentry *))
    1350             : {
    1351    32729501 :         struct dentry *this_parent;
    1352    32729501 :         struct list_head *next;
    1353    32729501 :         unsigned seq = 0;
    1354    32729501 :         enum d_walk_ret ret;
    1355    32729501 :         bool retry = true;
    1356             : 
    1357    32729819 : again:
    1358    32729819 :         read_seqbegin_or_lock(&rename_lock, &seq);
    1359    32729960 :         this_parent = parent;
    1360    32729960 :         spin_lock(&this_parent->d_lock);
    1361             : 
    1362    32737001 :         ret = enter(data, this_parent);
    1363    32729781 :         switch (ret) {
    1364             :         case D_WALK_CONTINUE:
    1365             :                 break;
    1366           0 :         case D_WALK_QUIT:
    1367             :         case D_WALK_SKIP:
    1368           0 :                 goto out_unlock;
    1369           0 :         case D_WALK_NORETRY:
    1370           0 :                 retry = false;
    1371           0 :                 break;
    1372             :         }
    1373             : repeat:
    1374    38553005 :         next = this_parent->d_subdirs.next;
    1375             : resume:
    1376   151866748 :         while (next != &this_parent->d_subdirs) {
    1377   114841995 :                 struct list_head *tmp = next;
    1378   114841995 :                 struct dentry *dentry = list_entry(tmp, struct dentry, d_child);
    1379   114841995 :                 next = tmp->next;
    1380             : 
    1381   114841995 :                 if (unlikely(dentry->d_flags & DCACHE_DENTRY_CURSOR))
    1382           0 :                         continue;
    1383             : 
    1384   114841995 :                 spin_lock_nested(&dentry->d_lock, DENTRY_D_LOCK_NESTED);
    1385             : 
    1386   114844941 :                 ret = enter(data, dentry);
    1387   114844820 :                 switch (ret) {
    1388             :                 case D_WALK_CONTINUE:
    1389             :                         break;
    1390       27568 :                 case D_WALK_QUIT:
    1391       27568 :                         spin_unlock(&dentry->d_lock);
    1392       27568 :                         goto out_unlock;
    1393   114660709 :                 case D_WALK_NORETRY:
    1394   114660709 :                         retry = false;
    1395   114660709 :                         break;
    1396           0 :                 case D_WALK_SKIP:
    1397           0 :                         spin_unlock(&dentry->d_lock);
    1398           0 :                         continue;
    1399             :                 }
    1400             : 
    1401   114817252 :                 if (!list_empty(&dentry->d_subdirs)) {
    1402     5823225 :                         spin_unlock(&this_parent->d_lock);
    1403     5823224 :                         spin_release(&dentry->d_lock.dep_map, _RET_IP_);
    1404     5823224 :                         this_parent = dentry;
    1405     5823224 :                         spin_acquire(&this_parent->d_lock.dep_map, 0, 1, _RET_IP_);
    1406     5823224 :                         goto repeat;
    1407             :                 }
    1408   108994027 :                 spin_unlock(&dentry->d_lock);
    1409             :         }
    1410             :         /*
    1411             :          * All done at this level ... ascend and resume the search.
    1412             :          */
    1413    37024753 :         rcu_read_lock();
    1414    38503183 : ascend:
    1415    38503183 :         if (this_parent != parent) {
    1416     5797263 :                 struct dentry *child = this_parent;
    1417     5797263 :                 this_parent = child->d_parent;
    1418             : 
    1419     5797263 :                 spin_unlock(&child->d_lock);
    1420     5797580 :                 spin_lock(&this_parent->d_lock);
    1421             : 
    1422             :                 /* might go back up the wrong parent if we have had a rename. */
    1423     5797578 :                 if (need_seqretry(&rename_lock, seq))
    1424          63 :                         goto rename_retry;
    1425             :                 /* go into the first sibling still alive */
    1426     5797516 :                 do {
    1427     5797516 :                         next = child->d_child.next;
    1428     5797516 :                         if (next == &this_parent->d_subdirs)
    1429     1478114 :                                 goto ascend;
    1430     4319402 :                         child = list_entry(next, struct dentry, d_child);
    1431     4319402 :                 } while (unlikely(child->d_flags & DCACHE_DENTRY_KILLED));
    1432     4319402 :                 rcu_read_unlock();
    1433     4319402 :                 goto resume;
    1434             :         }
    1435    32705920 :         if (need_seqretry(&rename_lock, seq))
    1436        1720 :                 goto rename_retry;
    1437    32705062 :         rcu_read_unlock();
    1438             : 
    1439    32733713 : out_unlock:
    1440    32733713 :         spin_unlock(&this_parent->d_lock);
    1441    32737486 :         done_seqretry(&rename_lock, seq);
    1442             :         return;
    1443             : 
    1444        1783 : rename_retry:
    1445        1783 :         spin_unlock(&this_parent->d_lock);
    1446        1783 :         rcu_read_unlock();
    1447        1783 :         BUG_ON(seq & 1);
    1448        1783 :         if (!retry)
    1449             :                 return;
    1450         318 :         seq = 1;
    1451         318 :         goto again;
    1452             : }
    1453             : 
    1454             : struct check_mount {
    1455             :         struct vfsmount *mnt;
    1456             :         unsigned int mounted;
    1457             : };
    1458             : 
    1459           0 : static enum d_walk_ret path_check_mount(void *data, struct dentry *dentry)
    1460             : {
    1461           0 :         struct check_mount *info = data;
    1462           0 :         struct path path = { .mnt = info->mnt, .dentry = dentry };
    1463             : 
    1464           0 :         if (likely(!d_mountpoint(dentry)))
    1465             :                 return D_WALK_CONTINUE;
    1466           0 :         if (__path_is_mountpoint(&path)) {
    1467           0 :                 info->mounted = 1;
    1468           0 :                 return D_WALK_QUIT;
    1469             :         }
    1470             :         return D_WALK_CONTINUE;
    1471             : }
    1472             : 
    1473             : /**
    1474             :  * path_has_submounts - check for mounts over a dentry in the
    1475             :  *                      current namespace.
    1476             :  * @parent: path to check.
    1477             :  *
    1478             :  * Return true if the parent or its subdirectories contain
    1479             :  * a mount point in the current namespace.
    1480             :  */
    1481           0 : int path_has_submounts(const struct path *parent)
    1482             : {
    1483           0 :         struct check_mount data = { .mnt = parent->mnt, .mounted = 0 };
    1484             : 
    1485           0 :         read_seqlock_excl(&mount_lock);
    1486           0 :         d_walk(parent->dentry, &data, path_check_mount);
    1487           0 :         read_sequnlock_excl(&mount_lock);
    1488             : 
    1489           0 :         return data.mounted;
    1490             : }
    1491             : EXPORT_SYMBOL(path_has_submounts);
    1492             : 
    1493             : /*
    1494             :  * Called by mount code to set a mountpoint and check if the mountpoint is
    1495             :  * reachable (e.g. NFS can unhash a directory dentry and then the complete
    1496             :  * subtree can become unreachable).
    1497             :  *
    1498             :  * Only one of d_invalidate() and d_set_mounted() must succeed.  For
    1499             :  * this reason take rename_lock and d_lock on dentry and ancestors.
    1500             :  */
    1501      327680 : int d_set_mounted(struct dentry *dentry)
    1502             : {
    1503      327680 :         struct dentry *p;
    1504      327680 :         int ret = -ENOENT;
    1505      327680 :         write_seqlock(&rename_lock);
    1506      328505 :         for (p = dentry->d_parent; !IS_ROOT(p); p = p->d_parent) {
    1507             :                 /* Need exclusion wrt. d_invalidate() */
    1508         825 :                 spin_lock(&p->d_lock);
    1509         825 :                 if (unlikely(d_unhashed(p))) {
    1510           0 :                         spin_unlock(&p->d_lock);
    1511           0 :                         goto out;
    1512             :                 }
    1513         825 :                 spin_unlock(&p->d_lock);
    1514             :         }
    1515      327680 :         spin_lock(&dentry->d_lock);
    1516      327680 :         if (!d_unlinked(dentry)) {
    1517      327680 :                 ret = -EBUSY;
    1518      327680 :                 if (!d_mountpoint(dentry)) {
    1519      327680 :                         dentry->d_flags |= DCACHE_MOUNTED;
    1520      327680 :                         ret = 0;
    1521             :                 }
    1522             :         }
    1523      327680 :         spin_unlock(&dentry->d_lock);
    1524      327680 : out:
    1525      327680 :         write_sequnlock(&rename_lock);
    1526      327680 :         return ret;
    1527             : }
    1528             : 
    1529             : /*
    1530             :  * Search the dentry child list of the specified parent,
    1531             :  * and move any unused dentries to the end of the unused
    1532             :  * list for prune_dcache(). We descend to the next level
    1533             :  * whenever the d_subdirs list is non-empty and continue
    1534             :  * searching.
    1535             :  *
    1536             :  * It returns zero iff there are no unused children,
    1537             :  * otherwise  it returns the number of children moved to
    1538             :  * the end of the unused list. This may not be the total
    1539             :  * number of unused children, because select_parent can
    1540             :  * drop the lock and return early due to latency
    1541             :  * constraints.
    1542             :  */
    1543             : 
    1544             : struct select_data {
    1545             :         struct dentry *start;
    1546             :         union {
    1547             :                 long found;
    1548             :                 struct dentry *victim;
    1549             :         };
    1550             :         struct list_head dispose;
    1551             : };
    1552             : 
    1553   136987197 : static enum d_walk_ret select_collect(void *_data, struct dentry *dentry)
    1554             : {
    1555   136987197 :         struct select_data *data = _data;
    1556   136987197 :         enum d_walk_ret ret = D_WALK_CONTINUE;
    1557             : 
    1558   136987197 :         if (data->start == dentry)
    1559    22142862 :                 goto out;
    1560             : 
    1561   114844335 :         if (dentry->d_flags & DCACHE_SHRINK_LIST) {
    1562           0 :                 data->found++;
    1563             :         } else {
    1564   114844335 :                 if (dentry->d_flags & DCACHE_LRU_LIST)
    1565   113474812 :                         d_lru_del(dentry);
    1566   114844775 :                 if (!dentry->d_lockref.count) {
    1567   109016840 :                         d_shrink_add(dentry, &data->dispose);
    1568   109016684 :                         data->found++;
    1569             :                 }
    1570             :         }
    1571             :         /*
    1572             :          * We can return to the caller if we have found some (this
    1573             :          * ensures forward progress). We'll be coming back to find
    1574             :          * the rest.
    1575             :          */
    1576   114844619 :         if (!list_empty(&data->dispose))
    1577   114688205 :                 ret = need_resched() ? D_WALK_QUIT : D_WALK_NORETRY;
    1578      156414 : out:
    1579   136987481 :         return ret;
    1580             : }
    1581             : 
    1582           0 : static enum d_walk_ret select_collect2(void *_data, struct dentry *dentry)
    1583             : {
    1584           0 :         struct select_data *data = _data;
    1585           0 :         enum d_walk_ret ret = D_WALK_CONTINUE;
    1586             : 
    1587           0 :         if (data->start == dentry)
    1588           0 :                 goto out;
    1589             : 
    1590           0 :         if (dentry->d_flags & DCACHE_SHRINK_LIST) {
    1591           0 :                 if (!dentry->d_lockref.count) {
    1592           0 :                         rcu_read_lock();
    1593           0 :                         data->victim = dentry;
    1594           0 :                         return D_WALK_QUIT;
    1595             :                 }
    1596             :         } else {
    1597           0 :                 if (dentry->d_flags & DCACHE_LRU_LIST)
    1598           0 :                         d_lru_del(dentry);
    1599           0 :                 if (!dentry->d_lockref.count)
    1600           0 :                         d_shrink_add(dentry, &data->dispose);
    1601             :         }
    1602             :         /*
    1603             :          * We can return to the caller if we have found some (this
    1604             :          * ensures forward progress). We'll be coming back to find
    1605             :          * the rest.
    1606             :          */
    1607           0 :         if (!list_empty(&data->dispose))
    1608           0 :                 ret = need_resched() ? D_WALK_QUIT : D_WALK_NORETRY;
    1609           0 : out:
    1610             :         return ret;
    1611             : }
    1612             : 
    1613             : /**
    1614             :  * shrink_dcache_parent - prune dcache
    1615             :  * @parent: parent of entries to prune
    1616             :  *
    1617             :  * Prune the dcache to remove unused children of the parent dentry.
    1618             :  */
    1619    11828911 : void shrink_dcache_parent(struct dentry *parent)
    1620             : {
    1621    22140633 :         for (;;) {
    1622    22140633 :                 struct select_data data = {.start = parent};
    1623             : 
    1624    22140633 :                 INIT_LIST_HEAD(&data.dispose);
    1625    22140633 :                 d_walk(parent, &data, select_collect);
    1626             : 
    1627    22144087 :                 if (!list_empty(&data.dispose)) {
    1628    10316682 :                         shrink_dentry_list(&data.dispose);
    1629    10311722 :                         continue;
    1630             :                 }
    1631             : 
    1632    11827405 :                 cond_resched();
    1633    11824988 :                 if (!data.found)
    1634             :                         break;
    1635           0 :                 data.victim = NULL;
    1636           0 :                 d_walk(parent, &data, select_collect2);
    1637           0 :                 if (data.victim) {
    1638           0 :                         struct dentry *parent;
    1639           0 :                         spin_lock(&data.victim->d_lock);
    1640           0 :                         if (!shrink_lock_dentry(data.victim)) {
    1641           0 :                                 spin_unlock(&data.victim->d_lock);
    1642           0 :                                 rcu_read_unlock();
    1643             :                         } else {
    1644           0 :                                 rcu_read_unlock();
    1645           0 :                                 parent = data.victim->d_parent;
    1646           0 :                                 if (parent != data.victim)
    1647           0 :                                         __dput_to_list(parent, &data.dispose);
    1648           0 :                                 __dentry_kill(data.victim);
    1649             :                         }
    1650             :                 }
    1651           0 :                 if (!list_empty(&data.dispose))
    1652           0 :                         shrink_dentry_list(&data.dispose);
    1653             :         }
    1654    11824988 : }
    1655             : EXPORT_SYMBOL(shrink_dcache_parent);
    1656             : 
    1657       94358 : static enum d_walk_ret umount_check(void *_data, struct dentry *dentry)
    1658             : {
    1659             :         /* it has busy descendents; complain about those instead */
    1660       94358 :         if (!list_empty(&dentry->d_subdirs))
    1661             :                 return D_WALK_CONTINUE;
    1662             : 
    1663             :         /* root with refcount 1 is fine */
    1664       94350 :         if (dentry == _data && dentry->d_lockref.count == 1)
    1665             :                 return D_WALK_CONTINUE;
    1666             : 
    1667           0 :         printk(KERN_ERR "BUG: Dentry %p{i=%lx,n=%pd} "
    1668             :                         " still in use (%d) [unmount of %s %s]\n",
    1669             :                        dentry,
    1670             :                        dentry->d_inode ?
    1671             :                        dentry->d_inode->i_ino : 0UL,
    1672             :                        dentry,
    1673             :                        dentry->d_lockref.count,
    1674             :                        dentry->d_sb->s_type->name,
    1675             :                        dentry->d_sb->s_id);
    1676           0 :         WARN_ON(1);
    1677             :         return D_WALK_CONTINUE;
    1678             : }
    1679             : 
    1680       94355 : static void do_one_tree(struct dentry *dentry)
    1681             : {
    1682       94355 :         shrink_dcache_parent(dentry);
    1683       94353 :         d_walk(dentry, dentry, umount_check);
    1684       94353 :         d_drop(dentry);
    1685       94345 :         dput(dentry);
    1686       94353 : }
    1687             : 
    1688             : /*
    1689             :  * destroy the dentries attached to a superblock on unmounting
    1690             :  */
    1691       94355 : void shrink_dcache_for_umount(struct super_block *sb)
    1692             : {
    1693       94355 :         struct dentry *dentry;
    1694             : 
    1695       94355 :         WARN(down_read_trylock(&sb->s_umount), "s_umount should've been locked");
    1696             : 
    1697       94355 :         dentry = sb->s_root;
    1698       94355 :         sb->s_root = NULL;
    1699       94355 :         do_one_tree(dentry);
    1700             : 
    1701       94355 :         while (!hlist_bl_empty(&sb->s_roots)) {
    1702           0 :                 dentry = dget(hlist_bl_entry(hlist_bl_first(&sb->s_roots), struct dentry, d_hash));
    1703           0 :                 do_one_tree(dentry);
    1704             :         }
    1705       94352 : }
    1706             : 
    1707    10495731 : static enum d_walk_ret find_submount(void *_data, struct dentry *dentry)
    1708             : {
    1709    10495731 :         struct dentry **victim = _data;
    1710    10495731 :         if (d_mountpoint(dentry)) {
    1711           0 :                 __dget_dlock(dentry);
    1712           0 :                 *victim = dentry;
    1713           0 :                 return D_WALK_QUIT;
    1714             :         }
    1715             :         return D_WALK_CONTINUE;
    1716             : }
    1717             : 
    1718             : /**
    1719             :  * d_invalidate - detach submounts, prune dcache, and drop
    1720             :  * @dentry: dentry to invalidate (aka detach, prune and drop)
    1721             :  */
    1722    11291108 : void d_invalidate(struct dentry *dentry)
    1723             : {
    1724    11291108 :         bool had_submounts = false;
    1725    11291108 :         spin_lock(&dentry->d_lock);
    1726    11292319 :         if (d_unhashed(dentry)) {
    1727        3747 :                 spin_unlock(&dentry->d_lock);
    1728        3747 :                 return;
    1729             :         }
    1730    11288572 :         __d_drop(dentry);
    1731    11288532 :         spin_unlock(&dentry->d_lock);
    1732             : 
    1733             :         /* Negative dentries can be dropped without further checks */
    1734    11288560 :         if (!dentry->d_inode)
    1735             :                 return;
    1736             : 
    1737    10501801 :         shrink_dcache_parent(dentry);
    1738           0 :         for (;;) {
    1739    10498202 :                 struct dentry *victim = NULL;
    1740    10498202 :                 d_walk(dentry, &victim, find_submount);
    1741    10500123 :                 if (!victim) {
    1742    10500123 :                         if (had_submounts)
    1743           0 :                                 shrink_dcache_parent(dentry);
    1744    10500123 :                         return;
    1745             :                 }
    1746           0 :                 had_submounts = true;
    1747           0 :                 detach_mounts(victim);
    1748           0 :                 dput(victim);
    1749             :         }
    1750             : }
    1751             : EXPORT_SYMBOL(d_invalidate);
    1752             : 
    1753             : /**
    1754             :  * __d_alloc    -       allocate a dcache entry
    1755             :  * @sb: filesystem it will belong to
    1756             :  * @name: qstr of the name, or %NULL to use slash_name
    1757             :  *
    1758             :  * Allocates a dentry. It returns %NULL if there is insufficient memory
    1759             :  * available. On success the dentry is returned. The name passed in is
    1760             :  * copied, so the caller's copy may be reused after this call.
    1761             :  */
    1762             :  
    1763  1038729849 : static struct dentry *__d_alloc(struct super_block *sb, const struct qstr *name)
    1764             : {
    1765  1038729849 :         struct dentry *dentry;
    1766  1038729849 :         char *dname;
    1767  1038729849 :         int err;
    1768             : 
    1769  1038729849 :         dentry = kmem_cache_alloc_lru(dentry_cache, &sb->s_dentry_lru,
    1770             :                                       GFP_KERNEL);
    1771  1038111925 :         if (!dentry)
    1772             :                 return NULL;
    1773             : 
    1774             :         /*
    1775             :          * We guarantee that the inline name is always NUL-terminated.
    1776             :          * This way the memcpy() done by the name switching in rename
    1777             :          * will still always have a NUL at the end, even if we might
    1778             :          * be overwriting an internal NUL character
    1779             :          */
    1780  1038111925 :         dentry->d_iname[DNAME_INLINE_LEN-1] = 0;
    1781  1038111925 :         if (unlikely(!name)) {
    1782    57181089 :                 name = &slash_name;
    1783    57181089 :                 dname = dentry->d_iname;
    1784   980930836 :         } else if (name->len > DNAME_INLINE_LEN-1) {
    1785     3874440 :                 size_t size = offsetof(struct external_name, name[1]);
    1786     3874440 :                 struct external_name *p = kmalloc(size + name->len,
    1787             :                                                   GFP_KERNEL_ACCOUNT |
    1788             :                                                   __GFP_RECLAIMABLE);
    1789     3874915 :                 if (!p) {
    1790           0 :                         kmem_cache_free(dentry_cache, dentry); 
    1791           0 :                         return NULL;
    1792             :                 }
    1793     3874915 :                 atomic_set(&p->u.count, 1);
    1794     3874915 :                 dname = p->name;
    1795             :         } else  {
    1796   977056396 :                 dname = dentry->d_iname;
    1797             :         }       
    1798             : 
    1799  1038112400 :         dentry->d_name.len = name->len;
    1800  1038112400 :         dentry->d_name.hash = name->hash;
    1801  2076224800 :         memcpy(dname, name->name, name->len);
    1802  1038112400 :         dname[name->len] = 0;
    1803             : 
    1804             :         /* Make sure we always see the terminating NUL character */
    1805  1038112400 :         smp_store_release(&dentry->d_name.name, dname); /* ^^^ */
    1806             : 
    1807  1037737854 :         dentry->d_lockref.count = 1;
    1808  1037737854 :         dentry->d_flags = 0;
    1809  1037737854 :         spin_lock_init(&dentry->d_lock);
    1810  1036828792 :         seqcount_spinlock_init(&dentry->d_seq, &dentry->d_lock);
    1811  1036828792 :         dentry->d_inode = NULL;
    1812  1036828792 :         dentry->d_parent = dentry;
    1813  1036828792 :         dentry->d_sb = sb;
    1814  1036828792 :         dentry->d_op = NULL;
    1815  1036828792 :         dentry->d_fsdata = NULL;
    1816  1036828792 :         INIT_HLIST_BL_NODE(&dentry->d_hash);
    1817  1036828792 :         INIT_LIST_HEAD(&dentry->d_lru);
    1818  1036828792 :         INIT_LIST_HEAD(&dentry->d_subdirs);
    1819  1036828792 :         INIT_HLIST_NODE(&dentry->d_u.d_alias);
    1820  1036828792 :         INIT_LIST_HEAD(&dentry->d_child);
    1821  1036828792 :         d_set_d_op(dentry, dentry->d_sb->s_d_op);
    1822             : 
    1823  1037232085 :         if (dentry->d_op && dentry->d_op->d_init) {
    1824           0 :                 err = dentry->d_op->d_init(dentry);
    1825           0 :                 if (err) {
    1826           0 :                         if (dname_external(dentry))
    1827           0 :                                 kfree(external_name(dentry));
    1828           0 :                         kmem_cache_free(dentry_cache, dentry);
    1829           0 :                         return NULL;
    1830             :                 }
    1831             :         }
    1832             : 
    1833  1037232085 :         this_cpu_inc(nr_dentry);
    1834             : 
    1835  1037232085 :         return dentry;
    1836             : }
    1837             : 
    1838             : /**
    1839             :  * d_alloc      -       allocate a dcache entry
    1840             :  * @parent: parent of entry to allocate
    1841             :  * @name: qstr of the name
    1842             :  *
    1843             :  * Allocates a dentry. It returns %NULL if there is insufficient memory
    1844             :  * available. On success the dentry is returned. The name passed in is
    1845             :  * copied, so the caller's copy may be reused after this call.
    1846             :  */
    1847   951465362 : struct dentry *d_alloc(struct dentry * parent, const struct qstr *name)
    1848             : {
    1849   951465362 :         struct dentry *dentry = __d_alloc(parent->d_sb, name);
    1850   950525993 :         if (!dentry)
    1851             :                 return NULL;
    1852   950525993 :         spin_lock(&parent->d_lock);
    1853             :         /*
    1854             :          * don't need child lock because it is not subject
    1855             :          * to concurrency here
    1856             :          */
    1857   952225493 :         __dget_dlock(parent);
    1858   952225493 :         dentry->d_parent = parent;
    1859   952225493 :         list_add(&dentry->d_child, &parent->d_subdirs);
    1860   951635506 :         spin_unlock(&parent->d_lock);
    1861             : 
    1862   951635506 :         return dentry;
    1863             : }
    1864             : EXPORT_SYMBOL(d_alloc);
    1865             : 
    1866        5018 : struct dentry *d_alloc_anon(struct super_block *sb)
    1867             : {
    1868        5018 :         return __d_alloc(sb, NULL);
    1869             : }
    1870             : EXPORT_SYMBOL(d_alloc_anon);
    1871             : 
    1872     5663404 : struct dentry *d_alloc_cursor(struct dentry * parent)
    1873             : {
    1874     5663404 :         struct dentry *dentry = d_alloc_anon(parent->d_sb);
    1875     5662750 :         if (dentry) {
    1876     5662750 :                 dentry->d_flags |= DCACHE_DENTRY_CURSOR;
    1877    11326002 :                 dentry->d_parent = dget(parent);
    1878             :         }
    1879     5663252 :         return dentry;
    1880             : }
    1881             : 
    1882             : /**
    1883             :  * d_alloc_pseudo - allocate a dentry (for lookup-less filesystems)
    1884             :  * @sb: the superblock
    1885             :  * @name: qstr of the name
    1886             :  *
    1887             :  * For a filesystem that just pins its dentries in memory and never
    1888             :  * performs lookups at all, return an unhashed IS_ROOT dentry.
    1889             :  * This is used for pipes, sockets et al. - the stuff that should
    1890             :  * never be anyone's children or parents.  Unlike all other
    1891             :  * dentries, these will not have RCU delay between dropping the
    1892             :  * last reference and freeing them.
    1893             :  *
    1894             :  * The only user is alloc_file_pseudo() and that's what should
    1895             :  * be considered a public interface.  Don't use directly.
    1896             :  */
    1897    29891221 : struct dentry *d_alloc_pseudo(struct super_block *sb, const struct qstr *name)
    1898             : {
    1899    29891221 :         struct dentry *dentry = __d_alloc(sb, name);
    1900    29891371 :         if (likely(dentry))
    1901    29891371 :                 dentry->d_flags |= DCACHE_NORCU;
    1902    29891371 :         return dentry;
    1903             : }
    1904             : 
    1905           8 : struct dentry *d_alloc_name(struct dentry *parent, const char *name)
    1906             : {
    1907           8 :         struct qstr q;
    1908             : 
    1909           8 :         q.name = name;
    1910           8 :         q.hash_len = hashlen_string(parent, name);
    1911           8 :         return d_alloc(parent, &q);
    1912             : }
    1913             : EXPORT_SYMBOL(d_alloc_name);
    1914             : 
    1915  1797021056 : void d_set_d_op(struct dentry *dentry, const struct dentry_operations *op)
    1916             : {
    1917  1797021056 :         WARN_ON_ONCE(dentry->d_op);
    1918  1797021056 :         WARN_ON_ONCE(dentry->d_flags & (DCACHE_OP_HASH   |
    1919             :                                 DCACHE_OP_COMPARE       |
    1920             :                                 DCACHE_OP_REVALIDATE    |
    1921             :                                 DCACHE_OP_WEAK_REVALIDATE       |
    1922             :                                 DCACHE_OP_DELETE        |
    1923             :                                 DCACHE_OP_REAL));
    1924  1797021056 :         dentry->d_op = op;
    1925  1797021056 :         if (!op)
    1926             :                 return;
    1927   797405906 :         if (op->d_hash)
    1928        4150 :                 dentry->d_flags |= DCACHE_OP_HASH;
    1929   797405906 :         if (op->d_compare)
    1930        4769 :                 dentry->d_flags |= DCACHE_OP_COMPARE;
    1931   797405906 :         if (op->d_revalidate)
    1932    25952455 :                 dentry->d_flags |= DCACHE_OP_REVALIDATE;
    1933   797405906 :         if (op->d_weak_revalidate)
    1934     1406651 :                 dentry->d_flags |= DCACHE_OP_WEAK_REVALIDATE;
    1935   797405906 :         if (op->d_delete)
    1936   762843217 :                 dentry->d_flags |= DCACHE_OP_DELETE;
    1937   797405906 :         if (op->d_prune)
    1938        2070 :                 dentry->d_flags |= DCACHE_OP_PRUNE;
    1939   797405906 :         if (op->d_real)
    1940      172942 :                 dentry->d_flags |= DCACHE_OP_REAL;
    1941             : 
    1942             : }
    1943             : EXPORT_SYMBOL(d_set_d_op);
    1944             : 
    1945             : 
    1946             : /*
    1947             :  * d_set_fallthru - Mark a dentry as falling through to a lower layer
    1948             :  * @dentry - The dentry to mark
    1949             :  *
    1950             :  * Mark a dentry as falling through to the lower layer (as set with
    1951             :  * d_pin_lower()).  This flag may be recorded on the medium.
    1952             :  */
    1953           0 : void d_set_fallthru(struct dentry *dentry)
    1954             : {
    1955           0 :         spin_lock(&dentry->d_lock);
    1956           0 :         dentry->d_flags |= DCACHE_FALLTHRU;
    1957           0 :         spin_unlock(&dentry->d_lock);
    1958           0 : }
    1959             : EXPORT_SYMBOL(d_set_fallthru);
    1960             : 
    1961   244594226 : static unsigned d_flags_for_inode(struct inode *inode)
    1962             : {
    1963   244594226 :         unsigned add_flags = DCACHE_REGULAR_TYPE;
    1964             : 
    1965   244594226 :         if (!inode)
    1966             :                 return DCACHE_MISS_TYPE;
    1967             : 
    1968   244594226 :         if (S_ISDIR(inode->i_mode)) {
    1969    30589655 :                 add_flags = DCACHE_DIRECTORY_TYPE;
    1970    30589655 :                 if (unlikely(!(inode->i_opflags & IOP_LOOKUP))) {
    1971    24081490 :                         if (unlikely(!inode->i_op->lookup))
    1972             :                                 add_flags = DCACHE_AUTODIR_TYPE;
    1973             :                         else
    1974    24081490 :                                 inode->i_opflags |= IOP_LOOKUP;
    1975             :                 }
    1976    30589655 :                 goto type_determined;
    1977             :         }
    1978             : 
    1979   214004571 :         if (unlikely(!(inode->i_opflags & IOP_NOFOLLOW))) {
    1980   172582564 :                 if (unlikely(inode->i_op->get_link)) {
    1981    29939895 :                         add_flags = DCACHE_SYMLINK_TYPE;
    1982    29939895 :                         goto type_determined;
    1983             :                 }
    1984   142642669 :                 inode->i_opflags |= IOP_NOFOLLOW;
    1985             :         }
    1986             : 
    1987   184064676 :         if (unlikely(!S_ISREG(inode->i_mode)))
    1988    41116078 :                 add_flags = DCACHE_SPECIAL_TYPE;
    1989             : 
    1990   142948598 : type_determined:
    1991   244594226 :         if (unlikely(IS_AUTOMOUNT(inode)))
    1992           0 :                 add_flags |= DCACHE_NEED_AUTOMOUNT;
    1993             :         return add_flags;
    1994             : }
    1995             : 
    1996   131424161 : static void __d_instantiate(struct dentry *dentry, struct inode *inode)
    1997             : {
    1998   131424161 :         unsigned add_flags = d_flags_for_inode(inode);
    1999   131032190 :         WARN_ON(d_in_lookup(dentry));
    2000             : 
    2001   131032190 :         spin_lock(&dentry->d_lock);
    2002             :         /*
    2003             :          * Decrement negative dentry count if it was in the LRU list.
    2004             :          */
    2005   131355251 :         if (dentry->d_flags & DCACHE_LRU_LIST)
    2006    21658709 :                 this_cpu_dec(nr_dentry_negative);
    2007   131355455 :         hlist_add_head(&dentry->d_u.d_alias, &inode->i_dentry);
    2008   131355455 :         raw_write_seqcount_begin(&dentry->d_seq);
    2009   131218957 :         __d_set_inode_and_type(dentry, inode, add_flags);
    2010   131204811 :         raw_write_seqcount_end(&dentry->d_seq);
    2011   131167198 :         fsnotify_update_flags(dentry);
    2012   131099144 :         spin_unlock(&dentry->d_lock);
    2013   131606681 : }
    2014             : 
    2015             : /**
    2016             :  * d_instantiate - fill in inode information for a dentry
    2017             :  * @entry: dentry to complete
    2018             :  * @inode: inode to attach to this dentry
    2019             :  *
    2020             :  * Fill in inode information in the entry.
    2021             :  *
    2022             :  * This turns negative dentries into productive full members
    2023             :  * of society.
    2024             :  *
    2025             :  * NOTE! This assumes that the inode count has been incremented
    2026             :  * (or otherwise set) by the caller to indicate that it is now
    2027             :  * in use by the dcache.
    2028             :  */
    2029             :  
    2030   126155441 : void d_instantiate(struct dentry *entry, struct inode * inode)
    2031             : {
    2032   126155441 :         BUG_ON(!hlist_unhashed(&entry->d_u.d_alias));
    2033   126155441 :         if (inode) {
    2034   126155441 :                 security_d_instantiate(entry, inode);
    2035   126155441 :                 spin_lock(&inode->i_lock);
    2036   126485175 :                 __d_instantiate(entry, inode);
    2037   126514938 :                 spin_unlock(&inode->i_lock);
    2038             :         }
    2039   126607240 : }
    2040             : EXPORT_SYMBOL(d_instantiate);
    2041             : 
    2042             : /*
    2043             :  * This should be equivalent to d_instantiate() + unlock_new_inode(),
    2044             :  * with lockdep-related part of unlock_new_inode() done before
    2045             :  * anything else.  Use that instead of open-coding d_instantiate()/
    2046             :  * unlock_new_inode() combinations.
    2047             :  */
    2048     5082698 : void d_instantiate_new(struct dentry *entry, struct inode *inode)
    2049             : {
    2050     5082698 :         BUG_ON(!hlist_unhashed(&entry->d_u.d_alias));
    2051     5082698 :         BUG_ON(!inode);
    2052     5082698 :         lockdep_annotate_inode_mutex_key(inode);
    2053     5082698 :         security_d_instantiate(entry, inode);
    2054     5082698 :         spin_lock(&inode->i_lock);
    2055     5083315 :         __d_instantiate(entry, inode);
    2056     5082774 :         WARN_ON(!(inode->i_state & I_NEW));
    2057     5082774 :         inode->i_state &= ~I_NEW & ~I_CREATING;
    2058     5082774 :         smp_mb();
    2059     5083365 :         wake_up_bit(&inode->i_state, __I_NEW);
    2060     5082597 :         spin_unlock(&inode->i_lock);
    2061     5082973 : }
    2062             : EXPORT_SYMBOL(d_instantiate_new);
    2063             : 
    2064       94345 : struct dentry *d_make_root(struct inode *root_inode)
    2065             : {
    2066       94345 :         struct dentry *res = NULL;
    2067             : 
    2068       94345 :         if (root_inode) {
    2069       94345 :                 res = d_alloc_anon(root_inode->i_sb);
    2070       94340 :                 if (res)
    2071       94340 :                         d_instantiate(res, root_inode);
    2072             :                 else
    2073           0 :                         iput(root_inode);
    2074             :         }
    2075       94344 :         return res;
    2076             : }
    2077             : EXPORT_SYMBOL(d_make_root);
    2078             : 
    2079    51420315 : static struct dentry *__d_instantiate_anon(struct dentry *dentry,
    2080             :                                            struct inode *inode,
    2081             :                                            bool disconnected)
    2082             : {
    2083    51420315 :         struct dentry *res;
    2084    51420315 :         unsigned add_flags;
    2085             : 
    2086    51420315 :         security_d_instantiate(dentry, inode);
    2087    51420315 :         spin_lock(&inode->i_lock);
    2088    51511181 :         res = __d_find_any_alias(inode);
    2089         813 :         if (res) {
    2090         813 :                 spin_unlock(&inode->i_lock);
    2091         813 :                 dput(dentry);
    2092         813 :                 goto out_iput;
    2093             :         }
    2094             : 
    2095             :         /* attach a disconnected dentry */
    2096    51510368 :         add_flags = d_flags_for_inode(inode);
    2097             : 
    2098    51323917 :         if (disconnected)
    2099    51298444 :                 add_flags |= DCACHE_DISCONNECTED;
    2100             : 
    2101    51323917 :         spin_lock(&dentry->d_lock);
    2102    51613956 :         __d_set_inode_and_type(dentry, inode, add_flags);
    2103    51616429 :         hlist_add_head(&dentry->d_u.d_alias, &inode->i_dentry);
    2104    51616429 :         if (!disconnected) {
    2105           0 :                 hlist_bl_lock(&dentry->d_sb->s_roots);
    2106           0 :                 hlist_bl_add_head(&dentry->d_hash, &dentry->d_sb->s_roots);
    2107           0 :                 hlist_bl_unlock(&dentry->d_sb->s_roots);
    2108             :         }
    2109    51616429 :         spin_unlock(&dentry->d_lock);
    2110    51602454 :         spin_unlock(&inode->i_lock);
    2111             : 
    2112    51602454 :         return dentry;
    2113             : 
    2114             :  out_iput:
    2115         813 :         iput(inode);
    2116         813 :         return res;
    2117             : }
    2118             : 
    2119           0 : struct dentry *d_instantiate_anon(struct dentry *dentry, struct inode *inode)
    2120             : {
    2121           0 :         return __d_instantiate_anon(dentry, inode, true);
    2122             : }
    2123             : EXPORT_SYMBOL(d_instantiate_anon);
    2124             : 
    2125   230037869 : static struct dentry *__d_obtain_alias(struct inode *inode, bool disconnected)
    2126             : {
    2127   230037869 :         struct dentry *tmp;
    2128   230037869 :         struct dentry *res;
    2129             : 
    2130   230037869 :         if (!inode)
    2131             :                 return ERR_PTR(-ESTALE);
    2132   230037869 :         if (IS_ERR(inode))
    2133             :                 return ERR_CAST(inode);
    2134             : 
    2135   230013254 :         res = d_find_any_alias(inode);
    2136   232119163 :         if (res)
    2137   180568926 :                 goto out_iput;
    2138             : 
    2139    51550237 :         tmp = d_alloc_anon(inode->i_sb);
    2140    51381312 :         if (!tmp) {
    2141           0 :                 res = ERR_PTR(-ENOMEM);
    2142           0 :                 goto out_iput;
    2143             :         }
    2144             : 
    2145    51381312 :         return __d_instantiate_anon(tmp, inode, disconnected);
    2146             : 
    2147   180568926 : out_iput:
    2148   180568926 :         iput(inode);
    2149   180568926 :         return res;
    2150             : }
    2151             : 
    2152             : /**
    2153             :  * d_obtain_alias - find or allocate a DISCONNECTED dentry for a given inode
    2154             :  * @inode: inode to allocate the dentry for
    2155             :  *
    2156             :  * Obtain a dentry for an inode resulting from NFS filehandle conversion or
    2157             :  * similar open by handle operations.  The returned dentry may be anonymous,
    2158             :  * or may have a full name (if the inode was already in the cache).
    2159             :  *
    2160             :  * When called on a directory inode, we must ensure that the inode only ever
    2161             :  * has one dentry.  If a dentry is found, that is returned instead of
    2162             :  * allocating a new one.
    2163             :  *
    2164             :  * On successful return, the reference to the inode has been transferred
    2165             :  * to the dentry.  In case of an error the reference on the inode is released.
    2166             :  * To make it easier to use in export operations a %NULL or IS_ERR inode may
    2167             :  * be passed in and the error will be propagated to the return value,
    2168             :  * with a %NULL @inode replaced by ERR_PTR(-ESTALE).
    2169             :  */
    2170   231014258 : struct dentry *d_obtain_alias(struct inode *inode)
    2171             : {
    2172   231014258 :         return __d_obtain_alias(inode, true);
    2173             : }
    2174             : EXPORT_SYMBOL(d_obtain_alias);
    2175             : 
    2176             : /**
    2177             :  * d_obtain_root - find or allocate a dentry for a given inode
    2178             :  * @inode: inode to allocate the dentry for
    2179             :  *
    2180             :  * Obtain an IS_ROOT dentry for the root of a filesystem.
    2181             :  *
    2182             :  * We must ensure that directory inodes only ever have one dentry.  If a
    2183             :  * dentry is found, that is returned instead of allocating a new one.
    2184             :  *
    2185             :  * On successful return, the reference to the inode has been transferred
    2186             :  * to the dentry.  In case of an error the reference on the inode is
    2187             :  * released.  A %NULL or IS_ERR inode may be passed in and the
    2188             :  * error will be propagated to the return value, with a %NULL @inode
    2189             :  * replaced by ERR_PTR(-ESTALE).
    2190             :  */
    2191           0 : struct dentry *d_obtain_root(struct inode *inode)
    2192             : {
    2193           0 :         return __d_obtain_alias(inode, false);
    2194             : }
    2195             : EXPORT_SYMBOL(d_obtain_root);
    2196             : 
    2197             : /**
    2198             :  * d_add_ci - lookup or allocate new dentry with case-exact name
    2199             :  * @inode:  the inode case-insensitive lookup has found
    2200             :  * @dentry: the negative dentry that was passed to the parent's lookup func
    2201             :  * @name:   the case-exact name to be associated with the returned dentry
    2202             :  *
    2203             :  * This is to avoid filling the dcache with case-insensitive names to the
    2204             :  * same inode, only the actual correct case is stored in the dcache for
    2205             :  * case-insensitive filesystems.
    2206             :  *
    2207             :  * For a case-insensitive lookup match and if the case-exact dentry
    2208             :  * already exists in the dcache, use it and return it.
    2209             :  *
    2210             :  * If no entry exists with the exact case name, allocate new dentry with
    2211             :  * the exact case, and return the spliced entry.
    2212             :  */
    2213      484528 : struct dentry *d_add_ci(struct dentry *dentry, struct inode *inode,
    2214             :                         struct qstr *name)
    2215             : {
    2216      484528 :         struct dentry *found, *res;
    2217             : 
    2218             :         /*
    2219             :          * First check if a dentry matching the name already exists,
    2220             :          * if not go ahead and create it now.
    2221             :          */
    2222      484528 :         found = d_hash_and_lookup(dentry->d_parent, name);
    2223      484528 :         if (found) {
    2224      357324 :                 iput(inode);
    2225      357324 :                 return found;
    2226             :         }
    2227      127204 :         if (d_in_lookup(dentry)) {
    2228      126951 :                 found = d_alloc_parallel(dentry->d_parent, name,
    2229             :                                         dentry->d_wait);
    2230      126951 :                 if (IS_ERR(found) || !d_in_lookup(found)) {
    2231           0 :                         iput(inode);
    2232           0 :                         return found;
    2233             :                 }
    2234             :         } else {
    2235         253 :                 found = d_alloc(dentry->d_parent, name);
    2236         253 :                 if (!found) {
    2237           0 :                         iput(inode);
    2238           0 :                         return ERR_PTR(-ENOMEM);
    2239             :                 } 
    2240             :         }
    2241      127204 :         res = d_splice_alias(inode, found);
    2242      127204 :         if (res) {
    2243           0 :                 d_lookup_done(found);
    2244           0 :                 dput(found);
    2245           0 :                 return res;
    2246             :         }
    2247             :         return found;
    2248             : }
    2249             : EXPORT_SYMBOL(d_add_ci);
    2250             : 
    2251             : /**
    2252             :  * d_same_name - compare a dentry's name with a given name
    2253             :  * @parent: parent dentry; its ->d_compare() is used if DCACHE_OP_COMPARE is set
    2254             :  * @dentry: the dentry whose name is compared
    2255             :  * @name:   the name to compare against
    2256             :  *
    2257             :  * Return: true if the names are the same, false otherwise
    2258             :  */
    2259   929714742 : bool d_same_name(const struct dentry *dentry, const struct dentry *parent,
    2260             :                  const struct qstr *name)
    2261             : {
    2262   929714742 :         if (likely(!(parent->d_flags & DCACHE_OP_COMPARE))) {
    2263   929222934 :                 if (dentry->d_name.len != name->len)
    2264             :                         return false;
    2265   929296817 :                 return dentry_cmp(dentry, name->name, name->len) == 0;
    2266             :         }
    2267      491808 :         return parent->d_op->d_compare(dentry,
    2268      491808 :                                        dentry->d_name.len, dentry->d_name.name,
    2269      491808 :                                        name) == 0;
    2270             : }
    2271             : EXPORT_SYMBOL_GPL(d_same_name);
    2272             : 
    2273             : /*
    2274             :  * This is __d_lookup_rcu() when the parent dentry has DCACHE_OP_COMPARE, which
    2275             :  * makes things much nastier.  Returns the matching dentry, or NULL if none.
    2276             :  */
    2277        8874 : static noinline struct dentry *__d_lookup_rcu_op_compare(
    2278             :         const struct dentry *parent,
    2279             :         const struct qstr *name,
    2280             :         unsigned *seqp)
    2281             : {
    2282        8874 :         u64 hashlen = name->hash_len;
    2283        8874 :         struct hlist_bl_head *b = d_hash(hashlen_hash(hashlen));
    2284        8874 :         struct hlist_bl_node *node;
    2285        8874 :         struct dentry *dentry;
    2286             :         /* Walk the chain for the name's hash; on a hit *seqp gets the sampled d_seq. */
    2287        8987 :         hlist_bl_for_each_entry_rcu(dentry, node, b, d_hash) {
    2288         332 :                 int tlen;
    2289         332 :                 const char *tname;
    2290         332 :                 unsigned seq;
    2291             :                 /* Restart point: taken again if d_seq moved while name and len were read. */
    2292         332 : seqretry:
    2293         332 :                 seq = raw_seqcount_begin(&dentry->d_seq);
    2294         332 :                 if (dentry->d_parent != parent)
    2295         113 :                         continue;
    2296         219 :                 if (d_unhashed(dentry))
    2297           0 :                         continue;
    2298         219 :                 if (dentry->d_name.hash != hashlen_hash(hashlen))
    2299           0 :                         continue;
    2300         219 :                 tlen = dentry->d_name.len;
    2301         219 :                 tname = dentry->d_name.name;
    2302             :                 /* we want a consistent (name,len) pair */
    2303         219 :                 if (read_seqcount_retry(&dentry->d_seq, seq)) {
    2304           0 :                         cpu_relax();
    2305           0 :                         goto seqretry;
    2306             :                 }
    2307         219 :                 if (parent->d_op->d_compare(dentry, tlen, tname, name) != 0) /* non-zero: not this one */
    2308           0 :                         continue;
    2309         219 :                 *seqp = seq;
    2310         219 :                 return dentry;
    2311             :         }
    2312             :         return NULL;
    2313             : }
    2314             : 
    2315             : /**
    2316             :  * __d_lookup_rcu - search for a dentry (racy, store-free)
    2317             :  * @parent: parent dentry
    2318             :  * @name: qstr of name we wish to find
    2319             :  * @seqp: returns d_seq value at the point where the dentry was found
    2320             :  * Returns: dentry, or NULL
    2321             :  *
    2322             :  * __d_lookup_rcu is the dcache lookup function for rcu-walk name
    2323             :  * resolution (store-free path walking) design described in
    2324             :  * Documentation/filesystems/path-lookup.txt.
    2325             :  *
    2326             :  * This is not to be used outside core vfs.
    2327             :  *
    2328             :  * __d_lookup_rcu must only be used in rcu-walk mode, ie. with vfsmount lock
    2329             :  * held, and rcu_read_lock held. The returned dentry must not be stored into
    2330             :  * without taking d_lock and checking d_seq sequence count against the value
    2331             :  * returned here through @seqp.
    2332             :  *
    2333             :  * A refcount may be taken on the found dentry with the d_rcu_to_refcount
    2334             :  * function.
    2335             :  *
    2336             :  * Alternatively, __d_lookup_rcu may be called again to look up the child of
    2337             :  * the returned dentry, so long as its parent's seqlock is checked after the
    2338             :  * child is looked up. Thus, an interlocking stepping of sequence lock checks
    2339             :  * is formed, giving integrity down the path walk.
    2340             :  *
    2341             :  * NOTE! The caller *has* to check the resulting dentry against the sequence
    2342             :  * number we've returned before using any of the resulting dentry state!
    2343             :  */
    2344 38307356403 : struct dentry *__d_lookup_rcu(const struct dentry *parent,
    2345             :                                 const struct qstr *name,
    2346             :                                 unsigned *seqp)
    2347             : {
    2348 38307356403 :         u64 hashlen = name->hash_len;
    2349 38307356403 :         const unsigned char *str = name->name;
    2350 38307356403 :         struct hlist_bl_head *b = d_hash(hashlen_hash(hashlen));
    2351 38306961153 :         struct hlist_bl_node *node;
    2352 38306961153 :         struct dentry *dentry;
    2353             : 
    2354             :         /*
    2355             :          * Note: There is significant duplication with __d_lookup which is
    2356             :          * required to prevent single threaded performance regressions
    2357             :          * especially on architectures where smp_rmb (in seqcounts) are costly.
    2358             :          * Keep the two functions in sync.
    2359             :          */
    2360             : 
    2361 38306961153 :         if (unlikely(parent->d_flags & DCACHE_OP_COMPARE))
    2362        8875 :                 return __d_lookup_rcu_op_compare(parent, name, seqp);
    2363             : 
    2364             :         /*
    2365             :          * The hash list is protected using RCU.
    2366             :          *
    2367             :          * Carefully use d_seq when comparing a candidate dentry, to avoid
    2368             :          * races with d_move().
    2369             :          *
    2370             :          * It is possible that concurrent renames can mess up our list
    2371             :          * walk here and result in missing our dentry, resulting in the
    2372             :          * false-negative result. d_lookup() protects against concurrent
    2373             :          * renames using rename_lock seqlock.
    2374             :          *
    2375             :          * See Documentation/filesystems/path-lookup.txt for more details.
    2376             :          */
    2377 41494521000 :         hlist_bl_for_each_entry_rcu(dentry, node, b, d_hash) {
    2378 39860585983 :                 unsigned seq;
    2379             : 
    2380             :                 /*
    2381             :                  * The dentry sequence count protects us from concurrent
    2382             :                  * renames, and thus protects parent and name fields.
    2383             :                  *
    2384             :                  * The caller must perform a seqcount check in order
    2385             :                  * to do anything useful with the returned dentry.
    2386             :                  *
    2387             :                  * NOTE! We do a "raw" seqcount_begin here. That means that
    2388             :                  * we don't wait for the sequence count to stabilize if it
    2389             :                  * is in the middle of a sequence change. If we do the slow
    2390             :                  * dentry compare, we will do seqretries until it is stable,
    2391             :                  * and if we end up with a successful lookup, we actually
    2392             :                  * want to exit RCU lookup anyway.
    2393             :                  *
    2394             :                  * Note that raw_seqcount_begin still *does* smp_rmb(), so
    2395             :                  * we are still guaranteed NUL-termination of ->d_name.name.
    2396             :                  */
    2397 39860585983 :                 seq = raw_seqcount_begin(&dentry->d_seq);
    2398 39908665701 :                 if (dentry->d_parent != parent)
    2399  3161252379 :                         continue;
    2400 36747413322 :                 if (d_unhashed(dentry))
    2401       31656 :                         continue;
    2402 36747381666 :                 if (dentry->d_name.hash_len != hashlen) /* hash and length checked in one compare */
    2403    26277090 :                         continue;
    2404 36721104576 :                 if (dentry_cmp(dentry, str, hashlen_len(hashlen)) != 0)
    2405        7597 :                         continue;
    2406 36690488508 :                 *seqp = seq;
    2407 36690488508 :                 return dentry;
    2408             :         }
    2409             :         return NULL;
    2410             : }
    2411             : 
    2412             : /**
    2413             :  * d_lookup - search for a dentry
    2414             :  * @parent: parent dentry
    2415             :  * @name: qstr of name we wish to find
    2416             :  * Returns: dentry, or NULL
    2417             :  *
    2418             :  * d_lookup searches the children of the parent dentry for the name in
    2419             :  * question. If the dentry is found its reference count is incremented and the
    2420             :  * dentry is returned. The caller must use dput to free the entry when it has
    2421             :  * finished using it. %NULL is returned if the dentry does not exist.
    2422             :  */
    2423   596745777 : struct dentry *d_lookup(const struct dentry *parent, const struct qstr *name)
    2424             : {
    2425   596778396 :         struct dentry *dentry;
    2426   596778396 :         unsigned seq;
    2427             :         /* A hit is returned at once; a miss is retried if rename_lock changed meanwhile. */
    2428   596778396 :         do {
    2429   596778396 :                 seq = read_seqbegin(&rename_lock);
    2430   596630891 :                 dentry = __d_lookup(parent, name);
    2431   597405752 :                 if (dentry)
    2432             :                         break;
    2433   175220728 :         } while (read_seqretry(&rename_lock, seq));
    2434   597384745 :         return dentry;
    2435             : }
    2436             : EXPORT_SYMBOL(d_lookup);
    2437             : 
    2438             : /**
    2439             :  * __d_lookup - search for a dentry (racy)
    2440             :  * @parent: parent dentry
    2441             :  * @name: qstr of name we wish to find
    2442             :  * Returns: dentry with its reference count incremented, or NULL
    2443             :  *
    2444             :  * __d_lookup is like d_lookup, however it may (rarely) return a
    2445             :  * false-negative result due to unrelated rename activity.
    2446             :  *
    2447             :  * __d_lookup is slightly faster by avoiding rename_lock read seqlock,
    2448             :  * however it must be used carefully, eg. with a following d_lookup in
    2449             :  * the case of failure.
    2450             :  *
    2451             :  * __d_lookup callers must be commented.
    2452             :  */
    2453  1116928694 : struct dentry *__d_lookup(const struct dentry *parent, const struct qstr *name)
    2454             : {
    2455  1116928694 :         unsigned int hash = name->hash;
    2456  1116928694 :         struct hlist_bl_head *b = d_hash(hash);
    2457  1116788592 :         struct hlist_bl_node *node;
    2458  1116788592 :         struct dentry *found = NULL;
    2459  1116788592 :         struct dentry *dentry;
    2460             : 
    2461             :         /*
    2462             :          * Note: There is significant duplication with __d_lookup_rcu which is
    2463             :          * required to prevent single threaded performance regressions
    2464             :          * especially on architectures where smp_rmb (in seqcounts) are costly.
    2465             :          * Keep the two functions in sync.
    2466             :          */
    2467             : 
    2468             :         /*
    2469             :          * The hash list is protected using RCU.
    2470             :          *
    2471             :          * Take d_lock when comparing a candidate dentry, to avoid races
    2472             :          * with d_move().
    2473             :          *
    2474             :          * It is possible that concurrent renames can mess up our list
    2475             :          * walk here and result in missing our dentry, resulting in the
    2476             :          * false-negative result. d_lookup() protects against concurrent
    2477             :          * renames using rename_lock seqlock.
    2478             :          *
    2479             :          * See Documentation/filesystems/path-lookup.txt for more details.
    2480             :          */
    2481  1116788592 :         rcu_read_lock();
    2482             :         /* Walk the chain; d_lock is only taken once the unlocked hash test passes. */
    2483  1192058259 :         hlist_bl_for_each_entry_rcu(dentry, node, b, d_hash) {
    2484             : 
    2485   998608065 :                 if (dentry->d_name.hash != hash)
    2486    74521317 :                         continue;
    2487             : 
    2488   924086748 :                 spin_lock(&dentry->d_lock);
    2489   924813720 :                 if (dentry->d_parent != parent)
    2490       22580 :                         goto next;
    2491   924791140 :                 if (d_unhashed(dentry))
    2492         306 :                         goto next;
    2493             : 
    2494   924790834 :                 if (!d_same_name(dentry, parent, name))
    2495        6822 :                         goto next;
    2496             :                 /* Match: bump the reference count while d_lock is still held. */
    2497   924574873 :                 dentry->d_lockref.count++;
    2498   924574873 :                 found = dentry;
    2499   924574873 :                 spin_unlock(&dentry->d_lock);
    2500             :                 break;
    2501       29708 : next:
    2502       29708 :                 spin_unlock(&dentry->d_lock);
    2503             :         }
    2504  1118341975 :         rcu_read_unlock();
    2505             : 
    2506  1118190042 :         return found;
    2507             : }
    2508             : 
    2509             : /**
    2510             :  * d_hash_and_lookup - hash the qstr then search for a dentry
    2511             :  * @dir: Directory to search in
    2512             :  * @name: qstr of name we wish to find; its ->hash is (re)computed here
    2513             :  *
    2514             :  * Return: the d_lookup() result, NULL on lookup failure; on bad name - ERR_PTR(-error)
    2515             :  */
    2516    21137332 : struct dentry *d_hash_and_lookup(struct dentry *dir, struct qstr *name)
    2517             : {
    2518             :         /*
    2519             :          * Check for a fs-specific hash function. Note that we must
    2520             :          * calculate the standard hash first, as the d_op->d_hash()
    2521             :          * routine may choose to leave the hash value unchanged.
    2522             :          */
    2523    21137332 :         name->hash = full_name_hash(dir, name->name, name->len);
    2524    21137332 :         if (dir->d_flags & DCACHE_OP_HASH) {
    2525           0 :                 int err = dir->d_op->d_hash(dir, name);
    2526           0 :                 if (unlikely(err < 0)) /* negative return from ->d_hash() is passed back as ERR_PTR */
    2527           0 :                         return ERR_PTR(err);
    2528             :         }
    2529    21137332 :         return d_lookup(dir, name);
    2530             : }
    2531             : EXPORT_SYMBOL(d_hash_and_lookup);
    2532             : 
    2533             : /*
    2534             :  * When a file is deleted, we have two options:
    2535             :  * - turn this dentry into a negative dentry
    2536             :  * - unhash this dentry and free it.
    2537             :  *
    2538             :  * Usually, we want to just turn this into
    2539             :  * a negative dentry, but if anybody else is
    2540             :  * currently using the dentry or the inode
    2541             :  * we can't do that and we fall back on removing
    2542             :  * it from the hash queues and waiting for
    2543             :  * it to be deleted later when it has no users
    2544             :  */
    2545             :  
    2546             : /**
    2547             :  * d_delete - delete a dentry
    2548             :  * @dentry: The dentry to delete; must have an inode (its i_lock is taken here)
    2549             :  *
    2550             :  * Turn the dentry into a negative dentry if possible, otherwise
    2551             :  * remove it from the hash queues so it can be deleted later
    2552             :  */
    2553             :  
    2554    59464216 : void d_delete(struct dentry * dentry)
    2555             : {
    2556    59464216 :         struct inode *inode = dentry->d_inode;
    2557             : 
    2558    59464216 :         spin_lock(&inode->i_lock);
    2559    59482323 :         spin_lock(&dentry->d_lock);
    2560             :         /*
    2561             :          * Are we the only user?
    2562             :          */
    2563    59480622 :         if (dentry->d_lockref.count == 1) {
    2564    59217427 :                 dentry->d_flags &= ~DCACHE_CANT_MOUNT;
    2565    59217427 :                 dentry_unlink_inode(dentry); /* NOTE(review): presumably drops d_lock and i_lock; confirm */
    2566             :         } else {
    2567      263195 :                 __d_drop(dentry); /* still in use elsewhere: just unhash it */
    2568      263198 :                 spin_unlock(&dentry->d_lock);
    2569      263198 :                 spin_unlock(&inode->i_lock);
    2570             :         }
    2571    59462053 : }
    2572             : EXPORT_SYMBOL(d_delete);
    2573             : /* Insert @entry at the head of the d_hash() chain for its name hash, under the chain lock. */
    2574   997316348 : static void __d_rehash(struct dentry *entry)
    2575             : {
    2576   997316348 :         struct hlist_bl_head *b = d_hash(entry->d_name.hash);
    2577             : 
    2578   997019061 :         hlist_bl_lock(b);
    2579   997581971 :         hlist_bl_add_head_rcu(&entry->d_hash, b);
    2580   997623112 :         hlist_bl_unlock(b);
    2581   997455370 : }
    2582             : 
    2583             : /**
    2584             :  * d_rehash     - add an entry back to the hash
    2585             :  * @entry: dentry to add to the hash
    2586             :  *
    2587             :  * Adds a dentry to the hash according to its name, holding its d_lock meanwhile.
    2588             :  */
    2589             :  
    2590           0 : void d_rehash(struct dentry * entry)
    2591             : {
    2592           0 :         spin_lock(&entry->d_lock);
    2593           0 :         __d_rehash(entry);
    2594           0 :         spin_unlock(&entry->d_lock);
    2595           0 : }
    2596             : EXPORT_SYMBOL(d_rehash);
    2597             : /* Spin until dir->i_dir_seq is even and cmpxchg() bumps it to odd; returns the old even value. */
    2598   831040023 : static inline unsigned start_dir_add(struct inode *dir)
    2599             : {
    2600   831040023 :         preempt_disable_nested(); /* left disabled on return; end_dir_add() re-enables */
    2601   837866758 :         for (;;) {
    2602   837866758 :                 unsigned n = dir->i_dir_seq;
    2603   837866758 :                 if (!(n & 1) && cmpxchg(&dir->i_dir_seq, n, n + 1) == n)
    2604   831398074 :                         return n;
    2605     6762713 :                 cpu_relax();
    2606             :         }
    2607             : }
    2608             : /* Store i_dir_seq = @n + 2 with release semantics, re-enable preemption, wake all on @d_wait. */
    2609   831098981 : static inline void end_dir_add(struct inode *dir, unsigned int n,
    2610             :                                wait_queue_head_t *d_wait)
    2611             : {
    2612   831098981 :         smp_store_release(&dir->i_dir_seq, n + 2);
    2613   831107360 :         preempt_enable_nested();
    2614   831107360 :         wake_up_all(d_wait);
    2615   831247876 : }
    2616             : /* Sleep until @dentry leaves in-lookup state; ->d_lock is dropped around each schedule(). */
    2617     2548221 : static void d_wait_lookup(struct dentry *dentry)
    2618             : {
    2619     2548221 :         if (d_in_lookup(dentry)) {
    2620       81531 :                 DECLARE_WAITQUEUE(wait, current);
    2621       81531 :                 add_wait_queue(dentry->d_wait, &wait);
    2622       81531 :                 do {
    2623       81531 :                         set_current_state(TASK_UNINTERRUPTIBLE);
    2624       81531 :                         spin_unlock(&dentry->d_lock);
    2625       81531 :                         schedule();
    2626       81516 :                         spin_lock(&dentry->d_lock); /* retake before re-testing d_in_lookup() */
    2627       81531 :                 } while (d_in_lookup(dentry));
    2628             :         }
    2629     2548221 : }
    2630             : /* Return an existing dentry for @name under @parent, or a new in-lookup one; ERR_PTR(-ENOMEM) on failure. */
    2631   839001428 : struct dentry *d_alloc_parallel(struct dentry *parent,
    2632             :                                 const struct qstr *name,
    2633             :                                 wait_queue_head_t *wq)
    2634             : {
    2635   839001428 :         unsigned int hash = name->hash;
    2636   839001428 :         struct hlist_bl_head *b = in_lookup_hash(parent, hash);
    2637   839001428 :         struct hlist_bl_node *node;
    2638   839001428 :         struct dentry *new = d_alloc(parent, name);
    2639   839775953 :         struct dentry *dentry;
    2640   839775953 :         unsigned seq, r_seq, d_seq;
    2641             :         /* "new" is allocated up front and dput() again whenever an existing dentry is returned. */
    2642   839775953 :         if (unlikely(!new))
    2643             :                 return ERR_PTR(-ENOMEM);
    2644             :         /* Lockless dcache lookup first, bracketed by i_dir_seq and rename_lock samples. */
    2645   839775953 : retry:
    2646   868302245 :         rcu_read_lock();
    2647   868253097 :         seq = smp_load_acquire(&parent->d_inode->i_dir_seq);
    2648   868253097 :         r_seq = read_seqbegin(&rename_lock);
    2649   868039292 :         dentry = __d_lookup_rcu(parent, name, &d_seq);
    2650   867991655 :         if (unlikely(dentry)) {
    2651     5812981 :                 if (!lockref_get_not_dead(&dentry->d_lockref)) {
    2652     1283825 :                         rcu_read_unlock();
    2653     1283687 :                         goto retry;
    2654             :                 }
    2655     4538448 :                 if (read_seqcount_retry(&dentry->d_seq, d_seq)) {
    2656           0 :                         rcu_read_unlock();
    2657           0 :                         dput(dentry);
    2658           0 :                         goto retry;
    2659             :                 }
    2660     4526841 :                 rcu_read_unlock();
    2661     4527066 :                 dput(new);
    2662     4527066 :                 return dentry;
    2663             :         }
    2664   862178674 :         if (unlikely(read_seqretry(&rename_lock, r_seq))) {
    2665        8840 :                 rcu_read_unlock();
    2666        8839 :                 goto retry;
    2667             :         }
    2668             :         /* Odd i_dir_seq means start_dir_add() is in progress on the parent: retry. */
    2669   862137024 :         if (unlikely(seq & 1)) {
    2670    25598394 :                 rcu_read_unlock();
    2671    25620620 :                 goto retry;
    2672             :         }
    2673             :         /* Lock the in-lookup chain, then recheck that i_dir_seq has not moved since sampled. */
    2674   836538630 :         hlist_bl_lock(b);
    2675   836735899 :         if (unlikely(READ_ONCE(parent->d_inode->i_dir_seq) != seq)) {
    2676     1606218 :                 hlist_bl_unlock(b);
    2677     1605717 :                 rcu_read_unlock();
    2678     1605759 :                 goto retry;
    2679             :         }
    2680             :         /*
    2681             :          * No changes for the parent since the beginning of d_lookup().
    2682             :          * Since all removals from the chain happen with hlist_bl_lock(),
    2683             :          * any potential in-lookup matches are going to stay here until
    2684             :          * we unlock the chain.  All fields are stable in everything
    2685             :          * we encounter.
    2686             :          */
    2687   835139530 :         hlist_bl_for_each_entry(dentry, node, b, d_u.d_in_lookup_hash) {
    2688     2560769 :                 if (dentry->d_name.hash != hash)
    2689        9839 :                         continue;
    2690     2550930 :                 if (dentry->d_parent != parent)
    2691           0 :                         continue;
    2692     2550930 :                 if (!d_same_name(dentry, parent, name))
    2693          10 :                         continue;
    2694     2548533 :                 hlist_bl_unlock(b);
    2695             :                 /* now we can try to grab a reference */
    2696     2548532 :                 if (!lockref_get_not_dead(&dentry->d_lockref)) {
    2697         312 :                         rcu_read_unlock();
    2698         312 :                         goto retry;
    2699             :                 }
    2700             : 
    2701     2548192 :                 rcu_read_unlock();
    2702             :                 /*
    2703             :                  * somebody is likely to be still doing lookup for it;
    2704             :                  * wait for them to finish
    2705             :                  */
    2706     2548130 :                 spin_lock(&dentry->d_lock);
    2707     2548221 :                 d_wait_lookup(dentry);
    2708             :                 /*
    2709             :                  * it's not in-lookup anymore; in principle we should repeat
    2710             :                  * everything from dcache lookup, but it's likely to be what
    2711             :                  * d_lookup() would've found anyway.  If it is, just return it;
    2712             :                  * otherwise we really have to repeat the whole thing.
    2713             :                  */
    2714     2548220 :                 if (unlikely(dentry->d_name.hash != hash))
    2715           0 :                         goto mismatch;
    2716     2548220 :                 if (unlikely(dentry->d_parent != parent))
    2717           0 :                         goto mismatch;
    2718     2548220 :                 if (unlikely(d_unhashed(dentry)))
    2719        7075 :                         goto mismatch;
    2720     2541145 :                 if (unlikely(!d_same_name(dentry, parent, name)))
    2721           0 :                         goto mismatch;
    2722             :                 /* OK, it *is* a hashed match; return it */
    2723     2541145 :                 spin_unlock(&dentry->d_lock);
    2724     2541138 :                 dput(new);
    2725     2541138 :                 return dentry;
    2726             :         }
    2727   832578761 :         rcu_read_unlock();
    2728             :         /* we can't take ->d_lock here; it's OK, though. */
    2729   832593381 :         new->d_flags |= DCACHE_PAR_LOOKUP;
    2730   832593381 :         new->d_wait = wq;
    2731   832593381 :         hlist_bl_add_head_rcu(&new->d_u.d_in_lookup_hash, b); /* chain lock still held here */
    2732   832466827 :         hlist_bl_unlock(b);
    2733   832466827 :         return new;
    2734        7075 : mismatch:
    2735        7075 :         spin_unlock(&dentry->d_lock);
    2736        7075 :         dput(dentry);
    2737        7075 :         goto retry;
    2738             : }
    2739             : EXPORT_SYMBOL(d_alloc_parallel);
    2740             : 
    2741             : /*
    2742             :  * - Remove the dentry from the in-lookup hash and clear DCACHE_PAR_LOOKUP
    2743             :  * - Retrieve and clear the waitqueue head in dentry
    2744             :  * - Return the waitqueue head; the caller must hold dentry->d_lock
    2745             :  */
    2746   832568716 : static wait_queue_head_t *__d_lookup_unhash(struct dentry *dentry)
    2747             : {
    2748   832568716 :         wait_queue_head_t *d_wait;
    2749   832568716 :         struct hlist_bl_head *b;
    2750             : 
    2751   832568716 :         lockdep_assert_held(&dentry->d_lock);
    2752             : 
    2753   832568716 :         b = in_lookup_hash(dentry->d_parent, dentry->d_name.hash);
    2754   832568716 :         hlist_bl_lock(b);
    2755   832694225 :         dentry->d_flags &= ~DCACHE_PAR_LOOKUP;
    2756   832694225 :         __hlist_bl_del(&dentry->d_u.d_in_lookup_hash);
    2757   832706417 :         d_wait = dentry->d_wait;
    2758   832706417 :         dentry->d_wait = NULL;
    2759   832706417 :         hlist_bl_unlock(b);
    2760   832659286 :         INIT_HLIST_NODE(&dentry->d_u.d_alias); /* reinitialised only after the chain lock is dropped */
    2761   832659286 :         INIT_LIST_HEAD(&dentry->d_lru);
    2762   832659286 :         return d_wait;
    2763             : }
    2764             : /* Under ->d_lock: end @dentry's in-lookup state and wake everyone on the returned waitqueue. */
    2765     1221089 : void __d_lookup_unhash_wake(struct dentry *dentry)
    2766             : {
    2767     1221089 :         spin_lock(&dentry->d_lock);
    2768     1221086 :         wake_up_all(__d_lookup_unhash(dentry));
    2769     1221067 :         spin_unlock(&dentry->d_lock);
    2770     1221062 : }
    2771             : EXPORT_SYMBOL(__d_lookup_unhash_wake);
    2772             : 
    2773             : /* inode->i_lock held if inode is non-NULL; it is released here before returning */
    2774             : /* Attach @inode (may be NULL) to @dentry and hash it, ending any in-lookup state first. */
    2775   929461457 : static inline void __d_add(struct dentry *dentry, struct inode *inode)
    2776             : {
    2777   929461457 :         wait_queue_head_t *d_wait;
    2778   929461457 :         struct inode *dir = NULL;
    2779   929461457 :         unsigned n;
    2780   929461457 :         spin_lock(&dentry->d_lock);
    2781   929749995 :         if (unlikely(d_in_lookup(dentry))) {
    2782   826029841 :                 dir = dentry->d_parent->d_inode;
    2783   826029841 :                 n = start_dir_add(dir);
    2784   826342852 :                 d_wait = __d_lookup_unhash(dentry);
    2785             :         }
    2786   930081447 :         if (inode) {
    2787    62102201 :                 unsigned add_flags = d_flags_for_inode(inode);
    2788    62091623 :                 hlist_add_head(&dentry->d_u.d_alias, &inode->i_dentry);
    2789    62091623 :                 raw_write_seqcount_begin(&dentry->d_seq); /* inode/type update bracketed by d_seq */
    2790    62091457 :                 __d_set_inode_and_type(dentry, inode, add_flags);
    2791    62091351 :                 raw_write_seqcount_end(&dentry->d_seq);
    2792    62091254 :                 fsnotify_update_flags(dentry);
    2793             :         }
    2794   930070375 :         __d_rehash(dentry);
    2795   929858681 :         if (dir) /* non-NULL only on the in-lookup path, where n and d_wait were set */
    2796   826149834 :                 end_dir_add(dir, n, d_wait);
    2797   929567200 :         spin_unlock(&dentry->d_lock);
    2798   929914701 :         if (inode)
    2799    62102043 :                 spin_unlock(&inode->i_lock);
    2800   929909079 : }
    2801             : 
    2802             : /**
    2803             :  * d_add - add dentry to hash queues
    2804             :  * @entry: dentry to add
    2805             :  * @inode: The inode to attach to this dentry (may be NULL)
    2806             :  *
    2807             :  * This adds the entry to the hash queues and attaches @inode to it, if given.
    2808             :  * The entry was actually filled in earlier during d_alloc().
    2809             :  */
    2810             : 
    2811   737716309 : void d_add(struct dentry *entry, struct inode *inode)
    2812             : {
    2813   737716309 :         if (inode) {
    2814           8 :                 security_d_instantiate(entry, inode);
    2815           8 :                 spin_lock(&inode->i_lock); /* released again inside __d_add() */
    2816             :         }
    2817   737716309 :         __d_add(entry, inode);
    2818   737856019 : }
    2819             : EXPORT_SYMBOL(d_add);
    2820             : 
    2821             : /**
    2822             :  * d_exact_alias - find and hash an exact unhashed alias
    2823             :  * @entry: dentry to add
    2824             :  * @inode: The inode to go with this dentry
    2825             :  *
    2826             :  * If an unhashed dentry with the same name/parent and desired
    2827             :  * inode already exists, take a reference, hash and return it.  Otherwise,
    2828             :  * return NULL.  Only the first name/parent match on @inode is examined.
    2829             :  *
    2830             :  * Parent directory should be locked.
    2831             :  */
    2832       27203 : struct dentry *d_exact_alias(struct dentry *entry, struct inode *inode)
    2833             : {
    2834       27203 :         struct dentry *alias;
    2835       27203 :         unsigned int hash = entry->d_name.hash;
    2836             : 
    2837       27203 :         spin_lock(&inode->i_lock);
    2838       54406 :         hlist_for_each_entry(alias, &inode->i_dentry, d_u.d_alias) {
    2839             :                 /*
    2840             :                  * Don't need alias->d_lock here, because aliases with
    2841             :                  * d_parent == entry->d_parent are not subject to name or
    2842             :                  * parent changes, because the parent inode i_mutex is held.
    2843             :                  */
    2844           1 :                 if (alias->d_name.hash != hash)
    2845           0 :                         continue;
    2846           1 :                 if (alias->d_parent != entry->d_parent)
    2847           0 :                         continue;
    2848           1 :                 if (!d_same_name(alias, entry->d_parent, &entry->d_name))
    2849           0 :                         continue;
    2850           0 :                 spin_lock(&alias->d_lock);
    2851           0 :                 if (!d_unhashed(alias)) { /* already hashed: not a candidate, report NULL */
    2852           0 :                         spin_unlock(&alias->d_lock);
    2853           0 :                         alias = NULL;
    2854             :                 } else {
    2855           0 :                         __dget_dlock(alias);
    2856           0 :                         __d_rehash(alias);
    2857           0 :                         spin_unlock(&alias->d_lock);
    2858             :                 }
    2859           0 :                 spin_unlock(&inode->i_lock);
    2860           0 :                 return alias;
    2861             :         }
    2862       27202 :         spin_unlock(&inode->i_lock);
    2863       27202 :         return NULL;
    2864             : }
    2865             : EXPORT_SYMBOL(d_exact_alias);
    2866             : 
                       /*
                        * swap_names - exchange the names of two dentries
                        * @dentry: first dentry
                        * @target: second dentry
                        *
                        * A name is either "external" (dname_external() is true and d_name.name
                        * points at separately allocated storage) or "internal" (d_name.name
                        * points at the dentry's own d_iname buffer).  The four combinations
                        * are handled separately so that external storage is handed over by
                        * pointer while inline bytes are copied or swapped.  d_name.hash_len
                        * is swapped unconditionally at the end.
                        *
                        * No locking is done here; NOTE(review): the only caller visible in
                        * this file is __d_move(), which holds both d_locks - confirm there
                        * are no others.
                        */
    2867    12974550 : static void swap_names(struct dentry *dentry, struct dentry *target)
    2868             : {
    2869    12974550 :         if (unlikely(dname_external(target))) {
    2870        1651 :                 if (unlikely(dname_external(dentry))) {
    2871             :                         /*
    2872             :                          * Both external: swap the pointers
    2873             :                          */
    2874         452 :                         swap(target->d_name.name, dentry->d_name.name);
    2875             :                 } else {
    2876             :                         /*
    2877             :                          * dentry:internal, target:external.  Steal target's
    2878             :                          * storage and make target internal.
    2879             :                          */
                                               /* len + 1 bytes: the name plus one trailing byte. */
    2880        2398 :                         memcpy(target->d_iname, dentry->d_name.name,
    2881             :                                         dentry->d_name.len + 1);
    2882        1199 :                         dentry->d_name.name = target->d_name.name;
    2883        1199 :                         target->d_name.name = target->d_iname;
    2884             :                 }
    2885             :         } else {
    2886    12972899 :                 if (unlikely(dname_external(dentry))) {
    2887             :                         /*
    2888             :                          * dentry:external, target:internal.  Give dentry's
    2889             :                          * storage to target and make dentry internal
    2890             :                          */
    2891        2334 :                         memcpy(dentry->d_iname, target->d_name.name,
    2892             :                                         target->d_name.len + 1);
    2893        1167 :                         target->d_name.name = dentry->d_name.name;
    2894        1167 :                         dentry->d_name.name = dentry->d_iname;
    2895             :                 } else {
    2896             :                         /*
    2897             :                          * Both are internal.
    2898             :                          */
                                               /*
                                                * Swap the whole inline buffers one long at a time.
                                                * The BUILD_BUG_ON guarantees DNAME_INLINE_LEN is a
                                                * multiple of sizeof(long), so no tail is left over.
                                                * The name pointers stay as they are: each already
                                                * points at its own d_iname.
                                                */
    2899             :                         unsigned int i;
    2900             :                         BUILD_BUG_ON(!IS_ALIGNED(DNAME_INLINE_LEN, sizeof(long)));
    2901    64858660 :                         for (i = 0; i < DNAME_INLINE_LEN / sizeof(long); i++) {
    2902    51886928 :                                 swap(((long *) &dentry->d_iname)[i],
    2903             :                                      ((long *) &target->d_iname)[i]);
    2904             :                         }
    2905             :                 }
    2906             :         }
                               /* Hash and length travel with the name in every case. */
    2907    12974550 :         swap(dentry->d_name.hash_len, target->d_name.hash_len);
    2908    12974550 : }
    2909             : 
                       /*
                        * copy_name - make @dentry carry the same name as @target
                        * @dentry: dentry whose name is overwritten
                        * @target: dentry whose name is copied; its own name is left untouched
                        *
                        * If @target's name is external, the storage is shared: its u.count is
                        * incremented and the whole d_name struct is copied.  Otherwise the
                        * bytes are copied into @dentry's inline d_iname buffer.
                        *
                        * If @dentry had an external name before the call, its u.count is
                        * decremented afterwards and the storage is handed to kfree_rcu() when
                        * the count reaches zero.
                        */
    2910    41540811 : static void copy_name(struct dentry *dentry, struct dentry *target)
    2911             : {
    2912    41540811 :         struct external_name *old_name = NULL;
                               /* Remember the old external storage before d_name is overwritten. */
    2913    41540811 :         if (unlikely(dname_external(dentry)))
    2914     1136180 :                 old_name = external_name(dentry);
    2915    41540811 :         if (unlikely(dname_external(target))) {
    2916     1063154 :                 atomic_inc(&external_name(target)->u.count);
    2917     1063154 :                 dentry->d_name = target->d_name;
    2918             :         } else {
                                       /* len + 1 bytes: the name plus one trailing byte. */
    2919    80955314 :                 memcpy(dentry->d_iname, target->d_name.name,
    2920             :                                 target->d_name.len + 1);
    2921    40477657 :                 dentry->d_name.name = dentry->d_iname;
    2922    40477657 :                 dentry->d_name.hash_len = target->d_name.hash_len;
    2923             :         }
                               /* Drop the count held on the previous external name, if any. */
    2924    41540811 :         if (old_name && likely(atomic_dec_and_test(&old_name->u.count)))
    2925           0 :                 kfree_rcu(old_name, u.head);
    2926    41540811 : }
    2927             : 
    2928             : /*
    2929             :  * __d_move - move a dentry
    2930             :  * @dentry: entry to move
    2931             :  * @target: new dentry
    2932             :  * @exchange: exchange the two dentries
    2933             :  *
    2934             :  * Update the dcache to reflect the move of a file name. Negative
    2935             :  * dcache entries should not be moved in this way. Caller must hold
    2936             :  * rename_lock, the i_mutex of the source and target directories,
    2937             :  * and the sb->s_vfs_rename_mutex if they differ. See lock_rename().
                        *
                        * With @exchange false, @dentry takes over @target's parent and name
                        * and is rehashed; @target is dropped from the hash if it was hashed
                        * and is not rehashed.  With @exchange true, the two dentries swap
                        * parents and names and both are rehashed.
                        *
                        * The function warns if @dentry is negative, warns and returns without
                        * doing anything if @dentry == @target, and BUGs if @target is an
                        * ancestor of @dentry.
    2938             :  */
    2939    54515361 : static void __d_move(struct dentry *dentry, struct dentry *target,
    2940             :                      bool exchange)
    2941             : {
    2942    54515361 :         struct dentry *old_parent, *p;
    2943    54515361 :         wait_queue_head_t *d_wait;
    2944    54515361 :         struct inode *dir = NULL;
    2945    54515361 :         unsigned n;
    2946             : 
    2947    54515361 :         WARN_ON(!dentry->d_inode);
    2948    54515361 :         if (WARN_ON(dentry == target))
    2949             :                 return;
    2950             : 
    2951    54515361 :         BUG_ON(d_ancestor(target, dentry));
    2952    54515361 :         old_parent = dentry->d_parent;
                               /*
                                * p is non-NULL iff old_parent is an ancestor of target; it is then
                                * the child of old_parent that lies on the path down to target.
                                * It selects the order in which the two parent d_locks are taken.
                                */
    2953    54515361 :         p = d_ancestor(old_parent, target);
    2954    54515361 :         if (IS_ROOT(dentry)) {
                                       /* dentry is its own parent: only target's parent is locked. */
    2955     5047514 :                 BUG_ON(p);
    2956     5047514 :                 spin_lock(&target->d_parent->d_lock);
    2957    49467847 :         } else if (!p) {
    2958             :                 /* target is not a descendent of dentry->d_parent */
    2959    40027946 :                 spin_lock(&target->d_parent->d_lock);
    2960    40027946 :                 spin_lock_nested(&old_parent->d_lock, DENTRY_D_LOCK_NESTED);
    2961             :         } else {
                                       /*
                                        * target lives below old_parent, so old_parent is locked
                                        * first.  p == target means target is a direct child of
                                        * old_parent, i.e. both parents are the same dentry and
                                        * one lock covers them.
                                        */
    2962     9439901 :                 BUG_ON(p == dentry);
    2963     9439901 :                 spin_lock(&old_parent->d_lock);
    2964     9439901 :                 if (p != target)
    2965     1832686 :                         spin_lock_nested(&target->d_parent->d_lock,
    2966             :                                         DENTRY_D_LOCK_NESTED);
    2967             :         }
                               /* Parents first, then dentry, then target. */
    2968    54515361 :         spin_lock_nested(&dentry->d_lock, 2);
    2969    54515361 :         spin_lock_nested(&target->d_lock, 3);
    2970             : 
                               /*
                                * n and d_wait are assigned only on this path and are read only
                                * when dir is non-NULL (see end_dir_add() below).
                                */
    2971    54515361 :         if (unlikely(d_in_lookup(target))) {
    2972     5047514 :                 dir = target->d_parent->d_inode;
    2973     5047514 :                 n = start_dir_add(dir);
    2974     5047514 :                 d_wait = __d_lookup_unhash(target);
    2975             :         }
    2976             : 
                               /* Open both seqcount write sections; closed in reverse order below. */
    2977    54515361 :         write_seqcount_begin(&dentry->d_seq);
    2978    54515361 :         write_seqcount_begin_nested(&target->d_seq, DENTRY_D_LOCK_NESTED);
    2979             : 
    2980             :         /* unhash both */
    2981    54515361 :         if (!d_unhashed(dentry))
    2982    49467847 :                 ___d_drop(dentry);
    2983    54515361 :         if (!d_unhashed(target))
    2984    49467847 :                 ___d_drop(target);
    2985             : 
    2986             :         /* ... and switch them in the tree */
    2987    54515361 :         dentry->d_parent = target->d_parent;
    2988    54515361 :         if (!exchange) {
    2989    41540811 :                 copy_name(dentry, target);
                                       /*
                                        * NOTE(review): clearing pprev presumably makes target
                                        * read as unhashed after the ___d_drop() above - confirm
                                        * against d_unhashed().
                                        */
    2990    41540811 :                 target->d_hash.pprev = NULL;
                                       /*
                                        * The new parent gains a count for its new child; the old
                                        * parent gives one up unless dentry was its own parent.
                                        * The old parent's count is not expected to reach zero.
                                        */
    2991    41540811 :                 dentry->d_parent->d_lockref.count++;
    2992    41540811 :                 if (dentry != old_parent) /* wasn't IS_ROOT */
    2993    36493297 :                         WARN_ON(!--old_parent->d_lockref.count);
    2994             :         } else {
                                       /* Exchange: target takes dentry's old place and name. */
    2995    12974550 :                 target->d_parent = old_parent;
    2996    12974550 :                 swap_names(dentry, target);
    2997    12974550 :                 list_move(&target->d_child, &target->d_parent->d_subdirs);
    2998    12974550 :                 __d_rehash(target);
    2999    12974550 :                 fsnotify_update_flags(target);
    3000             :         }
    3001    54515361 :         list_move(&dentry->d_child, &dentry->d_parent->d_subdirs);
    3002    54515361 :         __d_rehash(dentry);
    3003    54515361 :         fsnotify_update_flags(dentry);
    3004    54515361 :         fscrypt_handle_d_move(dentry);
    3005             : 
    3006    54515361 :         write_seqcount_end(&target->d_seq);
    3007    54515361 :         write_seqcount_end(&dentry->d_seq);
    3008             : 
    3009    54515361 :         if (dir)
    3010     5047514 :                 end_dir_add(dir, n, d_wait);
    3011             : 
                               /*
                                * dentry->d_parent is now what used to be target's parent.  It is
                                * unlocked separately only when it differs from old_parent, and
                                * old_parent is unlocked only when it was locked at all, i.e.
                                * when dentry was not IS_ROOT on entry.
                                */
    3012    54515361 :         if (dentry->d_parent != old_parent)
    3013    46908146 :                 spin_unlock(&dentry->d_parent->d_lock);
    3014    54515361 :         if (dentry != old_parent)
    3015    49467847 :                 spin_unlock(&old_parent->d_lock);
    3016    54515361 :         spin_unlock(&target->d_lock);
    3017    54515361 :         spin_unlock(&dentry->d_lock);
    3018             : }
    3019             : 
    3020             : /*
    3021             :  * d_move - move a dentry
    3022             :  * @dentry: entry to move
    3023             :  * @target: new dentry
    3024             :  *
    3025             :  * Update the dcache to reflect the move of a file name. Negative
    3026             :  * dcache entries should not be moved in this way. See the locking
    3027             :  * requirements for __d_move.
                        *
                        * rename_lock is taken for writing here, around the call to
                        * __d_move(@dentry, @target, false); the remaining locks listed for
                        * __d_move() are left to the caller.
    3028             :  */
    3029    36492630 : void d_move(struct dentry *dentry, struct dentry *target)
    3030             : {
    3031    36492630 :         write_seqlock(&rename_lock);
    3032    36493297 :         __d_move(dentry, target, false);
    3033    36493297 :         write_sequnlock(&rename_lock);
    3034    36493297 : }
    3035             : EXPORT_SYMBOL(d_move);
    3036             : 
    3037             : /*
    3038             :  * d_exchange - exchange two dentries
    3039             :  * @dentry1: first dentry
    3040             :  * @dentry2: second dentry
                        *
                        * Calls __d_move(@dentry1, @dentry2, true) with rename_lock held for
                        * writing.  Both dentries are expected to be positive and not IS_ROOT;
                        * a violation only triggers a WARN_ON, the exchange is still attempted.
    3041             :  */
    3042    12974463 : void d_exchange(struct dentry *dentry1, struct dentry *dentry2)
    3043             : {
    3044    12974463 :         write_seqlock(&rename_lock);
    3045             : 
    3046    12974550 :         WARN_ON(!dentry1->d_inode);
    3047    12974550 :         WARN_ON(!dentry2->d_inode);
    3048    12974550 :         WARN_ON(IS_ROOT(dentry1));
    3049    12974550 :         WARN_ON(IS_ROOT(dentry2));
    3050             : 
    3051    12974550 :         __d_move(dentry1, dentry2, true);
    3052             : 
    3053    12974550 :         write_sequnlock(&rename_lock);
    3054    12974550 : }
    3055             : 
    3056             : /**
    3057             :  * d_ancestor - search for an ancestor
    3058             :  * @p1: ancestor dentry
    3059             :  * @p2: child dentry
    3060             :  *
    3061             :  * Returns the ancestor dentry of p2 which is a child of p1, if p1 is
    3062             :  * an ancestor of p2, else NULL.
                        *
                        * The returned dentry may be @p2 itself when @p2 is a direct child of
                        * @p1.  The walk follows d_parent upwards and stops at the first
                        * IS_ROOT dentry, so NULL is returned when @p2 is IS_ROOT.
                        *
                        * No lock is taken here.  The callers in this file either hold
                        * rename_lock for writing or run inside a read_seqbegin() /
                        * read_seqretry() loop on rename_lock under rcu_read_lock().
    3063             :  */
    3064    82487555 : struct dentry *d_ancestor(struct dentry *p1, struct dentry *p2)
    3065             : {
    3066   137002916 :         struct dentry *p;
    3067             : 
    3068 10372488975 :         for (p = p2; !IS_ROOT(p); p = p->d_parent) {
    3069 10188105897 :                 if (p->d_parent == p1)
    3070     3649432 :                         return p;
    3071             :         }
    3072             :         return NULL;
    3073             : }
    3074             : 
    3075             : /*
    3076             :  * This helper attempts to cope with remotely renamed directories
    3077             :  *
    3078             :  * It assumes that the caller is already holding
    3079             :  * dentry->d_parent->d_inode->i_mutex, and rename_lock
    3080             :  *
    3081             :  * Note: If ever the locking in lock_rename() changes, then please
    3082             :  * remember to update this too...
                        *
                        * @inode is not used in the body.  On success @alias is moved into
                        * @dentry's place with __d_move(alias, dentry, false).
                        *
                        * Returns 0 on success, or -ESTALE if either the superblock's
                        * s_vfs_rename_mutex or the shared lock on alias's parent inode could
                        * not be obtained without blocking; nothing is moved in that case.
                        * Every lock taken here is released before returning.
    3083             :  */
    3084           0 : static int __d_unalias(struct inode *inode,
    3085             :                 struct dentry *dentry, struct dentry *alias)
    3086             : {
                               /* m1/m2 record which locks were actually taken, for the unwind. */
    3087           0 :         struct mutex *m1 = NULL;
    3088           0 :         struct rw_semaphore *m2 = NULL;
    3089           0 :         int ret = -ESTALE;
    3090             : 
    3091             :         /* If alias and dentry share a parent, then no extra locks required */
    3092           0 :         if (alias->d_parent == dentry->d_parent)
    3093           0 :                 goto out_unalias;
    3094             : 
    3095             :         /* See lock_rename() */
                               /* Only trylocks are used: on contention, fail with -ESTALE. */
    3096           0 :         if (!mutex_trylock(&dentry->d_sb->s_vfs_rename_mutex))
    3097           0 :                 goto out_err;
    3098           0 :         m1 = &dentry->d_sb->s_vfs_rename_mutex;
    3099           0 :         if (!inode_trylock_shared(alias->d_parent->d_inode))
    3100           0 :                 goto out_err;
    3101           0 :         m2 = &alias->d_parent->d_inode->i_rwsem;
    3102           0 : out_unalias:
    3103           0 :         __d_move(alias, dentry, false);
    3104           0 :         ret = 0;
    3105           0 : out_err:
                               /* Shared-locked above, hence up_read(); release in reverse order. */
    3106           0 :         if (m2)
    3107           0 :                 up_read(m2);
    3108           0 :         if (m1)
    3109           0 :                 mutex_unlock(m1);
    3110           0 :         return ret;
    3111             : }
    3112             : 
    3113             : /**
    3114             :  * d_splice_alias - splice a disconnected dentry into the tree if one exists
    3115             :  * @inode:  the inode which may have a disconnected dentry
    3116             :  * @dentry: a negative dentry which we want to point to the inode.
    3117             :  *
    3118             :  * If inode is a directory and has an IS_ROOT alias, then d_move that in
    3119             :  * place of the given dentry and return it, else simply d_add the inode
    3120             :  * to the dentry and return NULL.
    3121             :  *
    3122             :  * If a non-IS_ROOT directory is found, the filesystem is corrupt, and
    3123             :  * we should error out: directories can't have multiple aliases.
    3124             :  *
    3125             :  * This is needed in the lookup routine of any filesystem that is exportable
    3126             :  * (via knfsd) so that we can build dcache paths to directories effectively.
    3127             :  *
    3128             :  * If a dentry was found and moved, then it is returned.  Otherwise NULL
    3129             :  * is returned.  This matches the expected return value of ->lookup.
    3130             :  *
    3131             :  * Cluster filesystems may call this function with a negative, hashed dentry.
    3132             :  * In that case, we know that the inode will be a regular file, and also this
    3133             :  * will only occur during atomic_open. So we need to check for the dentry
    3134             :  * being already hashed only in the final case.
                        *
                        * What the code below does, case by case:
                        *  - @inode is an error pointer: the error is returned via ERR_CAST().
                        *  - @inode is NULL, is not a directory, or is a directory for which
                        *    __d_find_any_alias() finds nothing: __d_add(@dentry, @inode) is
                        *    called and NULL is returned.
                        *  - a directory alias exists and is an ancestor of @dentry: a
                        *    rate-limited warning is logged and ERR_PTR(-ELOOP) is returned.
                        *  - a directory alias exists and is not IS_ROOT: __d_unalias() tries
                        *    to move it; its error, if any, is returned as an ERR_PTR.
                        *  - a directory alias exists and is IS_ROOT: it is moved with
                        *    __d_move() and returned.
                        * In the three alias cases iput(@inode) is called before returning.
                        *
                        * NOTE(review): two statements above do not match the code.  A
                        * non-IS_ROOT alias is handed to __d_unalias() rather than treated as
                        * an immediate error, and BUG_ON(!d_unhashed(dentry)) fires for any
                        * hashed @dentry, which contradicts the "negative, hashed dentry"
                        * paragraph.  Confirm and refresh the text.
    3135             :  */
    3136   197180040 : struct dentry *d_splice_alias(struct inode *inode, struct dentry *dentry)
    3137             : {
    3138   197180040 :         if (IS_ERR(inode))
    3139             :                 return ERR_CAST(inode);
    3140             : 
    3141   197117578 :         BUG_ON(!d_unhashed(dentry));
    3142             : 
    3143   197117578 :         if (!inode)
    3144   129999081 :                 goto out;
    3145             : 
    3146    67118497 :         security_d_instantiate(dentry, inode);
    3147    67118497 :         spin_lock(&inode->i_lock);
    3148    67133870 :         if (S_ISDIR(inode->i_mode)) {
    3149    23349776 :                 struct dentry *new = __d_find_any_alias(inode);
    3150    23353747 :                 if (unlikely(new)) {
    3151             :                         /* The reference to new ensures it remains an alias */
    3152     5043122 :                         spin_unlock(&inode->i_lock);
    3153     5042363 :                         write_seqlock(&rename_lock);
                                               /* Splicing an ancestor of dentry below dentry would loop. */
    3154     5047514 :                         if (unlikely(d_ancestor(new, dentry))) {
    3155           0 :                                 write_sequnlock(&rename_lock);
    3156           0 :                                 dput(new);
    3157           0 :                                 new = ERR_PTR(-ELOOP);
    3158           0 :                                 pr_warn_ratelimited(
    3159             :                                         "VFS: Lookup of '%s' in %s %s"
    3160             :                                         " would have caused loop\n",
    3161             :                                         dentry->d_name.name,
    3162             :                                         inode->i_sb->s_type->name,
    3163             :                                         inode->i_sb->s_id);
    3164     5047514 :                         } else if (!IS_ROOT(new)) {
                                                       /*
                                                        * The alias is attached elsewhere in the tree.
                                                        * Its current parent is pinned across the move
                                                        * and released once rename_lock is dropped.
                                                        */
    3165           0 :                                 struct dentry *old_parent = dget(new->d_parent);
    3166           0 :                                 int err = __d_unalias(inode, dentry, new);
    3167           0 :                                 write_sequnlock(&rename_lock);
    3168           0 :                                 if (err) {
    3169           0 :                                         dput(new);
    3170           0 :                                         new = ERR_PTR(err);
    3171             :                                 }
    3172           0 :                                 dput(old_parent);
    3173             :                         } else {
                                                       /* Disconnected (IS_ROOT) alias: move it into place. */
    3174     5047514 :                                 __d_move(new, dentry, false);
    3175     5047514 :                                 write_sequnlock(&rename_lock);
    3176             :                         }
                                               /*
                                                * inode is not attached to dentry on any of these
                                                * paths; presumably this drops the reference the
                                                * caller passed in - confirm.
                                                */
    3177     5047514 :                         iput(inode);
    3178     5047514 :                         return new;
    3179             :                 }
    3180             :         }
    3181    62094719 : out:
                               /*
                                * Reached with inode == NULL straight from the top, or with a
                                * non-NULL inode whose i_lock is still held from above;
                                * __d_add() is presumably responsible for dropping it - confirm.
                                */
    3182   192093800 :         __d_add(dentry, inode);
    3183   192093800 :         return NULL;
    3184             : }
    3185             : EXPORT_SYMBOL(d_splice_alias);
    3186             : 
    3187             : /*
    3188             :  * Test whether new_dentry is a subdirectory of old_dentry.
    3189             :  *
    3190             :  * Trivially implemented using the dcache structure
    3191             :  */
    3192             : 
    3193             : /**
    3194             :  * is_subdir - is new dentry a subdirectory of old_dentry
    3195             :  * @new_dentry: new dentry
    3196             :  * @old_dentry: old dentry
    3197             :  *
    3198             :  * Returns true if new_dentry is old_dentry itself or a descendant of
    3199             :  * old_dentry (at any depth).  Returns false otherwise.
    3200             :  * Caller must ensure that "new_dentry" is pinned before calling is_subdir()
                        *
                        * The ancestry walk is repeated until it completes without a
                        * concurrent write to rename_lock, so the result reflects a single
                        * consistent view of the tree.
    3201             :  */
    3202             :   
    3203    12927658 : bool is_subdir(struct dentry *new_dentry, struct dentry *old_dentry)
    3204             : {
    3205    12927658 :         bool result;
    3206    12927658 :         unsigned seq;
    3207             : 
                               /* A dentry counts as its own subdirectory. */
    3208    12927658 :         if (new_dentry == old_dentry)
    3209             :                 return true;
    3210             : 
    3211    12919373 :         do {
    3212             :                 /* for restarting inner loop in case of seq retry */
    3213    12919373 :                 seq = read_seqbegin(&rename_lock);
    3214             :                 /*
    3215             :                  * Need rcu_read_lock() to protect against the d_parent
    3216             :                  * trashing due to d_move
    3217             :                  */
    3218    12919907 :                 rcu_read_lock();
    3219    12920008 :                 if (d_ancestor(old_dentry, new_dentry))
    3220             :                         result = true;
    3221             :                 else
    3222      906384 :                         result = false;
    3223    12920008 :                 rcu_read_unlock();
    3224    12920035 :         } while (read_seqretry(&rename_lock, seq));
    3225             : 
    3226             :         return result;
    3227             : }
    3228             : EXPORT_SYMBOL(is_subdir);
    3229             : 
                       /*
                        * d_genocide_kill - per-dentry callback handed to d_walk() by d_genocide()
                        * @data:   the dentry the walk was started from
                        * @dentry: the dentry currently being visited
                        *
                        * The starting dentry itself is left untouched.  For any other dentry:
                        * if it is unhashed or negative, D_WALK_SKIP is returned; otherwise
                        * DCACHE_GENOCIDE is set and d_lockref.count is decremented, once only,
                        * since the flag guards against a second decrement.
                        *
                        * Returns D_WALK_SKIP or D_WALK_CONTINUE as described above.
                        */
    3230         767 : static enum d_walk_ret d_genocide_kill(void *data, struct dentry *dentry)
    3231             : {
    3232         767 :         struct dentry *root = data;
    3233         767 :         if (dentry != root) {
    3234          63 :                 if (d_unhashed(dentry) || !dentry->d_inode)
    3235             :                         return D_WALK_SKIP;
    3236             : 
    3237          63 :                 if (!(dentry->d_flags & DCACHE_GENOCIDE)) {
    3238          63 :                         dentry->d_flags |= DCACHE_GENOCIDE;
    3239          63 :                         dentry->d_lockref.count--;
    3240             :                 }
    3241             :         }
    3242             :         return D_WALK_CONTINUE;
    3243             : }
    3244             : 
                       /*
                        * d_genocide - apply d_genocide_kill() to the tree below @parent
                        * @parent: dentry the walk starts from
                        *
                        * @parent is passed to d_walk() both as the starting point and as the
                        * callback's data argument, which is how d_genocide_kill() recognises
                        * the starting dentry and leaves it alone.
                        */
    3245         704 : void d_genocide(struct dentry *parent)
    3246             : {
    3247         704 :         d_walk(parent, parent, d_genocide_kill);
    3248         704 : }
    3249             : 
    3250             : EXPORT_SYMBOL(d_genocide);
    3251             : 
                       /*
                        * d_tmpfile - name and instantiate the dentry of @file for @inode
                        * @file:  file whose f_path.dentry is to be set up
                        * @inode: inode to attach to that dentry
                        *
                        * Decrements @inode's link count, renames the dentry to "#<i_ino>"
                        * inside its inline name buffer and calls d_instantiate().
                        *
                        * BUGs unless the dentry's name is stored inline (d_name.name points at
                        * d_iname), it is on no inode's alias list, and d_unlinked() is true.
                        */
    3252     8759740 : void d_tmpfile(struct file *file, struct inode *inode)
    3253             : {
    3254     8759740 :         struct dentry *dentry = file->f_path.dentry;
    3255             : 
    3256     8759740 :         inode_dec_link_count(inode);
    3257    17943438 :         BUG_ON(dentry->d_name.name != dentry->d_iname ||
    3258             :                 !hlist_unhashed(&dentry->d_u.d_alias) ||
    3259             :                 !d_unlinked(dentry));
                               /* The name is rewritten with the parent's and the dentry's d_lock held. */
    3260     8971719 :         spin_lock(&dentry->d_parent->d_lock);
    3261     8967676 :         spin_lock_nested(&dentry->d_lock, DENTRY_D_LOCK_NESTED);
                               /*
                                * sprintf() returns the number of characters written, which becomes
                                * the new name length.  NOTE(review): the write is unbounded; it
                                * relies on d_iname being large enough for '#' plus a 64-bit
                                * decimal number - confirm against DNAME_INLINE_LEN.
                                */
    3262     8956690 :         dentry->d_name.len = sprintf(dentry->d_iname, "#%llu",
    3263     8956690 :                                 (unsigned long long)inode->i_ino);
    3264     8956690 :         spin_unlock(&dentry->d_lock);
    3265     8443588 :         spin_unlock(&dentry->d_parent->d_lock);
    3266     8670376 :         d_instantiate(dentry, inode);
    3267     8898533 : }
    3268             : EXPORT_SYMBOL(d_tmpfile);
    3269             : 
                       /*
                        * Value of the "dhash_entries=" boot parameter; stays 0 when the
                        * parameter is absent.  It is passed to alloc_large_system_hash() as
                        * the requested number of dentry hash entries.
                        */
    3270             : static __initdata unsigned long dhash_entries;
                       /*
                        * set_dhash_entries - __setup() handler for "dhash_entries="
                        * @str: text following the '=' on the command line
                        *
                        * Parses @str with simple_strtoul() using base 0.  The end pointer is
                        * written back into the local @str and never examined, so trailing
                        * characters are ignored.
                        *
                        * Returns 0 if @str is NULL, 1 otherwise.
                        */
    3271           0 : static int __init set_dhash_entries(char *str)
    3272             : {
    3273           0 :         if (!str)
    3274             :                 return 0;
    3275           0 :         dhash_entries = simple_strtoul(str, &str, 0);
    3276           0 :         return 1;
    3277             : }
    3278             : __setup("dhash_entries=", set_dhash_entries);
    3279             : 
                       /*
                        * dcache_init_early - allocate the dentry hash table during early boot
                        *
                        * Does nothing when hashdist is set; dcache_init() performs the
                        * allocation in that case.  Otherwise the table is allocated with
                        * HASH_EARLY | HASH_ZERO and d_hash_shift is set up.
                        */
    3280           0 : static void __init dcache_init_early(void)
    3281             : {
    3282             :         /* If hashes are distributed across NUMA nodes, defer
    3283             :          * hash allocation until vmalloc space is available.
    3284             :          */
    3285           0 :         if (hashdist)
    3286             :                 return;
    3287             : 
    3288           0 :         dentry_hashtable =
    3289           0 :                 alloc_large_system_hash("Dentry cache",
    3290             :                                         sizeof(struct hlist_bl_head),
    3291             :                                         dhash_entries,
    3292             :                                         13,
    3293             :                                         HASH_EARLY | HASH_ZERO,
    3294             :                                         &d_hash_shift,
    3295             :                                         NULL,
    3296             :                                         0,
    3297             :                                         0);
                               /*
                                * NOTE(review): presumably turns the table's size in bits into the
                                * right-shift applied to a 32-bit hash value - confirm against the
                                * hash lookup helper.
                                */
    3298           0 :         d_hash_shift = 32 - d_hash_shift;
    3299             : }
    3300             : 
                       /*
                        * dcache_init - create the dentry slab cache and, if still needed, the
                        * dentry hash table
                        *
                        * The slab cache is always created here.  The hash table is allocated
                        * here only when hashdist is set, i.e. when dcache_init_early()
                        * skipped it; this time without HASH_EARLY.
                        */
    3301           0 : static void __init dcache_init(void)
    3302             : {
    3303             :         /*
    3304             :          * A constructor could be added for stable state like the lists,
    3305             :          * but it is probably not worth it because of the cache nature
    3306             :          * of the dcache.
    3307             :          */
                               /*
                                * d_iname is the field named as the usercopy region.  SLAB_PANIC
                                * presumably makes a failed creation fatal, which would explain
                                * why the result is not checked.
                                */
    3308           0 :         dentry_cache = KMEM_CACHE_USERCOPY(dentry,
    3309             :                 SLAB_RECLAIM_ACCOUNT|SLAB_PANIC|SLAB_MEM_SPREAD|SLAB_ACCOUNT,
    3310             :                 d_iname);
    3311             : 
    3312             :         /* Hash may have been set up in dcache_init_early */
    3313           0 :         if (!hashdist)
    3314             :                 return;
    3315             : 
    3316           0 :         dentry_hashtable =
    3317           0 :                 alloc_large_system_hash("Dentry cache",
    3318             :                                         sizeof(struct hlist_bl_head),
    3319             :                                         dhash_entries,
    3320             :                                         13,
    3321             :                                         HASH_ZERO,
    3322             :                                         &d_hash_shift,
    3323             :                                         NULL,
    3324             :                                         0,
    3325             :                                         0);
                               /* Same conversion as at the end of dcache_init_early(). */
    3326           0 :         d_hash_shift = 32 - d_hash_shift;
    3327             : }
    3328             : 
    3329             : /*
                        * SLAB cache for __getname() consumers.  Created in vfs_caches_init()
                        * under the name "names_cache" with PATH_MAX-sized objects, and
                        * exported so that modules can use it.
                        */
    3330             : struct kmem_cache *names_cachep __read_mostly;
    3331             : EXPORT_SYMBOL(names_cachep);
    3332             : 
                       /*
                        * vfs_caches_init_early - early-boot part of VFS cache setup
                        *
                        * Initialises every bucket head of in_lookup_hashtable, then runs the
                        * early init steps for the dentry cache and the inode cache.
                        */
    3333           0 : void __init vfs_caches_init_early(void)
    3334             : {
    3335           0 :         int i;
    3336             : 
    3337           0 :         for (i = 0; i < ARRAY_SIZE(in_lookup_hashtable); i++)
    3338           0 :                 INIT_HLIST_BL_HEAD(&in_lookup_hashtable[i]);
    3339             : 
    3340           0 :         dcache_init_early();
    3341           0 :         inode_init_early();
    3342           0 : }
    3343             : 
                       /*
                        * vfs_caches_init - main VFS cache setup
                        *
                        * Creates the names_cache slab (PATH_MAX-sized objects, with a
                        * usercopy region given as offset 0 and size PATH_MAX) and then calls
                        * the init routines of the individual subsystems in the order listed
                        * below.
                        */
    3344           0 : void __init vfs_caches_init(void)
    3345             : {
                               /*
                                * SLAB_PANIC presumably makes a failed creation fatal, which would
                                * explain why names_cachep is not checked for NULL.
                                */
    3346           0 :         names_cachep = kmem_cache_create_usercopy("names_cache", PATH_MAX, 0,
    3347             :                         SLAB_HWCACHE_ALIGN|SLAB_PANIC, 0, PATH_MAX, NULL);
    3348             : 
    3349           0 :         dcache_init();
    3350           0 :         inode_init();
    3351           0 :         files_init();
    3352           0 :         files_maxfiles_init();
    3353           0 :         mnt_init();
    3354           0 :         bdev_cache_init();
    3355           0 :         chrdev_init();
    3356           0 : }

Generated by: LCOV version 1.14