LCOV - code coverage report
Current view: top level - fs - dcache.c (source / functions) Hit Total Coverage
Test: fstests of 6.5.0-rc3-achx @ Mon Jul 31 20:08:12 PDT 2023 Lines: 1186 1448 81.9 %
Date: 2023-07-31 20:08:12 Functions: 96 111 86.5 %

          Line data    Source code
       1             : // SPDX-License-Identifier: GPL-2.0-only
       2             : /*
       3             :  * fs/dcache.c
       4             :  *
       5             :  * Complete reimplementation
       6             :  * (C) 1997 Thomas Schoebel-Theuer,
       7             :  * with heavy changes by Linus Torvalds
       8             :  */
       9             : 
      10             : /*
      11             :  * Notes on the allocation strategy:
      12             :  *
      13             :  * The dcache is a master of the icache - whenever a dcache entry
      14             :  * exists, the inode will always exist. "iput()" is done either when
      15             :  * the dcache entry is deleted or garbage collected.
      16             :  */
      17             : 
      18             : #include <linux/ratelimit.h>
      19             : #include <linux/string.h>
      20             : #include <linux/mm.h>
      21             : #include <linux/fs.h>
      22             : #include <linux/fscrypt.h>
      23             : #include <linux/fsnotify.h>
      24             : #include <linux/slab.h>
      25             : #include <linux/init.h>
      26             : #include <linux/hash.h>
      27             : #include <linux/cache.h>
      28             : #include <linux/export.h>
      29             : #include <linux/security.h>
      30             : #include <linux/seqlock.h>
      31             : #include <linux/memblock.h>
      32             : #include <linux/bit_spinlock.h>
      33             : #include <linux/rculist_bl.h>
      34             : #include <linux/list_lru.h>
      35             : #include "internal.h"
      36             : #include "mount.h"
      37             : 
      38             : /*
      39             :  * Usage:
      40             :  * dcache->d_inode->i_lock protects:
      41             :  *   - i_dentry, d_u.d_alias, d_inode of aliases
      42             :  * dcache_hash_bucket lock protects:
      43             :  *   - the dcache hash table
      44             :  * s_roots bl list spinlock protects:
      45             :  *   - the s_roots list (see __d_drop)
      46             :  * dentry->d_sb->s_dentry_lru_lock protects:
      47             :  *   - the dcache lru lists and counters
      48             :  * d_lock protects:
      49             :  *   - d_flags
      50             :  *   - d_name
      51             :  *   - d_lru
      52             :  *   - d_count
      53             :  *   - d_unhashed()
      54             :  *   - d_parent and d_subdirs
      55             :  *   - children's d_child and d_parent
      56             :  *   - d_u.d_alias, d_inode
      57             :  *
      58             :  * Ordering:
      59             :  * dentry->d_inode->i_lock
      60             :  *   dentry->d_lock
      61             :  *     dentry->d_sb->s_dentry_lru_lock
      62             :  *     dcache_hash_bucket lock
      63             :  *     s_roots lock
      64             :  *
      65             :  * If there is an ancestor relationship:
      66             :  * dentry->d_parent->...->d_parent->d_lock
      67             :  *   ...
      68             :  *     dentry->d_parent->d_lock
      69             :  *       dentry->d_lock
      70             :  *
      71             :  * If no ancestor relationship:
      72             :  * arbitrary, since it's serialized on rename_lock
      73             :  */
      74             : int sysctl_vfs_cache_pressure __read_mostly = 100; /* read-mostly tunable, initialised to 100 */
      75             : EXPORT_SYMBOL_GPL(sysctl_vfs_cache_pressure);
      76             : 
      77             : __cacheline_aligned_in_smp DEFINE_SEQLOCK(rename_lock); /* seqlock, cache-line aligned on SMP builds */
      78             : 
      79             : EXPORT_SYMBOL(rename_lock);
      80             : 
      81             : static struct kmem_cache *dentry_cache __read_mostly; /* slab cache that dentries are freed back to */
      82             : 
                       /* Constant qstr names for the empty string, slash and dot-dot, each with its length. */
      83             : const struct qstr empty_name = QSTR_INIT("", 0);
      84             : EXPORT_SYMBOL(empty_name);
      85             : const struct qstr slash_name = QSTR_INIT("/", 1);
      86             : EXPORT_SYMBOL(slash_name);
      87             : const struct qstr dotdot_name = QSTR_INIT("..", 2);
      88             : EXPORT_SYMBOL(dotdot_name);
      89             : 
      90             : /*
      91             :  * This is the single most critical data structure when it comes
      92             :  * to the dcache: the hashtable for lookups. Somebody should try
      93             :  * to make this good - I've just made it work.
      94             :  *
      95             :  * This hash-function tries to avoid losing too many bits of hash
      96             :  * information, yet avoid using a prime hash-size or similar.
      97             :  */
      98             : 
      99             : static unsigned int d_hash_shift __read_mostly; /* right-shift applied to a hash before indexing the table */
     100             : 
     101             : static struct hlist_bl_head *dentry_hashtable __read_mostly; /* base of the bucket array */
     102             : 
     103 68363260058 : static inline struct hlist_bl_head *d_hash(unsigned int hash)
     104             : {
                               /*
                                * Return the bucket for @hash: the hash is shifted right by
                                * d_hash_shift and the result indexes dentry_hashtable.
                                */
     105 68363260058 :         return dentry_hashtable + (hash >> d_hash_shift);
     106             : }
     107             : 
     108             : #define IN_LOOKUP_SHIFT 10
     109             : static struct hlist_bl_head in_lookup_hashtable[1 << IN_LOOKUP_SHIFT]; /* 1 << IN_LOOKUP_SHIFT buckets */
     110             : 
     111             : static inline struct hlist_bl_head *in_lookup_hash(const struct dentry *parent,
     112             :                                         unsigned int hash)
     113             : {
                               /*
                                * Pick a bucket of in_lookup_hashtable for (@parent, @hash):
                                * the parent pointer, divided by L1_CACHE_BYTES, is added to
                                * the name hash and hash_32() reduces the sum to
                                * IN_LOOKUP_SHIFT bits.
                                */
     114  1837467825 :         hash += (unsigned long) parent / L1_CACHE_BYTES;
     115  1837467825 :         return in_lookup_hashtable + hash_32(hash, IN_LOOKUP_SHIFT);
     116             : }
     117             : 
     118             : struct dentry_stat_t { /* six longs; nr_dentry, nr_unused and nr_negative are filled in by proc_nr_dentry() */
     119             :         long nr_dentry;
     120             :         long nr_unused;
     121             :         long age_limit;         /* age in seconds */
     122             :         long want_pages;        /* pages requested by system */
     123             :         long nr_negative;       /* # of unused negative dentries */
     124             :         long dummy;             /* Reserved for future use */
     125             : };
     126             : 
                       /* Per-CPU counters; the get_nr_dentry*() helpers sum them over all possible CPUs. */
     127             : static DEFINE_PER_CPU(long, nr_dentry);
     128             : static DEFINE_PER_CPU(long, nr_dentry_unused);
     129             : static DEFINE_PER_CPU(long, nr_dentry_negative);
     130             : 
     131             : #if defined(CONFIG_SYSCTL) && defined(CONFIG_PROC_FS)
     132             : /* Statistics gathering. */
     133             : static struct dentry_stat_t dentry_stat = { /* backing store for the dentry-state sysctl entry */
     134             :         .age_limit = 45, /* seconds, per the field comment in struct dentry_stat_t */
     135             : };
     136             : 
     137             : /*
     138             :  * Here we resort to our own counters instead of using generic per-cpu counters
     139             :  * for consistency with what the vfs inode code does. We are expected to harvest
     140             :  * better code and performance by having our own specialized counters.
     141             :  *
     142             :  * Please note that the loop is done over all possible CPUs, not over all online
     143             :  * CPUs. The reason for this is that we don't want to play games with CPUs going
     144             :  * on and off. If one of them goes off, we will just keep their counters.
     145             :  *
     146             :  * glommer: See cffbc8a for details, and if you ever intend to change this,
     147             :  * please update all vfs counters to match.
     148             :  */
     149         903 : static long get_nr_dentry(void)
     150             : {
     151         903 :         int i;
     152         903 :         long sum = 0;
                               /* Total the per-CPU nr_dentry counters over every possible CPU. */
     153        4515 :         for_each_possible_cpu(i)
     154        3612 :                 sum += per_cpu(nr_dentry, i);
                               /* A negative total is reported as 0. */
     155         903 :         return sum < 0 ? 0 : sum;
     156             : }
     157             : 
     158         903 : static long get_nr_dentry_unused(void)
     159             : {
     160         903 :         int i;
     161         903 :         long sum = 0;
                               /* Total the per-CPU nr_dentry_unused counters over every possible CPU. */
     162        4515 :         for_each_possible_cpu(i)
     163        3612 :                 sum += per_cpu(nr_dentry_unused, i);
                               /* A negative total is reported as 0. */
     164         903 :         return sum < 0 ? 0 : sum;
     165             : }
     166             : 
     167         903 : static long get_nr_dentry_negative(void)
     168             : {
     169         903 :         int i;
     170         903 :         long sum = 0;
     171             : 
                               /* Total the per-CPU nr_dentry_negative counters over every possible CPU. */
     172        4515 :         for_each_possible_cpu(i)
     173        3612 :                 sum += per_cpu(nr_dentry_negative, i);
                               /* A negative total is reported as 0. */
     174         903 :         return sum < 0 ? 0 : sum;
     175             : }
     176             : 
     177         903 : static int proc_nr_dentry(struct ctl_table *table, int write, void *buffer,
     178             :                           size_t *lenp, loff_t *ppos)
     179             : {
                               /*
                                * sysctl handler: refresh the three computed fields of
                                * dentry_stat from the per-CPU counters, then pass the request
                                * on to proc_doulongvec_minmax() and return its result.
                                */
     180         903 :         dentry_stat.nr_dentry = get_nr_dentry();
     181         903 :         dentry_stat.nr_unused = get_nr_dentry_unused();
     182         903 :         dentry_stat.nr_negative = get_nr_dentry_negative();
     183         903 :         return proc_doulongvec_minmax(table, write, buffer, lenp, ppos);
     184             : }
     185             : 
     186             : static struct ctl_table fs_dcache_sysctls[] = { /* one entry plus an empty terminator */
     187             :         {
     188             :                 .procname       = "dentry-state",
     189             :                 .data           = &dentry_stat,
     190             :                 .maxlen         = 6*sizeof(long), /* the six long fields of struct dentry_stat_t */
     191             :                 .mode           = 0444, /* read-only for everyone */
     192             :                 .proc_handler   = proc_nr_dentry, /* refreshes dentry_stat before it is read */
     193             :         },
     194             :         { }
     195             : };
     196             : 
     197           0 : static int __init init_fs_dcache_sysctls(void)
     198             : {
                               /* Register fs_dcache_sysctls under the "fs" sysctl directory; always returns 0. */
     199           0 :         register_sysctl_init("fs", fs_dcache_sysctls);
     200           0 :         return 0;
     201             : }
     202             : fs_initcall(init_fs_dcache_sysctls);
     203             : #endif
     204             : 
     205             : /*
     206             :  * Compare 2 name strings, return 0 if they match, otherwise non-zero.
     207             :  * The strings are both count bytes long, and count is non-zero.
     208             :  */
     209             : #ifdef CONFIG_DCACHE_WORD_ACCESS
     210             : 
     211             : #include <asm/word-at-a-time.h>
     212             : /*
     213             :  * NOTE! 'cs' comes from a dentry, so it has an
     214             :  * aligned allocation for this particular component. We don't
     215             :  * strictly need the load_unaligned_zeropad() safety, but it
     216             :  * doesn't hurt either.
     217             :  *
     218             :  * In contrast, 'ct' and 'tcount' can be from a pathname, and do
     219             :  * need the careful unaligned handling.
     220             :  */
     221 64180414322 : static inline int dentry_string_cmp(const unsigned char *cs, const unsigned char *ct, unsigned tcount)
     222             : {
     223 65721865981 :         unsigned long a,b,mask;
     224             : 
                               /*
                                * Compare one unsigned long at a time.  Both words are loaded
                                * before tcount is tested, so that when fewer than a full word
                                * remains the already-loaded a and b can be compared under a
                                * byte mask after the loop.
                                */
     225 65721865981 :         for (;;) {
     226 65721865981 :                 a = read_word_at_a_time(cs);
     227 65721865981 :                 b = load_unaligned_zeropad(ct);
     228 65756598733 :                 if (tcount < sizeof(unsigned long))
     229             :                         break;
     230  2030610529 :                 if (unlikely(a != b))
     231             :                         return 1;
     232  2030610379 :                 cs += sizeof(unsigned long);
     233  2030610379 :                 ct += sizeof(unsigned long);
     234  2030610379 :                 tcount -= sizeof(unsigned long);
                                       /* Length was an exact multiple of the word size: match. */
     235  2030610379 :                 if (!tcount)
     236             :                         return 0;
     237             :         }
                               /* Tail: only the bytes selected by the mask for tcount take part. */
     238 63725988204 :         mask = bytemask_from_count(tcount);
     239 63725988204 :         return unlikely(!!((a ^ b) & mask));
     240             : }
     241             : 
     242             : #else
     243             : 
     244             : static inline int dentry_string_cmp(const unsigned char *cs, const unsigned char *ct, unsigned tcount)
     245             : {
                               /*
                                * Byte-at-a-time variant: returns 1 at the first differing
                                * byte, 0 once tcount bytes have compared equal.  The do/while
                                * form examines a byte before testing tcount, so tcount must
                                * be non-zero on entry.
                                */
     246             :         do {
     247             :                 if (*cs != *ct)
     248             :                         return 1;
     249             :                 cs++;
     250             :                 ct++;
     251             :                 tcount--;
     252             :         } while (tcount);
     253             :         return 0;
     254             : }
     255             : 
     256             : #endif
     257             : 
     258             : static inline int dentry_cmp(const struct dentry *dentry, const unsigned char *ct, unsigned tcount)
     259             : {
     260             :         /*
     261             :          * Be careful about RCU walk racing with rename:
     262             :          * use 'READ_ONCE' to fetch the name pointer.
     263             :          *
     264             :          * NOTE! Even if a rename will mean that the length
     265             :          * was not loaded atomically, we don't care. The
     266             :          * RCU walk will check the sequence count eventually,
     267             :          * and catch it. And we won't overrun the buffer,
     268             :          * because we're reading the name pointer atomically,
     269             :          * and a dentry name is guaranteed to be properly
     270             :          * terminated with a NUL byte.
     271             :          *
     272             :          * End result: even if 'len' is wrong, we'll exit
     273             :          * early because the data cannot match (there can
     274             :          * be no NUL in the ct/tcount data)
     275             :          */
     276 64217486339 :         const unsigned char *cs = READ_ONCE(dentry->d_name.name);
     277             : 
                               /* Result of dentry_string_cmp(): 0 when the name matches ct/tcount, non-zero otherwise. */
     278 64217486339 :         return dentry_string_cmp(cs, ct, tcount);
     279             : }
     280             : 
     281             : struct external_name { /* header placed in front of a name that is not stored in d_iname */
     282             :         union {
     283             :                 atomic_t count; /* reference count, see atomic_inc()/atomic_dec_and_test() users */
     284             :                 struct rcu_head head; /* used by kfree_rcu() in release_dentry_name_snapshot() */
     285             :         } u;
     286             :         unsigned char name[]; /* the bytes that dentry->d_name.name points at */
     287             : };
     288             : 
     289             : static inline struct external_name *external_name(struct dentry *dentry)
     290             : {
                               /* Step back from dentry->d_name.name to the struct external_name that contains it. */
     291   441850613 :         return container_of(dentry->d_name.name, struct external_name, name[0]);
     292             : }
     293             : 
     294  1228118942 : static void __d_free(struct rcu_head *head)
     295             : {
                               /*
                                * Free the dentry that embeds @head as d_u.d_rcu back to
                                * dentry_cache.  dentry_free() queues this via call_rcu(), or
                                * calls it directly for DCACHE_NORCU dentries.
                                */
     296  1262201116 :         struct dentry *dentry = container_of(head, struct dentry, d_u.d_rcu);
     297             : 
     298  1228118942 :         kmem_cache_free(dentry_cache, dentry); 
     299    34087215 : }
     300             : 
     301   440728586 : static void __d_free_external(struct rcu_head *head)
     302             : {
                               /*
                                * RCU callback queued by dentry_free(): kfree() the external
                                * name first, then return the dentry itself to dentry_cache.
                                */
     303   440728586 :         struct dentry *dentry = container_of(head, struct dentry, d_u.d_rcu);
     304   440728586 :         kfree(external_name(dentry));
     305   440673693 :         kmem_cache_free(dentry_cache, dentry);
     306   441405414 : }
     307             : 
     308             : static inline int dname_external(const struct dentry *dentry)
     309             : {
                               /* Non-zero when the name pointer is not the dentry's own d_iname buffer. */
     310  1872633554 :         return dentry->d_name.name != dentry->d_iname;
     311             : }
     312             : 
     313    51436605 : void take_dentry_name_snapshot(struct name_snapshot *name, struct dentry *dentry)
     314             : {
                               /*
                                * Copy @dentry's name into @name while holding d_lock.  Undo
                                * with release_dentry_name_snapshot().
                                */
     315    51436605 :         spin_lock(&dentry->d_lock);
     316    51437214 :         name->name = dentry->d_name;
     317    51437214 :         if (unlikely(dname_external(dentry))) {
                                       /* External name: share it by taking a reference. */
     318     1123289 :                 atomic_inc(&external_name(dentry)->u.count);
     319             :         } else {
                                       /*
                                        * Inline name: copy len + 1 bytes into the snapshot's
                                        * own buffer and point the snapshot at that copy.
                                        */
     320   100627850 :                 memcpy(name->inline_name, dentry->d_iname,
     321             :                        dentry->d_name.len + 1);
     322    50313925 :                 name->name.name = name->inline_name;
     323             :         }
     324    51437379 :         spin_unlock(&dentry->d_lock);
     325    51436995 : }
     326             : EXPORT_SYMBOL(take_dentry_name_snapshot);
     327             : 
     328    51437840 : void release_dentry_name_snapshot(struct name_snapshot *name)
     329             : {
                               /*
                                * Nothing to do when the snapshot points at its own inline
                                * buffer.  Otherwise drop the reference on the external name
                                * and free it through kfree_rcu() once the count reaches zero.
                                */
     330    51437840 :         if (unlikely(name->name.name != name->inline_name)) {
     331     1123646 :                 struct external_name *p;
     332     1123646 :                 p = container_of(name->name.name, struct external_name, name[0]);
     333     1123646 :                 if (unlikely(atomic_dec_and_test(&p->u.count)))
     334     1122021 :                         kfree_rcu(p, u.head);
     335             :         }
     336    51437832 : }
     337             : EXPORT_SYMBOL(release_dentry_name_snapshot);
     338             : 
     339             : static inline void __d_set_inode_and_type(struct dentry *dentry,
     340             :                                           struct inode *inode,
     341             :                                           unsigned type_flags)
     342             : {
     343   852999737 :         unsigned flags;
     344             : 
                               /*
                                * Store @inode first, then replace the DCACHE_ENTRY_TYPE and
                                * DCACHE_FALLTHRU bits of d_flags with @type_flags.  The new
                                * flags are written with smp_store_release(), i.e. after the
                                * d_inode store.
                                */
     345   852999737 :         dentry->d_inode = inode;
     346   852999737 :         flags = READ_ONCE(dentry->d_flags);
     347   852999737 :         flags &= ~(DCACHE_ENTRY_TYPE | DCACHE_FALLTHRU);
     348   852999737 :         flags |= type_flags;
     349  1705977206 :         smp_store_release(&dentry->d_flags, flags);
     350             : }
     351             : 
     352             : static inline void __d_clear_type_and_inode(struct dentry *dentry)
     353             : {
                               /*
                                * Turn @dentry negative: clear the DCACHE_ENTRY_TYPE and
                                * DCACHE_FALLTHRU bits of d_flags, then set d_inode to NULL.
                                */
     354   849797018 :         unsigned flags = READ_ONCE(dentry->d_flags);
     355             : 
     356   849797018 :         flags &= ~(DCACHE_ENTRY_TYPE | DCACHE_FALLTHRU);
     357   849797018 :         WRITE_ONCE(dentry->d_flags, flags);
     358   849797018 :         dentry->d_inode = NULL;
                               /*
                                * nr_dentry_negative only tracks dentries on the per-superblock
                                * LRU.  A dentry on a shrink list also has DCACHE_LRU_LIST set,
                                * but d_shrink_del() never decrements the negative counter, so
                                * counting it here would leak.  Count only when d_lru is on the
                                * real LRU, i.e. LRU_LIST set and SHRINK_LIST clear.
                                */
     359   849797018 :         if ((flags & (DCACHE_LRU_LIST | DCACHE_SHRINK_LIST)) == DCACHE_LRU_LIST)
     360    59100623 :                 this_cpu_inc(nr_dentry_negative);
     361             : }
     362             : 
     363  1711861996 : static void dentry_free(struct dentry *dentry)
     364             : {
                               /* Warn if the dentry is still linked through d_u.d_alias. */
     365  1711861996 :         WARN_ON(!hlist_unhashed(&dentry->d_u.d_alias));
     366  1711861996 :         if (unlikely(dname_external(dentry))) {
     367   443531131 :                 struct external_name *p = external_name(dentry);
                                       /*
                                        * Last reference to the external name: free name and
                                        * dentry together from the RCU callback.  Otherwise
                                        * fall through and free only the dentry.
                                        */
     368   443531131 :                 if (likely(atomic_dec_and_test(&p->u.count))) {
     369   443402386 :                         call_rcu(&dentry->d_u.d_rcu, __d_free_external);
     370   443402386 :                         return;
     371             :                 }
     372             :         }
     373             :         /* if dentry was never visible to RCU, immediate free is OK */
     374  1269379869 :         if (dentry->d_flags & DCACHE_NORCU)
     375    34082174 :                 __d_free(&dentry->d_u.d_rcu);
     376             :         else
     377  1235297695 :                 call_rcu(&dentry->d_u.d_rcu, __d_free);
     378             : }
     379             : 
     380             : /*
     381             :  * Release the dentry's inode, using the filesystem
     382             :  * d_iput() operation if defined.
     383             :  */
     384   850904582 : static void dentry_unlink_inode(struct dentry * dentry)
     385             :         __releases(dentry->d_lock)
     386             :         __releases(dentry->d_inode->i_lock)
     387             : {
                               /* Remember the inode: d_inode is cleared below but the inode is still needed. */
     388   850904582 :         struct inode *inode = dentry->d_inode;
     389             : 
                               /* Detach inode and alias link inside a d_seq write section. */
     390   850904582 :         raw_write_seqcount_begin(&dentry->d_seq);
     391   849797018 :         __d_clear_type_and_inode(dentry);
     392   849701961 :         hlist_del_init(&dentry->d_u.d_alias);
     393   849701961 :         raw_write_seqcount_end(&dentry->d_seq);
                               /* Both locks named in the __releases() annotations are dropped here. */
     394   848922607 :         spin_unlock(&dentry->d_lock);
     395   855171518 :         spin_unlock(&inode->i_lock);
                               /* No links left on the inode: notify fsnotify. */
     396   855432787 :         if (!inode->i_nlink)
     397   515118737 :                 fsnotify_inoderemove(inode);
                               /* Use the filesystem's d_iput() when provided, plain iput() otherwise. */
     398   853856575 :         if (dentry->d_op && dentry->d_op->d_iput)
     399      759973 :                 dentry->d_op->d_iput(dentry, inode);
     400             :         else
     401   853096602 :                 iput(inode);
     402   852157809 : }
     403             : 
     404             : /*
     405             :  * The DCACHE_LRU_LIST bit is set whenever the 'd_lru' entry
     406             :  * is in use - which includes both the "real" per-superblock
     407             :  * LRU list _and_ the DCACHE_SHRINK_LIST use.
     408             :  *
     409             :  * The DCACHE_SHRINK_LIST bit is set whenever the dentry is
     410             :  * on the shrink list (ie not on the superblock LRU list).
     411             :  *
     412             :  * The per-cpu "nr_dentry_unused" counters are updated with
     413             :  * the DCACHE_LRU_LIST bit.
     414             :  *
     415             :  * The per-cpu "nr_dentry_negative" counters are only updated
     416             :  * when deleted from or added to the per-superblock LRU list, not
     417             :  * from/to the shrink list. That is to avoid an unneeded dec/inc
     418             :  * pair when moving from LRU to shrink list in select_collect().
     419             :  *
     420             :  * These helper functions make sure we always follow the
     421             :  * rules. d_lock must be held by the caller.
     422             :  */
     423             : #define D_FLAG_VERIFY(dentry,x) WARN_ON_ONCE(((dentry)->d_flags & (DCACHE_LRU_LIST | DCACHE_SHRINK_LIST)) != (x))
     424   180491633 : static void d_lru_add(struct dentry *dentry)
     425             : {
                               /*
                                * Put @dentry on its superblock's LRU.  D_FLAG_VERIFY warns
                                * once unless the LRU_LIST/SHRINK_LIST bits equal the expected
                                * value; here neither bit may be set on entry.
                                */
     426   180491633 :         D_FLAG_VERIFY(dentry, 0);
     427   180491633 :         dentry->d_flags |= DCACHE_LRU_LIST;
     428   180491633 :         this_cpu_inc(nr_dentry_unused);
                               /* Negative dentries are also counted in nr_dentry_negative. */
     429   180338938 :         if (d_is_negative(dentry))
     430    41175775 :                 this_cpu_inc(nr_dentry_negative);
     431   180337988 :         WARN_ON_ONCE(!list_lru_add(&dentry->d_sb->s_dentry_lru, &dentry->d_lru));
     432   181339278 : }
     433             : 
     434   141132248 : static void d_lru_del(struct dentry *dentry)
     435             : {
                               /*
                                * Take @dentry off its superblock's LRU: expects LRU_LIST set
                                * and SHRINK_LIST clear, and undoes the counter updates made
                                * by d_lru_add().
                                */
     436   141132248 :         D_FLAG_VERIFY(dentry, DCACHE_LRU_LIST);
     437   141132248 :         dentry->d_flags &= ~DCACHE_LRU_LIST;
     438   141132248 :         this_cpu_dec(nr_dentry_unused);
     439   141132088 :         if (d_is_negative(dentry))
     440    71834706 :                 this_cpu_dec(nr_dentry_negative);
     441   141132070 :         WARN_ON_ONCE(!list_lru_del(&dentry->d_sb->s_dentry_lru, &dentry->d_lru));
     442   141132946 : }
     443             : 
     444   189305071 : static void d_shrink_del(struct dentry *dentry)
     445             : {
                               /*
                                * Remove @dentry from a shrink list: expects both SHRINK_LIST
                                * and LRU_LIST set, unlinks d_lru and clears both bits.  Only
                                * nr_dentry_unused is adjusted; nr_dentry_negative is not.
                                */
     446   189305071 :         D_FLAG_VERIFY(dentry, DCACHE_SHRINK_LIST | DCACHE_LRU_LIST);
     447   189305071 :         list_del_init(&dentry->d_lru);
     448   189303914 :         dentry->d_flags &= ~(DCACHE_SHRINK_LIST | DCACHE_LRU_LIST);
     449   189303914 :         this_cpu_dec(nr_dentry_unused);
     450   189303924 : }
     451             : 
     452   150210824 : static void d_shrink_add(struct dentry *dentry, struct list_head *list)
     453             : {
                               /*
                                * Put @dentry, which must be on neither list, at the head of
                                * the shrink list @list.  Sets both SHRINK_LIST and LRU_LIST
                                * and counts the dentry as unused.
                                */
     454   150210824 :         D_FLAG_VERIFY(dentry, 0);
     455   150210824 :         list_add(&dentry->d_lru, list);
     456   150210783 :         dentry->d_flags |= DCACHE_SHRINK_LIST | DCACHE_LRU_LIST;
     457   150210783 :         this_cpu_inc(nr_dentry_unused);
     458   150210806 : }
     459             : 
     460             : /*
     461             :  * These can only be called under the global LRU lock, ie during the
     462             :  * callback for freeing the LRU list. "isolate" removes it from the
     463             :  * LRU lists entirely, while shrink_move moves it to the indicated
     464             :  * private list.
     465             :  */
     466     1242551 : static void d_lru_isolate(struct list_lru_one *lru, struct dentry *dentry)
     467             : {
                               /*
                                * Same bookkeeping as d_lru_del(), but the entry is unlinked
                                * with list_lru_isolate() on the supplied @lru.
                                */
     468     1242551 :         D_FLAG_VERIFY(dentry, DCACHE_LRU_LIST);
     469     1242551 :         dentry->d_flags &= ~DCACHE_LRU_LIST;
     470     1242551 :         this_cpu_dec(nr_dentry_unused);
     471     1242551 :         if (d_is_negative(dentry))
     472           0 :                 this_cpu_dec(nr_dentry_negative);
     473     1242551 :         list_lru_isolate(lru, &dentry->d_lru);
     474     1242551 : }
     475             : 
     476    39095424 : static void d_lru_shrink_move(struct list_lru_one *lru, struct dentry *dentry,
     477             :                               struct list_head *list)
     478             : {
                               /*
                                * Move @dentry from the LRU to the shrink list @list.
                                * LRU_LIST stays set and SHRINK_LIST is added, so
                                * nr_dentry_unused is unchanged; a negative dentry stops being
                                * counted in nr_dentry_negative because it leaves the real LRU.
                                */
     479    39095424 :         D_FLAG_VERIFY(dentry, DCACHE_LRU_LIST);
     480    39095424 :         dentry->d_flags |= DCACHE_SHRINK_LIST;
     481    39095424 :         if (d_is_negative(dentry))
     482     3058156 :                 this_cpu_dec(nr_dentry_negative);
     483    39095424 :         list_lru_isolate_move(lru, &dentry->d_lru, list);
     484    39095424 : }
     485             : 
     486  1103199538 : static void ___d_drop(struct dentry *dentry)
     487             : {
     488  1103199538 :         struct hlist_bl_head *b;
     489             :         /*
     490             :          * Hashed dentries are normally on the dentry hashtable,
     491             :          * with the exception of those newly allocated by
     492             :          * d_obtain_root, which are always IS_ROOT:
     493             :          */
     494  1103199538 :         if (unlikely(IS_ROOT(dentry)))
     495           0 :                 b = &dentry->d_sb->s_roots;
     496             :         else
     497  1103199538 :                 b = d_hash(dentry->d_name.hash);
     498             : 
                               /* Unlink d_hash from the chosen list under that list's bit lock. */
     499  1103192567 :         hlist_bl_lock(b);
     500  1103195900 :         __hlist_bl_del(&dentry->d_hash);
     501  1103198545 :         hlist_bl_unlock(b);
     502  1103192881 : }
     503             : 
     504  1725671584 : void __d_drop(struct dentry *dentry)
     505             : {
                               /*
                                * No-op for an already unhashed dentry.  Otherwise unlink it
                                * with ___d_drop(), set d_hash.pprev to NULL so that it reads
                                * as unhashed, and invalidate d_seq.
                                */
     506  1725671584 :         if (!d_unhashed(dentry)) {
     507  1001276984 :                 ___d_drop(dentry);
     508  1001267942 :                 dentry->d_hash.pprev = NULL;
     509  1001267942 :                 write_seqcount_invalidate(&dentry->d_seq);
     510             :         }
     511  1725662241 : }
     512             : EXPORT_SYMBOL(__d_drop);
     513             : 
     514             : /**
     515             :  * d_drop - drop a dentry
     516             :  * @dentry: dentry to drop
     517             :  *
     518             :  * d_drop() unhashes the entry from the parent dentry hashes, so that it won't
     519             :  * be found through a VFS lookup any more. Note that this is different from
     520             :  * deleting the dentry - d_delete will try to mark the dentry negative if
     521             :  * possible, giving a successful _negative_ lookup, while d_drop will
     522             :  * just make the cache lookup fail.
     523             :  *
     524             :  * d_drop() is used mainly for stuff that wants to invalidate a dentry for some
     525             :  * reason (NFS timeouts or autofs deletes).
     526             :  *
     527             :  * __d_drop requires dentry->d_lock
     528             :  *
     529             :  * ___d_drop doesn't mark dentry as "unhashed"
     530             :  * (dentry->d_hash.pprev will be LIST_POISON2, not NULL).
     531             :  */
     532      193484 : void d_drop(struct dentry *dentry)
     533             : {
                               /* Locked wrapper: takes d_lock around __d_drop(). */
     534      193484 :         spin_lock(&dentry->d_lock);
     535      193487 :         __d_drop(dentry);
     536      193488 :         spin_unlock(&dentry->d_lock);
     537      193485 : }
     538             : EXPORT_SYMBOL(d_drop);
     539             : 
     540  1709733098 : static inline void dentry_unlist(struct dentry *dentry, struct dentry *parent)
     541             : {
     542  1709733098 :         struct dentry *next;
     543             :         /*
     544             :          * Inform d_walk() and shrink_dentry_list() that we are no longer
     545             :          * attached to the dentry tree
     546             :          */
     547  1709733098 :         dentry->d_flags |= DCACHE_DENTRY_KILLED;
                               /* Not linked on any d_child list: nothing more to do. */
     548  1709733098 :         if (unlikely(list_empty(&dentry->d_child)))
     549             :                 return;
     550  1061351283 :         __list_del_entry(&dentry->d_child);
     551             :         /*
     552             :          * Cursors can move around the list of children.  While we'd been
     553             :          * a normal list member, it didn't matter - ->d_child.next would've
     554             :          * been updated.  However, from now on it won't be and for the
     555             :          * things like d_walk() it might end up with a nasty surprise.
     556             :          * Normally d_walk() doesn't care about cursors moving around -
     557             :          * ->d_lock on parent prevents that and since a cursor has no children
     558             :          * of its own, we get through it without ever unlocking the parent.
     559             :          * There is one exception, though - if we ascend from a child that
     560             :          * gets killed as soon as we unlock it, the next sibling is found
     561             :          * using the value left in its ->d_child.next.  And if _that_
     562             :          * pointed to a cursor, and cursor got moved (e.g. by lseek())
     563             :          * before d_walk() regains parent->d_lock, we'll end up skipping
     564             :          * everything the cursor had been moved past.
     565             :          *
     566             :          * Solution: make sure that the pointer left behind in ->d_child.next
     567             :          * points to something that won't be moving around.  I.e. skip the
     568             :          * cursors.
     569             :          */
                               /* Advance the stale ->d_child.next until it hits a non-cursor or the list head. */
     570  1061351283 :         while (dentry->d_child.next != &parent->d_subdirs) {
     571   986919083 :                 next = list_entry(dentry->d_child.next, struct dentry, d_child);
     572   986919083 :                 if (likely(!(next->d_flags & DCACHE_DENTRY_CURSOR)))
     573             :                         break;
     574           0 :                 dentry->d_child.next = next->d_child.next;
     575             :         }
     576             : }
     577             : 
     578  1713011078 : static void __dentry_kill(struct dentry *dentry)
     579             : {
     580  1713011078 :         struct dentry *parent = NULL;
     581  1713011078 :         bool can_free = true;
     582  1713011078 :         if (!IS_ROOT(dentry))
     583  1067457223 :                 parent = dentry->d_parent;
     584             : 
     585             :         /*
     586             :          * The dentry is now unrecoverably dead to the world.
     587             :          */
     588  1713011078 :         lockref_mark_dead(&dentry->d_lockref);
     589             : 
     590             :         /*
     591             :          * inform the fs via d_prune that this dentry is about to be
     592             :          * unhashed and destroyed.
     593             :          */
     594  1711402161 :         if (dentry->d_flags & DCACHE_OP_PRUNE)
     595        5613 :                 dentry->d_op->d_prune(dentry);
     596             : 
     597  1711402161 :         if (dentry->d_flags & DCACHE_LRU_LIST) {
     598     1897093 :                 if (!(dentry->d_flags & DCACHE_SHRINK_LIST))
     599     1897087 :                         d_lru_del(dentry);
     600             :         }
     601             :         /* if it was on the hash then remove it */
     602  1711402227 :         __d_drop(dentry);
     603  1709510737 :         dentry_unlist(dentry, parent);
     604  1710043235 :         if (parent)
     605  1067440684 :                 spin_unlock(&parent->d_lock);
     606  1710063056 :         if (dentry->d_inode)
     607   782490824 :                 dentry_unlink_inode(dentry);
     608             :         else
     609   927572232 :                 spin_unlock(&dentry->d_lock);
     610  1709908418 :         this_cpu_dec(nr_dentry);
     611  1710248081 :         if (dentry->d_op && dentry->d_op->d_release)
     612     2764319 :                 dentry->d_op->d_release(dentry);
     613             : 
     614  1710247946 :         spin_lock(&dentry->d_lock);
     615  1713165954 :         if (dentry->d_flags & DCACHE_SHRINK_LIST) {
     616           0 :                 dentry->d_flags |= DCACHE_MAY_FREE;
     617           0 :                 can_free = false;
     618             :         }
     619  1713165954 :         spin_unlock(&dentry->d_lock);
     620  1713159331 :         if (likely(can_free))
     621  1713159331 :                 dentry_free(dentry);
     622  1711228615 :         cond_resched();
     623  1710809791 : }
     624             : 
     625     2657505 : static struct dentry *__lock_parent(struct dentry *dentry)
     626             : {
     627     2657505 :         struct dentry *parent;
     628     2657505 :         rcu_read_lock();
     629     2657521 :         spin_unlock(&dentry->d_lock);
     630     2664396 : again:
     631     2664396 :         parent = READ_ONCE(dentry->d_parent);
     632     2664396 :         spin_lock(&parent->d_lock);
     633             :         /*
     634             :          * We can't blindly lock dentry until we are sure
     635             :          * that we won't violate the locking order.
     636             :          * Any changes of dentry->d_parent must have
     637             :          * been done with parent->d_lock held, so
     638             :          * spin_lock() above is enough of a barrier
     639             :          * for checking if it's still our child.
     640             :          */
     641     2665346 :         if (unlikely(parent != dentry->d_parent)) {
     642           0 :                 spin_unlock(&parent->d_lock);
     643           0 :                 goto again;
     644             :         }
     645     2665346 :         rcu_read_unlock();
     646     2665346 :         if (parent != dentry)
     647     2665346 :                 spin_lock_nested(&dentry->d_lock, DENTRY_D_LOCK_NESTED);
     648             :         else
     649             :                 parent = NULL;
     650     2665345 :         return parent;
     651             : }
     652             : 
     653       12215 : static inline struct dentry *lock_parent(struct dentry *dentry)
     654             : {
     655       12215 :         struct dentry *parent = dentry->d_parent;
     656       12215 :         if (IS_ROOT(dentry))
     657             :                 return NULL;
     658          14 :         if (likely(spin_trylock(&parent->d_lock)))
     659             :                 return parent;
     660           0 :         return __lock_parent(dentry);
     661             : }
     662             : 
     663  3998154858 : static inline bool retain_dentry(struct dentry *dentry)
     664             : {
     665  3998154858 :         WARN_ON(d_in_lookup(dentry));
     666             : 
     667             :         /* Unreachable? Get rid of it */
     668  3998154858 :         if (unlikely(d_unhashed(dentry)))
     669             :                 return false;
     670             : 
     671  3273143204 :         if (unlikely(dentry->d_flags & DCACHE_DISCONNECTED))
     672             :                 return false;
     673             : 
     674  3273143204 :         if (unlikely(dentry->d_flags & DCACHE_OP_DELETE)) {
     675  1051491914 :                 if (dentry->d_op->d_delete(dentry))
     676             :                         return false;
     677             :         }
     678             : 
     679  2472246292 :         if (unlikely(dentry->d_flags & DCACHE_DONTCACHE))
     680             :                 return false;
     681             : 
     682             :         /* retain; LRU fodder */
     683  2472246265 :         dentry->d_lockref.count--;
     684  2472246265 :         if (unlikely(!(dentry->d_flags & DCACHE_LRU_LIST)))
     685   180677206 :                 d_lru_add(dentry);
     686  2291569059 :         else if (unlikely(!(dentry->d_flags & DCACHE_REFERENCED)))
     687   148363777 :                 dentry->d_flags |= DCACHE_REFERENCED;
     688             :         return true;
     689             : }
     690             : 
     691   588014911 : void d_mark_dontcache(struct inode *inode)
     692             : {
     693   588014911 :         struct dentry *de;
     694             : 
     695   588014911 :         spin_lock(&inode->i_lock);
     696  1176568785 :         hlist_for_each_entry(de, &inode->i_dentry, d_u.d_alias) {
     697        5924 :                 spin_lock(&de->d_lock);
     698          27 :                 de->d_flags |= DCACHE_DONTCACHE;
     699          27 :                 spin_unlock(&de->d_lock);
     700             :         }
     701   588278582 :         inode->i_state |= I_DONTCACHE;
     702   588278582 :         spin_unlock(&inode->i_lock);
     703   588304020 : }
     704             : EXPORT_SYMBOL(d_mark_dontcache);
     705             : 
     706             : /*
     707             :  * Finish off a dentry we've decided to kill.
     708             :  * dentry->d_lock must be held, returns with it unlocked.
     709             :  * Returns dentry requiring refcount drop, or NULL if we're done.
     710             :  */
     711  1523064133 : static struct dentry *dentry_kill(struct dentry *dentry)
     712             :         __releases(dentry->d_lock)
     713             : {
     714  1523064133 :         struct inode *inode = dentry->d_inode;
     715  1523064133 :         struct dentry *parent = NULL;
     716             : 
     717  2194361029 :         if (inode && unlikely(!spin_trylock(&inode->i_lock)))
     718       11916 :                 goto slow_positive;
     719             : 
     720  1525214027 :         if (!IS_ROOT(dentry)) {
     721   878638183 :                 parent = dentry->d_parent;
     722   878638183 :                 if (unlikely(!spin_trylock(&parent->d_lock))) {
     723     2660432 :                         parent = __lock_parent(dentry);
     724     2665345 :                         if (likely(inode || !dentry->d_inode))
     725     2665345 :                                 goto got_locks;
     726             :                         /* negative that became positive */
     727           0 :                         if (parent)
     728           0 :                                 spin_unlock(&parent->d_lock);
     729           0 :                         inode = dentry->d_inode;
     730           0 :                         goto slow_positive;
     731             :                 }
     732             :         }
     733  1522763621 :         __dentry_kill(dentry);
     734  1522763621 :         return parent;
     735             : 
     736       11916 : slow_positive:
     737       11916 :         spin_unlock(&dentry->d_lock);
     738       11862 :         spin_lock(&inode->i_lock);
     739       12215 :         spin_lock(&dentry->d_lock);
     740       12215 :         parent = lock_parent(dentry);
     741     2677560 : got_locks:
     742     2677560 :         if (unlikely(dentry->d_lockref.count != 1)) {
     743      364572 :                 dentry->d_lockref.count--;
     744     2312988 :         } else if (likely(!retain_dentry(dentry))) {
     745     2312988 :                 __dentry_kill(dentry);
     746     2312988 :                 return parent;
     747             :         }
     748             :         /* we are keeping it, after all */
     749      364572 :         if (inode)
     750           1 :                 spin_unlock(&inode->i_lock);
     751      364572 :         if (parent)
     752      364572 :                 spin_unlock(&parent->d_lock);
     753      364572 :         spin_unlock(&dentry->d_lock);
     754      364572 :         return NULL;
     755             : }
     756             : 
     757             : /*
     758             :  * Try to do a lockless dput(), and return whether that was successful.
     759             :  *
     760             :  * If unsuccessful, we return false, having already taken the dentry lock.
     761             :  *
     762             :  * The caller needs to hold the RCU read lock, so that the dentry is
     763             :  * guaranteed to stay around even if the refcount goes down to zero!
     764             :  */
     765 17942251515 : static inline bool fast_dput(struct dentry *dentry)
     766             : {
     767 17942251515 :         int ret;
     768 17942251515 :         unsigned int d_flags;
     769             : 
     770             :         /*
     771             :          * If we have a d_op->d_delete() operation, we sould not
     772             :          * let the dentry count go to zero, so use "put_or_lock".
     773             :          */
     774 17942251515 :         if (unlikely(dentry->d_flags & DCACHE_OP_DELETE))
     775  7883649198 :                 return lockref_put_or_lock(&dentry->d_lockref);
     776             : 
     777             :         /*
     778             :          * .. otherwise, we can try to just decrement the
     779             :          * lockref optimistically.
     780             :          */
     781 10058602317 :         ret = lockref_put_return(&dentry->d_lockref);
     782             : 
     783             :         /*
     784             :          * If the lockref_put_return() failed due to the lock being held
     785             :          * by somebody else, the fast path has failed. We will need to
     786             :          * get the lock, and then check the count again.
     787             :          */
     788 10058030919 :         if (unlikely(ret < 0)) {
     789 10058030919 :                 spin_lock(&dentry->d_lock);
     790 10068722199 :                 if (dentry->d_lockref.count > 1) {
     791  7135180198 :                         dentry->d_lockref.count--;
     792  7135180198 :                         spin_unlock(&dentry->d_lock);
     793  7135180198 :                         return true;
     794             :                 }
     795             :                 return false;
     796             :         }
     797             : 
     798             :         /*
     799             :          * If we weren't the last ref, we're done.
     800             :          */
     801           0 :         if (ret)
     802             :                 return true;
     803             : 
     804             :         /*
     805             :          * Careful, careful. The reference count went down
     806             :          * to zero, but we don't hold the dentry lock, so
     807             :          * somebody else could get it again, and do another
     808             :          * dput(), and we need to not race with that.
     809             :          *
     810             :          * However, there is a very special and common case
     811             :          * where we don't care, because there is nothing to
     812             :          * do: the dentry is still hashed, it does not have
     813             :          * a 'delete' op, and it's referenced and already on
     814             :          * the LRU list.
     815             :          *
     816             :          * NOTE! Since we aren't locked, these values are
     817             :          * not "stable". However, it is sufficient that at
     818             :          * some point after we dropped the reference the
     819             :          * dentry was hashed and the flags had the proper
     820             :          * value. Other dentry users may have re-gotten
     821             :          * a reference to the dentry and change that, but
     822             :          * our work is done - we can leave the dentry
     823             :          * around with a zero refcount.
     824             :          *
     825             :          * Nevertheless, there are two cases that we should kill
     826             :          * the dentry anyway.
     827             :          * 1. free disconnected dentries as soon as their refcount
     828             :          *    reached zero.
     829             :          * 2. free dentries if they should not be cached.
     830             :          */
     831           0 :         smp_rmb();
     832           0 :         d_flags = READ_ONCE(dentry->d_flags);
     833           0 :         d_flags &= DCACHE_REFERENCED | DCACHE_LRU_LIST |
     834             :                         DCACHE_DISCONNECTED | DCACHE_DONTCACHE;
     835             : 
     836             :         /* Nothing to do? Dropping the reference was all we needed? */
     837           0 :         if (d_flags == (DCACHE_REFERENCED | DCACHE_LRU_LIST) && !d_unhashed(dentry))
     838             :                 return true;
     839             : 
     840             :         /*
     841             :          * Not the fast normal case? Get the lock. We've already decremented
     842             :          * the refcount, but we'll need to re-check the situation after
     843             :          * getting the lock.
     844             :          */
     845           0 :         spin_lock(&dentry->d_lock);
     846             : 
     847             :         /*
     848             :          * Did somebody else grab a reference to it in the meantime, and
     849             :          * we're no longer the last user after all? Alternatively, somebody
     850             :          * else could have killed it and marked it dead. Either way, we
     851             :          * don't need to do anything else.
     852             :          */
     853           0 :         if (dentry->d_lockref.count) {
     854           0 :                 spin_unlock(&dentry->d_lock);
     855           0 :                 return true;
     856             :         }
     857             : 
     858             :         /*
     859             :          * Re-get the reference we optimistically dropped. We hold the
     860             :          * lock, and we just tested that it was zero, so we can just
     861             :          * set it to 1.
     862             :          */
     863           0 :         dentry->d_lockref.count = 1;
     864           0 :         return false;
     865             : }
     866             : 
     867             : 
     868             : /* 
     869             :  * This is dput
     870             :  *
     871             :  * This is complicated by the fact that we do not want to put
     872             :  * dentries that are no longer on any hash chain on the unused
     873             :  * list: we'd much rather just get rid of them immediately.
     874             :  *
     875             :  * However, that implies that we have to traverse the dentry
     876             :  * tree upwards to the parents which might _also_ now be
     877             :  * scheduled for deletion (it may have been only waiting for
     878             :  * its last child to go away).
     879             :  *
     880             :  * This tail recursion is done by hand as we don't want to depend
     881             :  * on the compiler to always get this right (gcc generally doesn't).
     882             :  * Real recursion would eat up our stack space.
     883             :  */
     884             : 
     885             : /*
     886             :  * dput - release a dentry
     887             :  * @dentry: dentry to release 
     888             :  *
     889             :  * Release a dentry. This will drop the usage count and if appropriate
     890             :  * call the dentry unlink method as well as removing it from the queues and
     891             :  * releasing its resources. If the parent dentries were scheduled for release
     892             :  * they too may now get deleted.
     893             :  */
     894 24201359608 : void dput(struct dentry *dentry)
     895             : {
     896 25723373237 :         while (dentry) {
     897 17928163897 :                 might_sleep();
     898             : 
     899 17936996575 :                 rcu_read_lock();
     900 17932586770 :                 if (likely(fast_dput(dentry))) {
     901 13953074321 :                         rcu_read_unlock();
     902 13953074321 :                         return;
     903             :                 }
     904             : 
     905             :                 /* Slow case: now with the dentry lock held */
     906  3994172921 :                 rcu_read_unlock();
     907             : 
     908  3994701111 :                 if (likely(retain_dentry(dentry))) {
     909  2471997177 :                         spin_unlock(&dentry->d_lock);
     910  2471997177 :                         return;
     911             :                 }
     912             : 
     913  1523209221 :                 dentry = dentry_kill(dentry);
     914             :         }
     915             : }
     916             : EXPORT_SYMBOL(dput);
     917             : 
     918   188966139 : static void __dput_to_list(struct dentry *dentry, struct list_head *list)
     919             : __must_hold(&dentry->d_lock)
     920             : {
     921   188966139 :         if (dentry->d_flags & DCACHE_SHRINK_LIST) {
     922             :                 /* let the owner of the list it's on deal with it */
     923       55034 :                 --dentry->d_lockref.count;
     924             :         } else {
     925   188911105 :                 if (dentry->d_flags & DCACHE_LRU_LIST)
     926      692772 :                         d_lru_del(dentry);
     927   188911241 :                 if (!--dentry->d_lockref.count)
     928    19837768 :                         d_shrink_add(dentry, list);
     929             :         }
     930   188966276 : }
     931             : 
     932      378616 : void dput_to_list(struct dentry *dentry, struct list_head *list)
     933             : {
     934      378616 :         rcu_read_lock();
     935      378616 :         if (likely(fast_dput(dentry))) {
     936      279650 :                 rcu_read_unlock();
     937      279650 :                 return;
     938             :         }
     939       98966 :         rcu_read_unlock();
     940       98966 :         if (!retain_dentry(dentry))
     941           0 :                 __dput_to_list(dentry, list);
     942       98966 :         spin_unlock(&dentry->d_lock);
     943             : }
     944             : 
     945             : /* This must be called with d_lock held */
     946             : static inline void __dget_dlock(struct dentry *dentry)
     947             : {
     948  1057031588 :         dentry->d_lockref.count++;
     949             : }
     950             : 
     951             : static inline void __dget(struct dentry *dentry)
     952             : {
     953   253206162 :         lockref_get(&dentry->d_lockref);
     954             : }
     955             : 
     956   862105482 : struct dentry *dget_parent(struct dentry *dentry)
     957             : {
     958   862105482 :         int gotref;
     959   862105482 :         struct dentry *ret;
     960   862105482 :         unsigned seq;
     961             : 
     962             :         /*
     963             :          * Do optimistic parent lookup without any
     964             :          * locking.
     965             :          */
     966   862105482 :         rcu_read_lock();
     967   861650566 :         seq = raw_seqcount_begin(&dentry->d_seq);
     968   861651459 :         ret = READ_ONCE(dentry->d_parent);
     969   861651459 :         gotref = lockref_get_not_zero(&ret->d_lockref);
     970   862797987 :         rcu_read_unlock();
     971   862792321 :         if (likely(gotref)) {
     972   862792321 :                 if (!read_seqcount_retry(&dentry->d_seq, seq))
     973             :                         return ret;
     974           3 :                 dput(ret);
     975             :         }
     976             : 
     977           0 : repeat:
     978             :         /*
     979             :          * Don't need rcu_dereference because we re-check it was correct under
     980             :          * the lock.
     981             :          */
     982           3 :         rcu_read_lock();
     983           3 :         ret = dentry->d_parent;
     984           3 :         spin_lock(&ret->d_lock);
     985           3 :         if (unlikely(ret != dentry->d_parent)) {
     986           0 :                 spin_unlock(&ret->d_lock);
     987           0 :                 rcu_read_unlock();
     988           0 :                 goto repeat;
     989             :         }
     990           3 :         rcu_read_unlock();
     991           3 :         BUG_ON(!ret->d_lockref.count);
     992           3 :         ret->d_lockref.count++;
     993           3 :         spin_unlock(&ret->d_lock);
     994           3 :         return ret;
     995             : }
     996             : EXPORT_SYMBOL(dget_parent);
     997             : 
     998             : static struct dentry * __d_find_any_alias(struct inode *inode)
     999             : {
    1000   625207468 :         struct dentry *alias;
    1001             : 
    1002   625207468 :         if (hlist_empty(&inode->i_dentry))
    1003             :                 return NULL;
    1004   253206162 :         alias = hlist_entry(inode->i_dentry.first, struct dentry, d_u.d_alias);
    1005         192 :         __dget(alias);
    1006   253205970 :         return alias;
    1007             : }
    1008             : 
    1009             : /**
    1010             :  * d_find_any_alias - find any alias for a given inode
    1011             :  * @inode: inode to find an alias for
    1012             :  *
    1013             :  * If any aliases exist for the given inode, take and return a
    1014             :  * reference for one of them.  If no aliases exist, return %NULL.
    1015             :  */
    1016   405796414 : struct dentry *d_find_any_alias(struct inode *inode)
    1017             : {
    1018   405796414 :         struct dentry *de;
    1019             : 
    1020   405796414 :         spin_lock(&inode->i_lock);
    1021   413473810 :         de = __d_find_any_alias(inode);
    1022   412506654 :         spin_unlock(&inode->i_lock);
    1023   410549252 :         return de;
    1024             : }
    1025             : EXPORT_SYMBOL(d_find_any_alias);
    1026             : 
    1027    11580821 : static struct dentry *__d_find_alias(struct inode *inode)
    1028             : {
    1029    11580821 :         struct dentry *alias;
    1030             : 
    1031    11580821 :         if (S_ISDIR(inode->i_mode))
    1032    23038534 :                 return __d_find_any_alias(inode);
    1033             : 
    1034      123106 :         hlist_for_each_entry(alias, &inode->i_dentry, d_u.d_alias) {
    1035       61553 :                 spin_lock(&alias->d_lock);
    1036       61549 :                 if (!d_unhashed(alias)) {
    1037       61549 :                         __dget_dlock(alias);
    1038       61549 :                         spin_unlock(&alias->d_lock);
    1039       61549 :                         return alias;
    1040             :                 }
    1041           0 :                 spin_unlock(&alias->d_lock);
    1042             :         }
    1043             :         return NULL;
    1044             : }
    1045             : 
    1046             : /**
    1047             :  * d_find_alias - grab a hashed alias of inode
    1048             :  * @inode: inode in question
    1049             :  *
    1050             :  * If inode has a hashed alias, or is a directory and has any alias,
    1051             :  * acquire the reference to alias and return it. Otherwise return NULL.
    1052             :  * Notice that if inode is a directory there can be only one alias and
    1053             :  * it can be unhashed only if it has no children, or if it is the root
    1054             :  * of a filesystem, or if the directory was renamed and d_revalidate
    1055             :  * was the first vfs operation to notice.
    1056             :  *
    1057             :  * If the inode has an IS_ROOT, DCACHE_DISCONNECTED alias, then prefer
    1058             :  * any other hashed alias over that one.
    1059             :  */
    1060    11579364 : struct dentry *d_find_alias(struct inode *inode)
    1061             : {
    1062    11579364 :         struct dentry *de = NULL;
    1063             : 
    1064    11579364 :         if (!hlist_empty(&inode->i_dentry)) {
    1065    11578778 :                 spin_lock(&inode->i_lock);
    1066    11580829 :                 de = __d_find_alias(inode);
    1067    11580819 :                 spin_unlock(&inode->i_lock);
    1068             :         }
    1069    11581407 :         return de;
    1070             : }
    1071             : EXPORT_SYMBOL(d_find_alias);
    1072             : 
    1073             : /*
    1074             :  *  Caller MUST be holding rcu_read_lock() and be guaranteed
    1075             :  *  that inode won't get freed until rcu_read_unlock().
    1076             :  */
    1077           0 : struct dentry *d_find_alias_rcu(struct inode *inode)
    1078             : {
    1079           0 :         struct hlist_head *l = &inode->i_dentry;
    1080           0 :         struct dentry *de = NULL;
    1081             : 
    1082           0 :         spin_lock(&inode->i_lock);
    1083             :         // ->i_dentry and ->i_rcu are colocated, but the latter won't be
    1084             :         // used without having I_FREEING set, which means no aliases left
    1085           0 :         if (likely(!(inode->i_state & I_FREEING) && !hlist_empty(l))) {
    1086           0 :                 if (S_ISDIR(inode->i_mode)) {
    1087           0 :                         de = hlist_entry(l->first, struct dentry, d_u.d_alias);
    1088             :                 } else {
    1089           0 :                         hlist_for_each_entry(de, l, d_u.d_alias)
    1090           0 :                                 if (!d_unhashed(de))
    1091             :                                         break;
    1092             :                 }
    1093             :         }
    1094           0 :         spin_unlock(&inode->i_lock);
    1095           0 :         return de;
    1096             : }
    1097             : 
    1098             : /*
    1099             :  *      Try to kill dentries associated with this inode.
    1100             :  * WARNING: you must own a reference to inode.
    1101             :  */
    1102         170 : void d_prune_aliases(struct inode *inode)
    1103             : {
    1104         170 :         struct dentry *dentry;
    1105         170 : restart:
    1106         170 :         spin_lock(&inode->i_lock);
    1107         510 :         hlist_for_each_entry(dentry, &inode->i_dentry, d_u.d_alias) {
    1108         170 :                 spin_lock(&dentry->d_lock);
    1109         170 :                 if (!dentry->d_lockref.count) {
    1110           0 :                         struct dentry *parent = lock_parent(dentry);
    1111           0 :                         if (likely(!dentry->d_lockref.count)) {
    1112           0 :                                 __dentry_kill(dentry);
    1113           0 :                                 dput(parent);
    1114           0 :                                 goto restart;
    1115             :                         }
    1116           0 :                         if (parent)
    1117           0 :                                 spin_unlock(&parent->d_lock);
    1118             :                 }
    1119         170 :                 spin_unlock(&dentry->d_lock);
    1120             :         }
    1121         170 :         spin_unlock(&inode->i_lock);
    1122         170 : }
    1123             : EXPORT_SYMBOL(d_prune_aliases);
    1124             : 
    1125             : /*
    1126             :  * Lock a dentry from shrink list.
    1127             :  * Called under rcu_read_lock() and dentry->d_lock; the former
    1128             :  * guarantees that nothing we access will be freed under us.
    1129             :  * Note that dentry is *not* protected from concurrent dentry_kill(),
    1130             :  * d_delete(), etc.
    1131             :  *
    1132             :  * Return false if dentry has been disrupted or grabbed, leaving
    1133             :  * the caller to kick it off-list.  Otherwise, return true and have
    1134             :  * that dentry's inode and parent both locked.
    1135             :  */
    1136   189305286 : static bool shrink_lock_dentry(struct dentry *dentry)
    1137             : {
    1138   189305286 :         struct inode *inode;
    1139   189305286 :         struct dentry *parent;
    1140             : 
    1141   189305286 :         if (dentry->d_lockref.count)
    1142             :                 return false;
    1143             : 
    1144   188967495 :         inode = dentry->d_inode;
    1145   304058163 :         if (inode && unlikely(!spin_trylock(&inode->i_lock))) {
    1146          33 :                 spin_unlock(&dentry->d_lock);
    1147          33 :                 spin_lock(&inode->i_lock);
    1148          33 :                 spin_lock(&dentry->d_lock);
    1149          33 :                 if (unlikely(dentry->d_lockref.count))
    1150           0 :                         goto out;
    1151             :                 /* changed inode means that somebody had grabbed it */
    1152          33 :                 if (unlikely(inode != dentry->d_inode))
    1153           0 :                         goto out;
    1154             :         }
    1155             : 
    1156   188967796 :         parent = dentry->d_parent;
    1157   377935876 :         if (IS_ROOT(dentry) || likely(spin_trylock(&parent->d_lock)))
    1158   188966918 :                 return true;
    1159             : 
    1160        1162 :         spin_unlock(&dentry->d_lock);
    1161        1162 :         spin_lock(&parent->d_lock);
    1162        1162 :         if (unlikely(parent != dentry->d_parent)) {
    1163           0 :                 spin_unlock(&parent->d_lock);
    1164           0 :                 spin_lock(&dentry->d_lock);
    1165           0 :                 goto out;
    1166             :         }
    1167        1162 :         spin_lock_nested(&dentry->d_lock, DENTRY_D_LOCK_NESTED);
    1168        1162 :         if (likely(!dentry->d_lockref.count))
    1169             :                 return true;
    1170           0 :         spin_unlock(&parent->d_lock);
    1171           0 : out:
    1172           0 :         if (inode)
    1173           0 :                 spin_unlock(&inode->i_lock);
    1174             :         return false;
    1175             : }
    1176             : 
    1177    15315361 : void shrink_dentry_list(struct list_head *list)
    1178             : {
    1179   204617892 :         while (!list_empty(list)) {
    1180   189305415 :                 struct dentry *dentry, *parent;
    1181             : 
    1182   189305415 :                 dentry = list_entry(list->prev, struct dentry, d_lru);
    1183   189305415 :                 spin_lock(&dentry->d_lock);
    1184   189305855 :                 rcu_read_lock();
    1185   189305744 :                 if (!shrink_lock_dentry(dentry)) {
    1186      337791 :                         bool can_free = false;
    1187      337791 :                         rcu_read_unlock();
    1188      337791 :                         d_shrink_del(dentry);
    1189      337791 :                         if (dentry->d_lockref.count < 0)
    1190           0 :                                 can_free = dentry->d_flags & DCACHE_MAY_FREE;
    1191      337791 :                         spin_unlock(&dentry->d_lock);
    1192      337791 :                         if (can_free)
    1193           0 :                                 dentry_free(dentry);
    1194      337791 :                         continue;
    1195             :                 }
    1196   188967950 :                 rcu_read_unlock();
    1197   188967937 :                 d_shrink_del(dentry);
    1198   188966266 :                 parent = dentry->d_parent;
    1199   188966266 :                 if (parent != dentry)
    1200   188966266 :                         __dput_to_list(parent, list);
    1201   188966215 :                 __dentry_kill(dentry);
    1202             :         }
    1203    15312477 : }
    1204             : 
    1205    85293365 : static enum lru_status dentry_lru_isolate(struct list_head *item,
    1206             :                 struct list_lru_one *lru, spinlock_t *lru_lock, void *arg)
    1207             : {
    1208    85293365 :         struct list_head *freeable = arg;
    1209    85293365 :         struct dentry   *dentry = container_of(item, struct dentry, d_lru);
    1210             : 
    1211             : 
    1212             :         /*
    1213             :          * we are inverting the lru lock/dentry->d_lock here,
    1214             :          * so use a trylock. If we fail to get the lock, just skip
    1215             :          * it
    1216             :          */
    1217    85293365 :         if (!spin_trylock(&dentry->d_lock))
    1218             :                 return LRU_SKIP;
    1219             : 
    1220             :         /*
    1221             :          * Referenced dentries are still in use. If they have active
    1222             :          * counts, just remove them from the LRU. Otherwise give them
    1223             :          * another pass through the LRU.
    1224             :          */
    1225    85293365 :         if (dentry->d_lockref.count) {
    1226     1242551 :                 d_lru_isolate(lru, dentry);
    1227     1242551 :                 spin_unlock(&dentry->d_lock);
    1228     1242551 :                 return LRU_REMOVED;
    1229             :         }
    1230             : 
    1231    84050814 :         if (dentry->d_flags & DCACHE_REFERENCED) {
    1232    46821705 :                 dentry->d_flags &= ~DCACHE_REFERENCED;
    1233    46821705 :                 spin_unlock(&dentry->d_lock);
    1234             : 
    1235             :                 /*
    1236             :                  * The list move itself will be made by the common LRU code. At
    1237             :                  * this point, we've dropped the dentry->d_lock but keep the
    1238             :                  * lru lock. This is safe to do, since every list movement is
    1239             :                  * protected by the lru lock even if both locks are held.
    1240             :                  *
    1241             :                  * This is guaranteed by the fact that all LRU management
    1242             :                  * functions are intermediated by the LRU API calls like
    1243             :                  * list_lru_add and list_lru_del. List movement in this file
    1244             :                  * only ever occurs through these functions or through callbacks
    1245             :                  * like this one, which are called from the LRU API.
    1246             :                  *
    1247             :                  * The only exceptions to this are functions like
    1248             :                  * shrink_dentry_list, and code that first checks for the
    1249             :                  * DCACHE_SHRINK_LIST flag.  Those are guaranteed to be
    1250             :                  * operating only with stack provided lists after they are
    1251             :                  * properly isolated from the main list.  It is thus always a
    1252             :                  * local access.
    1253             :                  */
    1254    46821705 :                 return LRU_ROTATE;
    1255             :         }
    1256             : 
    1257    37229109 :         d_lru_shrink_move(lru, dentry, freeable);
    1258    37229109 :         spin_unlock(&dentry->d_lock);
    1259             : 
    1260    37229109 :         return LRU_REMOVED;
    1261             : }
    1262             : 
    1263             : /**
    1264             :  * prune_dcache_sb - shrink the dcache
    1265             :  * @sb: superblock
    1266             :  * @sc: shrink control, passed to list_lru_shrink_walk()
    1267             :  *
    1268             :  * Attempt to shrink the superblock dcache LRU by @sc->nr_to_scan entries. This
    1269             :  * is done when we need more memory and called from the superblock shrinker
    1270             :  * function.
    1271             :  *
    1272             :  * This function may fail to free any resources if all the dentries are in
    1273             :  * use.
    1274             :  */
    1275      354363 : long prune_dcache_sb(struct super_block *sb, struct shrink_control *sc)
    1276             : {
    1277      354363 :         LIST_HEAD(dispose);
    1278      354363 :         long freed;
    1279             : 
    1280      354363 :         freed = list_lru_shrink_walk(&sb->s_dentry_lru, sc,
    1281             :                                      dentry_lru_isolate, &dispose);
    1282      354363 :         shrink_dentry_list(&dispose);
    1283      354363 :         return freed;
    1284             : }
    1285             : 
    1286     1866315 : static enum lru_status dentry_lru_isolate_shrink(struct list_head *item,
    1287             :                 struct list_lru_one *lru, spinlock_t *lru_lock, void *arg)
    1288             : {
    1289     1866315 :         struct list_head *freeable = arg;
    1290     1866315 :         struct dentry   *dentry = container_of(item, struct dentry, d_lru);
    1291             : 
    1292             :         /*
    1293             :          * we are inverting the lru lock/dentry->d_lock here,
    1294             :          * so use a trylock. If we fail to get the lock, just skip
    1295             :          * it
    1296             :          */
    1297     1866315 :         if (!spin_trylock(&dentry->d_lock))
    1298             :                 return LRU_SKIP;
    1299             : 
    1300     1866315 :         d_lru_shrink_move(lru, dentry, freeable);
    1301     1866315 :         spin_unlock(&dentry->d_lock);
    1302             : 
    1303     1866315 :         return LRU_REMOVED;
    1304             : }
    1305             : 
    1306             : 
    1307             : /**
    1308             :  * shrink_dcache_sb - shrink dcache for a superblock
    1309             :  * @sb: superblock
    1310             :  *
    1311             :  * Shrink the dcache for the specified super block. This is used to free
    1312             :  * the dcache before unmounting a file system.
    1313             :  */
    1314        8815 : void shrink_dcache_sb(struct super_block *sb)
    1315             : {
    1316       10419 :         do {
    1317       10419 :                 LIST_HEAD(dispose);
    1318             : 
    1319       10419 :                 list_lru_walk(&sb->s_dentry_lru,
    1320             :                         dentry_lru_isolate_shrink, &dispose, 1024);
    1321       10419 :                 shrink_dentry_list(&dispose);
    1322       10419 :         } while (list_lru_count(&sb->s_dentry_lru) > 0);
    1323        8815 : }
    1324             : EXPORT_SYMBOL(shrink_dcache_sb);
    1325             : 
    1326             : /**
    1327             :  * enum d_walk_ret - action to take during tree walk
    1328             :  * @D_WALK_CONTINUE:    continue walk
    1329             :  * @D_WALK_QUIT:        quit walk
    1330             :  * @D_WALK_NORETRY:     quit when retry is needed
    1331             :  * @D_WALK_SKIP:        skip this dentry and its children
    1332             :  */
    1333             : enum d_walk_ret {
    1334             :         D_WALK_CONTINUE,
    1335             :         D_WALK_QUIT,
    1336             :         D_WALK_NORETRY,
    1337             :         D_WALK_SKIP,
    1338             : };
    1339             : 
    1340             : /**
    1341             :  * d_walk - walk the dentry tree
    1342             :  * @parent:     start of walk
    1343             :  * @data:       data passed to @enter()
    1344             :  * @enter:      callback when first entering the dentry
    1345             :  *
    1346             :  * The @enter() callbacks are called with d_lock held.
    1347             :  */
    1348    37611365 : static void d_walk(struct dentry *parent, void *data,
    1349             :                    enum d_walk_ret (*enter)(void *, struct dentry *))
    1350             : {
    1351    37611365 :         struct dentry *this_parent;
    1352    37611365 :         struct list_head *next;
    1353    37611365 :         unsigned seq = 0;
    1354    37611365 :         enum d_walk_ret ret;
    1355    37611365 :         bool retry = true;
    1356             : 
    1357    37611842 : again:
    1358    37611842 :         read_seqbegin_or_lock(&rename_lock, &seq);
    1359    37611343 :         this_parent = parent;
    1360    37611343 :         spin_lock(&this_parent->d_lock);
    1361             : 
    1362    37616908 :         ret = enter(data, this_parent);
    1363    37609899 :         switch (ret) {
    1364             :         case D_WALK_CONTINUE:
    1365             :                 break;
    1366           0 :         case D_WALK_QUIT:
    1367             :         case D_WALK_SKIP:
    1368           0 :                 goto out_unlock;
    1369           0 :         case D_WALK_NORETRY:
    1370           0 :                 retry = false;
    1371           0 :                 break;
    1372             :         }
    1373             : repeat:
    1374    47517897 :         next = this_parent->d_subdirs.next;
    1375             : resume:
    1376   185556959 :         while (next != &this_parent->d_subdirs) {
    1377   140286631 :                 struct list_head *tmp = next;
    1378   140286631 :                 struct dentry *dentry = list_entry(tmp, struct dentry, d_child);
    1379   140286631 :                 next = tmp->next;
    1380             : 
    1381   140286631 :                 if (unlikely(dentry->d_flags & DCACHE_DENTRY_CURSOR))
    1382           0 :                         continue;
    1383             : 
    1384   140286631 :                 spin_lock_nested(&dentry->d_lock, DENTRY_D_LOCK_NESTED);
    1385             : 
    1386   140287065 :                 ret = enter(data, dentry);
    1387   140287195 :                 switch (ret) {
    1388             :                 case D_WALK_CONTINUE:
    1389             :                         break;
    1390       28857 :                 case D_WALK_QUIT:
    1391       28857 :                         spin_unlock(&dentry->d_lock);
    1392       28857 :                         goto out_unlock;
    1393   140035756 :                 case D_WALK_NORETRY:
    1394   140035756 :                         retry = false;
    1395   140035756 :                         break;
    1396           0 :                 case D_WALK_SKIP:
    1397           0 :                         spin_unlock(&dentry->d_lock);
    1398           0 :                         continue;
    1399             :                 }
    1400             : 
    1401   140258338 :                 if (!list_empty(&dentry->d_subdirs)) {
    1402     9907998 :                         spin_unlock(&this_parent->d_lock);
    1403     9907998 :                         spin_release(&dentry->d_lock.dep_map, _RET_IP_);
    1404     9907998 :                         this_parent = dentry;
    1405     9907998 :                         spin_acquire(&this_parent->d_lock.dep_map, 0, 1, _RET_IP_);
    1406     9907998 :                         goto repeat;
    1407             :                 }
    1408   130350340 :                 spin_unlock(&dentry->d_lock);
    1409             :         }
    1410             :         /*
    1411             :          * All done at this level ... ascend and resume the search.
    1412             :          */
    1413    45270328 :         rcu_read_lock();
    1414    47429765 : ascend:
    1415    47429765 :         if (this_parent != parent) {
    1416     9848679 :                 struct dentry *child = this_parent;
    1417     9848679 :                 this_parent = child->d_parent;
    1418             : 
    1419     9848679 :                 spin_unlock(&child->d_lock);
    1420     9848453 :                 spin_lock(&this_parent->d_lock);
    1421             : 
    1422             :                 /* might go back up the wrong parent if we have had a rename. */
    1423     9848452 :                 if (need_seqretry(&rename_lock, seq))
    1424          92 :                         goto rename_retry;
    1425             :                 /* go into the first sibling still alive */
    1426     9848360 :                 do {
    1427     9848360 :                         next = child->d_child.next;
    1428     9848360 :                         if (next == &this_parent->d_subdirs)
    1429     2159907 :                                 goto ascend;
    1430     7688453 :                         child = list_entry(next, struct dentry, d_child);
    1431     7688453 :                 } while (unlikely(child->d_flags & DCACHE_DENTRY_KILLED));
    1432     7688453 :                 rcu_read_unlock();
    1433     7688453 :                 goto resume;
    1434             :         }
    1435    37581086 :         if (need_seqretry(&rename_lock, seq))
    1436        1980 :                 goto rename_retry;
    1437    37579757 :         rcu_read_unlock();
    1438             : 
    1439    37609433 : out_unlock:
    1440    37609433 :         spin_unlock(&this_parent->d_lock);
    1441    37614436 :         done_seqretry(&rename_lock, seq);
    1442             :         return;
    1443             : 
    1444        2072 : rename_retry:
    1445        2072 :         spin_unlock(&this_parent->d_lock);
    1446        2072 :         rcu_read_unlock();
    1447        2072 :         BUG_ON(seq & 1);
    1448        2072 :         if (!retry)
    1449             :                 return;
    1450         477 :         seq = 1;
    1451         477 :         goto again;
    1452             : }
    1453             : 
    1454             : struct check_mount {
    1455             :         struct vfsmount *mnt;
    1456             :         unsigned int mounted;
    1457             : };
    1458             : 
    1459           0 : static enum d_walk_ret path_check_mount(void *data, struct dentry *dentry)
    1460             : {
    1461           0 :         struct check_mount *info = data;
    1462           0 :         struct path path = { .mnt = info->mnt, .dentry = dentry };
    1463             : 
    1464           0 :         if (likely(!d_mountpoint(dentry)))
    1465             :                 return D_WALK_CONTINUE;
    1466           0 :         if (__path_is_mountpoint(&path)) {
    1467           0 :                 info->mounted = 1;
    1468           0 :                 return D_WALK_QUIT;
    1469             :         }
    1470             :         return D_WALK_CONTINUE;
    1471             : }
    1472             : 
    1473             : /**
    1474             :  * path_has_submounts - check for mounts over a dentry in the
    1475             :  *                      current namespace.
    1476             :  * @parent: path to check.
    1477             :  *
    1478             :  * Return true if the parent or its subdirectories contain
    1479             :  * a mount point in the current namespace.
    1480             :  */
    1481           0 : int path_has_submounts(const struct path *parent)
    1482             : {
    1483           0 :         struct check_mount data = { .mnt = parent->mnt, .mounted = 0 };
    1484             : 
    1485           0 :         read_seqlock_excl(&mount_lock);
    1486           0 :         d_walk(parent->dentry, &data, path_check_mount);
    1487           0 :         read_sequnlock_excl(&mount_lock);
    1488             : 
    1489           0 :         return data.mounted;
    1490             : }
    1491             : EXPORT_SYMBOL(path_has_submounts);
    1492             : 
    1493             : /*
    1494             :  * Called by mount code to set a mountpoint and check if the mountpoint is
    1495             :  * reachable (e.g. NFS can unhash a directory dentry and then the complete
    1496             :  * subtree can become unreachable).
    1497             :  *
    1498             :  * Only one of d_invalidate() and d_set_mounted() must succeed.  For
    1499             :  * this reason take rename_lock and d_lock on dentry and ancestors.
    1500             :  */
    1501      378616 : int d_set_mounted(struct dentry *dentry)
    1502             : {
    1503      378616 :         struct dentry *p;
    1504      378616 :         int ret = -ENOENT;
    1505      378616 :         write_seqlock(&rename_lock);
    1506      380463 :         for (p = dentry->d_parent; !IS_ROOT(p); p = p->d_parent) {
    1507             :                 /* Need exclusion wrt. d_invalidate() */
    1508        1847 :                 spin_lock(&p->d_lock);
    1509        1847 :                 if (unlikely(d_unhashed(p))) {
    1510           0 :                         spin_unlock(&p->d_lock);
    1511           0 :                         goto out;
    1512             :                 }
    1513        1847 :                 spin_unlock(&p->d_lock);
    1514             :         }
    1515      378616 :         spin_lock(&dentry->d_lock);
    1516      378616 :         if (!d_unlinked(dentry)) {
    1517      378616 :                 ret = -EBUSY;
    1518      378616 :                 if (!d_mountpoint(dentry)) {
    1519      378616 :                         dentry->d_flags |= DCACHE_MOUNTED;
    1520      378616 :                         ret = 0;
    1521             :                 }
    1522             :         }
    1523      378616 :         spin_unlock(&dentry->d_lock);
    1524      378616 : out:
    1525      378616 :         write_sequnlock(&rename_lock);
    1526      378616 :         return ret;
    1527             : }
    1528             : 
    1529             : /*
    1530             :  * Search the dentry child list of the specified parent,
    1531             :  * and move any unused dentries to the end of the unused
    1532             :  * list for prune_dcache(). We descend to the next level
    1533             :  * whenever the d_subdirs list is non-empty and continue
    1534             :  * searching.
    1535             :  *
    1536             :  * It returns zero iff there are no unused children,
    1537             :  * otherwise  it returns the number of children moved to
    1538             :  * the end of the unused list. This may not be the total
    1539             :  * number of unused children, because select_parent can
    1540             :  * drop the lock and return early due to latency
    1541             :  * constraints.
    1542             :  */
    1543             : 
    1544             : struct select_data {
    1545             :         struct dentry *start;
    1546             :         union {
    1547             :                 long found;
    1548             :                 struct dentry *victim;
    1549             :         };
    1550             :         struct list_head dispose;
    1551             : };
    1552             : 
    1553   165358704 : static enum d_walk_ret select_collect(void *_data, struct dentry *dentry)
    1554             : {
    1555   165358704 :         struct select_data *data = _data;
    1556   165358704 :         enum d_walk_ret ret = D_WALK_CONTINUE;
    1557             : 
    1558   165358704 :         if (data->start == dentry)
    1559    25072112 :                 goto out;
    1560             : 
    1561   140286592 :         if (dentry->d_flags & DCACHE_SHRINK_LIST) {
    1562           0 :                 data->found++;
    1563             :         } else {
    1564   140286592 :                 if (dentry->d_flags & DCACHE_LRU_LIST)
    1565   138542672 :                         d_lru_del(dentry);
    1566   140286852 :                 if (!dentry->d_lockref.count) {
    1567   130373098 :                         d_shrink_add(dentry, &data->dispose);
    1568   130372949 :                         data->found++;
    1569             :                 }
    1570             :         }
    1571             :         /*
    1572             :          * We can return to the caller if we have found some (this
    1573             :          * ensures forward progress). We'll be coming back to find
    1574             :          * the rest.
    1575             :          */
    1576   140286703 :         if (!list_empty(&data->dispose))
    1577   140064518 :                 ret = need_resched() ? D_WALK_QUIT : D_WALK_NORETRY;
    1578      222185 : out:
    1579   165358815 :         return ret;
    1580             : }
    1581             : 
    1582           0 : static enum d_walk_ret select_collect2(void *_data, struct dentry *dentry)
    1583             : {
    1584           0 :         struct select_data *data = _data;
    1585           0 :         enum d_walk_ret ret = D_WALK_CONTINUE;
    1586             : 
    1587           0 :         if (data->start == dentry)
    1588           0 :                 goto out;
    1589             : 
    1590           0 :         if (dentry->d_flags & DCACHE_SHRINK_LIST) {
    1591           0 :                 if (!dentry->d_lockref.count) {
    1592           0 :                         rcu_read_lock();
    1593           0 :                         data->victim = dentry;
    1594           0 :                         return D_WALK_QUIT;
    1595             :                 }
    1596             :         } else {
    1597           0 :                 if (dentry->d_flags & DCACHE_LRU_LIST)
    1598           0 :                         d_lru_del(dentry);
    1599           0 :                 if (!dentry->d_lockref.count)
    1600           0 :                         d_shrink_add(dentry, &data->dispose);
    1601             :         }
    1602             :         /*
    1603             :          * We can return to the caller if we have found some (this
    1604             :          * ensures forward progress). We'll be coming back to find
    1605             :          * the rest.
    1606             :          */
    1607           0 :         if (!list_empty(&data->dispose))
    1608           0 :                 ret = need_resched() ? D_WALK_QUIT : D_WALK_NORETRY;
    1609           0 : out:
    1610             :         return ret;
    1611             : }
    1612             : 
    1613             : /**
    1614             :  * shrink_dcache_parent - prune dcache
    1615             :  * @parent: parent of entries to prune
    1616             :  *
    1617             :  * Prune the dcache to remove unused children of the parent dentry.
    1618             :  */
    1619    14123015 : void shrink_dcache_parent(struct dentry *parent)
    1620             : {
    1621    25071359 :         for (;;) {
    1622    25071359 :                 struct select_data data = {.start = parent};
    1623             : 
    1624    25071359 :                 INIT_LIST_HEAD(&data.dispose);
    1625    25071359 :                 d_walk(parent, &data, select_collect);
    1626             : 
    1627    25072407 :                 if (!list_empty(&data.dispose)) {
    1628    10951445 :                         shrink_dentry_list(&data.dispose);
    1629    10948344 :                         continue;
    1630             :                 }
    1631             : 
    1632    14120962 :                 cond_resched();
    1633    14118970 :                 if (!data.found)
    1634             :                         break;
    1635           0 :                 data.victim = NULL;
    1636           0 :                 d_walk(parent, &data, select_collect2);
    1637           0 :                 if (data.victim) {
    1638           0 :                         struct dentry *parent;
    1639           0 :                         spin_lock(&data.victim->d_lock);
    1640           0 :                         if (!shrink_lock_dentry(data.victim)) {
    1641           0 :                                 spin_unlock(&data.victim->d_lock);
    1642           0 :                                 rcu_read_unlock();
    1643             :                         } else {
    1644           0 :                                 rcu_read_unlock();
    1645           0 :                                 parent = data.victim->d_parent;
    1646           0 :                                 if (parent != data.victim)
    1647           0 :                                         __dput_to_list(parent, &data.dispose);
    1648           0 :                                 __dentry_kill(data.victim);
    1649             :                         }
    1650             :                 }
    1651           0 :                 if (!list_empty(&data.dispose))
    1652           0 :                         shrink_dentry_list(&data.dispose);
    1653             :         }
    1654    14118970 : }
    1655             : EXPORT_SYMBOL(shrink_dcache_parent);
    1656             : 
    1657      119457 : static enum d_walk_ret umount_check(void *_data, struct dentry *dentry)
    1658             : {
    1659             :         /* it has busy descendents; complain about those instead */
    1660      119457 :         if (!list_empty(&dentry->d_subdirs))
    1661             :                 return D_WALK_CONTINUE;
    1662             : 
    1663             :         /* root with refcount 1 is fine */
    1664      119453 :         if (dentry == _data && dentry->d_lockref.count == 1)
    1665             :                 return D_WALK_CONTINUE;
    1666             : 
    1667           0 :         printk(KERN_ERR "BUG: Dentry %p{i=%lx,n=%pd} "
    1668             :                         " still in use (%d) [unmount of %s %s]\n",
    1669             :                        dentry,
    1670             :                        dentry->d_inode ?
    1671             :                        dentry->d_inode->i_ino : 0UL,
    1672             :                        dentry,
    1673             :                        dentry->d_lockref.count,
    1674             :                        dentry->d_sb->s_type->name,
    1675             :                        dentry->d_sb->s_id);
    1676           0 :         WARN_ON(1);
    1677             :         return D_WALK_CONTINUE;
    1678             : }
    1679             : 
    1680      119455 : static void do_one_tree(struct dentry *dentry)
    1681             : {
    1682      119455 :         shrink_dcache_parent(dentry);
    1683      119453 :         d_walk(dentry, dentry, umount_check);
    1684      119451 :         d_drop(dentry);
    1685      119448 :         dput(dentry);
    1686      119453 : }
    1687             : 
    1688             : /*
    1689             :  * destroy the dentries attached to a superblock on unmounting
    1690             :  */
    1691      119454 : void shrink_dcache_for_umount(struct super_block *sb)
    1692             : {
    1693      119454 :         struct dentry *dentry;
    1694             : 
    1695      119454 :         WARN(down_read_trylock(&sb->s_umount), "s_umount should've been locked");
    1696             : 
    1697      119454 :         dentry = sb->s_root;
    1698      119454 :         sb->s_root = NULL;
    1699      119454 :         do_one_tree(dentry);
    1700             : 
    1701      119454 :         while (!hlist_bl_empty(&sb->s_roots)) {
    1702           0 :                 dentry = dget(hlist_bl_entry(hlist_bl_first(&sb->s_roots), struct dentry, d_hash));
    1703           0 :                 do_one_tree(dentry);
    1704             :         }
    1705      119454 : }
    1706             : 
    1707    12425550 : static enum d_walk_ret find_submount(void *_data, struct dentry *dentry)
    1708             : {
    1709    12425550 :         struct dentry **victim = _data;
    1710    12425550 :         if (d_mountpoint(dentry)) {
    1711           0 :                 __dget_dlock(dentry);
    1712           0 :                 *victim = dentry;
    1713           0 :                 return D_WALK_QUIT;
    1714             :         }
    1715             :         return D_WALK_CONTINUE;
    1716             : }
    1717             : 
    1718             : /**
    1719             :  * d_invalidate - detach submounts, prune dcache, and drop
    1720             :  * @dentry: dentry to invalidate (aka detach, prune and drop)
    1721             :  */
    1722    13230229 : void d_invalidate(struct dentry *dentry)
    1723             : {
    1724    13230229 :         bool had_submounts = false;
    1725    13230229 :         spin_lock(&dentry->d_lock);
    1726    13231669 :         if (d_unhashed(dentry)) {
    1727        4618 :                 spin_unlock(&dentry->d_lock);
    1728        4618 :                 return;
    1729             :         }
    1730    13227051 :         __d_drop(dentry);
    1731    13226793 :         spin_unlock(&dentry->d_lock);
    1732             : 
    1733             :         /* Negative dentries can be dropped without further checks */
    1734    13227052 :         if (!dentry->d_inode)
    1735             :                 return;
    1736             : 
    1737    12428508 :         shrink_dcache_parent(dentry);
    1738           0 :         for (;;) {
    1739    12425438 :                 struct dentry *victim = NULL;
    1740    12425438 :                 d_walk(dentry, &victim, find_submount);
    1741    12423342 :                 if (!victim) {
    1742    12423342 :                         if (had_submounts)
    1743           0 :                                 shrink_dcache_parent(dentry);
    1744    12423342 :                         return;
    1745             :                 }
    1746           0 :                 had_submounts = true;
    1747           0 :                 detach_mounts(victim);
    1748           0 :                 dput(victim);
    1749             :         }
    1750             : }
    1751             : EXPORT_SYMBOL(d_invalidate);
    1752             : 
    1753             : /**
    1754             :  * __d_alloc    -       allocate a dcache entry
    1755             :  * @sb: filesystem it will belong to
    1756             :  * @name: qstr of the name
    1757             :  *
    1758             :  * Allocates a dentry. It returns %NULL if there is insufficient memory
    1759             :  * or ->d_init() fails. On success the dentry is returned. The name passed
    1760             :  * in is copied, so the caller's copy may be reused after this call.
    1761             :  */
    1762             :  
    1763  1705614053 : static struct dentry *__d_alloc(struct super_block *sb, const struct qstr *name)
    1764             : {
    1765  1705614053 :         struct dentry *dentry;
    1766  1705614053 :         char *dname;
    1767  1705614053 :         int err;
    1768             : 
    1769  1705614053 :         dentry = kmem_cache_alloc_lru(dentry_cache, &sb->s_dentry_lru,
    1770             :                                       GFP_KERNEL);
    1771  1706190845 :         if (!dentry)
    1772             :                 return NULL;
    1773             : 
    1774             :         /*
    1775             :          * We guarantee that the inline name is always NUL-terminated.
    1776             :          * This way the memcpy() done by the name switching in rename
    1777             :          * will still always have a NUL at the end, even if we might
    1778             :          * be overwriting an internal NUL character
    1779             :          */
    1780  1706190845 :         dentry->d_iname[DNAME_INLINE_LEN-1] = 0;
    1781  1706190845 :         if (unlikely(!name)) {
    1782   176653758 :                 name = &slash_name;
    1783   176653758 :                 dname = dentry->d_iname;
    1784  1529537087 :         } else if (name->len > DNAME_INLINE_LEN-1) {
    1785   443812237 :                 size_t size = offsetof(struct external_name, name[1]);
    1786   443812237 :                 struct external_name *p = kmalloc(size + name->len,
    1787             :                                                   GFP_KERNEL_ACCOUNT |
    1788             :                                                   __GFP_RECLAIMABLE);
    1789   444412505 :                 if (!p) {
    1790           0 :                         kmem_cache_free(dentry_cache, dentry); 
    1791           0 :                         return NULL;
    1792             :                 }
    1793   444412505 :                 atomic_set(&p->u.count, 1);
    1794   444412505 :                 dname = p->name;
    1795             :         } else  {
    1796  1085724850 :                 dname = dentry->d_iname;
    1797             :         }       
    1798             : 
    1799  1706791113 :         dentry->d_name.len = name->len;
    1800  1706791113 :         dentry->d_name.hash = name->hash;
    1801  3413582226 :         memcpy(dname, name->name, name->len);
    1802  1706791113 :         dname[name->len] = 0;
    1803             : 
    1804             :         /* Make sure we always see the terminating NUL character */
    1805  1706791113 :         smp_store_release(&dentry->d_name.name, dname); /* ^^^ */
    1806             : 
    1807  1705698297 :         dentry->d_lockref.count = 1;
    1808  1705698297 :         dentry->d_flags = 0;
    1809  1705698297 :         spin_lock_init(&dentry->d_lock);
    1810  1697747800 :         seqcount_spinlock_init(&dentry->d_seq, &dentry->d_lock);
    1811  1697747800 :         dentry->d_inode = NULL;
    1812  1697747800 :         dentry->d_parent = dentry;
    1813  1697747800 :         dentry->d_sb = sb;
    1814  1697747800 :         dentry->d_op = NULL;
    1815  1697747800 :         dentry->d_fsdata = NULL;
    1816  1697747800 :         INIT_HLIST_BL_NODE(&dentry->d_hash);
    1817  1697747800 :         INIT_LIST_HEAD(&dentry->d_lru);
    1818  1697747800 :         INIT_LIST_HEAD(&dentry->d_subdirs);
    1819  1697747800 :         INIT_HLIST_NODE(&dentry->d_u.d_alias);
    1820  1697747800 :         INIT_LIST_HEAD(&dentry->d_child);
    1821  1697747800 :         d_set_d_op(dentry, dentry->d_sb->s_d_op);
    1822             : 
    1823  1705278236 :         if (dentry->d_op && dentry->d_op->d_init) {
    1824           0 :                 err = dentry->d_op->d_init(dentry);
    1825           0 :                 if (err) {
    1826           0 :                         if (dname_external(dentry))
    1827           0 :                                 kfree(external_name(dentry));
    1828           0 :                         kmem_cache_free(dentry_cache, dentry);
    1829           0 :                         return NULL;
    1830             :                 }
    1831             :         }
    1832             : 
    1833  1705278236 :         this_cpu_inc(nr_dentry);
    1834             : 
    1835  1705278236 :         return dentry;
    1836             : }
    1837             : 
    1838             : /**
    1839             :  * d_alloc      -       allocate a dcache entry
    1840             :  * @parent: parent of entry to allocate
    1841             :  * @name: qstr of the name
    1842             :  *
    1843             :  * Allocates a dentry. It returns %NULL if there is insufficient memory
    1844             :  * or ->d_init() fails. On success the dentry is returned. The name passed
    1845             :  * in is copied, so the caller's copy may be reused after this call.
    1846             :  */
    1847  1056208083 : struct dentry *d_alloc(struct dentry * parent, const struct qstr *name)
    1848             : {
    1849  1056208083 :         struct dentry *dentry = __d_alloc(parent->d_sb, name);
    1850  1055505345 :         if (!dentry)
    1851             :                 return NULL;
    1852  1055505345 :         spin_lock(&parent->d_lock);
    1853             :         /*
    1854             :          * don't need child lock because it is not subject
    1855             :          * to concurrency here
    1856             :          */
    1857  1056970039 :         __dget_dlock(parent);
    1858  1056970039 :         dentry->d_parent = parent;
    1859  1056970039 :         list_add(&dentry->d_child, &parent->d_subdirs);
    1860  1056928906 :         spin_unlock(&parent->d_lock);
    1861             : 
    1862  1056928906 :         return dentry;
    1863             : }
    1864             : EXPORT_SYMBOL(d_alloc);
    1865             : 
    1866        5610 : struct dentry *d_alloc_anon(struct super_block *sb)
    1867             : {
    1868        5610 :         return __d_alloc(sb, NULL);
    1869             : }
    1870             : EXPORT_SYMBOL(d_alloc_anon);
    1871             : 
    1872     6092333 : struct dentry *d_alloc_cursor(struct dentry * parent)
    1873             : {
    1874     6092333 :         struct dentry *dentry = d_alloc_anon(parent->d_sb);
    1875     6091924 :         if (dentry) {
    1876     6091924 :                 dentry->d_flags |= DCACHE_DENTRY_CURSOR;
    1877    12184042 :                 dentry->d_parent = dget(parent);
    1878             :         }
    1879     6092118 :         return dentry;
    1880             : }
    1881             : 
    1882             : /**
    1883             :  * d_alloc_pseudo - allocate a dentry (for lookup-less filesystems)
    1884             :  * @sb: the superblock
    1885             :  * @name: qstr of the name
    1886             :  *
    1887             :  * For a filesystem that just pins its dentries in memory and never
    1888             :  * performs lookups at all, return an unhashed IS_ROOT dentry.
    1889             :  * This is used for pipes, sockets et al. - the stuff that should
    1890             :  * never be anyone's children or parents.  Unlike all other
    1891             :  * dentries, these will not have RCU delay between dropping the
    1892             :  * last reference and freeing them.
    1893             :  *
    1894             :  * The only user is alloc_file_pseudo() and that's what should
    1895             :  * be considered a public interface.  Don't use directly.
    1896             :  */
    1897   474344212 : struct dentry *d_alloc_pseudo(struct super_block *sb, const struct qstr *name)
    1898             : {
    1899   474344212 :         struct dentry *dentry = __d_alloc(sb, name);
    1900   473916962 :         if (likely(dentry))
    1901   473916962 :                 dentry->d_flags |= DCACHE_NORCU;
    1902   473916962 :         return dentry;
    1903             : }
    1904             : 
    1905         124 : struct dentry *d_alloc_name(struct dentry *parent, const char *name)
    1906             : {
    1907         124 :         struct qstr q;
    1908             : 
    1909         124 :         q.name = name;
    1910         124 :         q.hash_len = hashlen_string(parent, name);
    1911         124 :         return d_alloc(parent, &q);
    1912             : }
    1913             : EXPORT_SYMBOL(d_alloc_name);
    1914             : 
    1915  2972121033 : void d_set_d_op(struct dentry *dentry, const struct dentry_operations *op)
    1916             : {
    1917  2972121033 :         WARN_ON_ONCE(dentry->d_op);
    1918  2972121033 :         WARN_ON_ONCE(dentry->d_flags & (DCACHE_OP_HASH   |
    1919             :                                 DCACHE_OP_COMPARE       |
    1920             :                                 DCACHE_OP_REVALIDATE    |
    1921             :                                 DCACHE_OP_WEAK_REVALIDATE       |
    1922             :                                 DCACHE_OP_DELETE        |
    1923             :                                 DCACHE_OP_REAL));
    1924  2972121033 :         dentry->d_op = op;
    1925  2972121033 :         if (!op)
    1926             :                 return;
    1927  1307827809 :         if (op->d_hash)
    1928           0 :                 dentry->d_flags |= DCACHE_OP_HASH;
    1929  1307827809 :         if (op->d_compare)
    1930        3715 :                 dentry->d_flags |= DCACHE_OP_COMPARE;
    1931  1307827809 :         if (op->d_revalidate)
    1932    27298644 :                 dentry->d_flags |= DCACHE_OP_REVALIDATE;
    1933  1307827809 :         if (op->d_weak_revalidate)
    1934     1545962 :                 dentry->d_flags |= DCACHE_OP_WEAK_REVALIDATE;
    1935  1307827809 :         if (op->d_delete)
    1936   828998813 :                 dentry->d_flags |= DCACHE_OP_DELETE;
    1937  1307827809 :         if (op->d_prune)
    1938       11367 :                 dentry->d_flags |= DCACHE_OP_PRUNE;
    1939  1307827809 :         if (op->d_real)
    1940      287063 :                 dentry->d_flags |= DCACHE_OP_REAL;
    1941             : 
    1942             : }
    1943             : EXPORT_SYMBOL(d_set_d_op);
    1944             : 
    1945             : 
    1946             : /*
    1947             :  * d_set_fallthru - Mark a dentry as falling through to a lower layer
    1948             :  * @dentry - The dentry to mark
    1949             :  *
    1950             :  * Mark a dentry as falling through to the lower layer (as set with
    1951             :  * d_pin_lower()).  This flag may be recorded on the medium.
    1952             :  */
    1953           0 : void d_set_fallthru(struct dentry *dentry)
    1954             : {
    1955           0 :         spin_lock(&dentry->d_lock);
    1956           0 :         dentry->d_flags |= DCACHE_FALLTHRU;
    1957           0 :         spin_unlock(&dentry->d_lock);
    1958           0 : }
    1959             : EXPORT_SYMBOL(d_set_fallthru);
    1960             : 
    1961   850747734 : static unsigned d_flags_for_inode(struct inode *inode)
    1962             : {
    1963   850747734 :         unsigned add_flags = DCACHE_REGULAR_TYPE;
    1964             : 
    1965   850747734 :         if (!inode)
    1966             :                 return DCACHE_MISS_TYPE;
    1967             : 
    1968   850747734 :         if (S_ISDIR(inode->i_mode)) {
    1969    37972399 :                 add_flags = DCACHE_DIRECTORY_TYPE;
    1970    37972399 :                 if (unlikely(!(inode->i_opflags & IOP_LOOKUP))) {
    1971    29907108 :                         if (unlikely(!inode->i_op->lookup))
    1972             :                                 add_flags = DCACHE_AUTODIR_TYPE;
    1973             :                         else
    1974    29907108 :                                 inode->i_opflags |= IOP_LOOKUP;
    1975             :                 }
    1976    37972399 :                 goto type_determined;
    1977             :         }
    1978             : 
    1979   812775335 :         if (unlikely(!(inode->i_opflags & IOP_NOFOLLOW))) {
    1980   648461662 :                 if (unlikely(inode->i_op->get_link)) {
    1981    39498172 :                         add_flags = DCACHE_SYMLINK_TYPE;
    1982    39498172 :                         goto type_determined;
    1983             :                 }
    1984   608963490 :                 inode->i_opflags |= IOP_NOFOLLOW;
    1985             :         }
    1986             : 
    1987   773277163 :         if (unlikely(!S_ISREG(inode->i_mode)))
    1988    77356894 :                 add_flags = DCACHE_SPECIAL_TYPE;
    1989             : 
    1990   695920269 : type_determined:
    1991   850747734 :         if (unlikely(IS_AUTOMOUNT(inode)))
    1992           0 :                 add_flags |= DCACHE_NEED_AUTOMOUNT;
    1993             :         return add_flags;
    1994             : }
    1995             : 
    1996   603095352 : static void __d_instantiate(struct dentry *dentry, struct inode *inode)
    1997             : {
    1998   603095352 :         unsigned add_flags = d_flags_for_inode(inode);
    1999   601887787 :         WARN_ON(d_in_lookup(dentry));
    2000             : 
    2001   601887787 :         spin_lock(&dentry->d_lock);
    2002             :         /*
    2003             :          * Decrement negative dentry count if it was in the LRU list.
    2004             :          */
    2005   603410204 :         if (dentry->d_flags & DCACHE_LRU_LIST)
    2006    25433093 :                 this_cpu_dec(nr_dentry_negative);
    2007   603246398 :         hlist_add_head(&dentry->d_u.d_alias, &inode->i_dentry);
    2008   603246398 :         raw_write_seqcount_begin(&dentry->d_seq);
    2009   602477984 :         __d_set_inode_and_type(dentry, inode, add_flags);
    2010   602439677 :         raw_write_seqcount_end(&dentry->d_seq);
    2011   602428853 :         fsnotify_update_flags(dentry);
    2012   602001689 :         spin_unlock(&dentry->d_lock);
    2013   603640986 : }
    2014             : 
    2015             : /**
    2016             :  * d_instantiate - fill in inode information for a dentry
    2017             :  * @entry: dentry to complete
    2018             :  * @inode: inode to attach to this dentry
    2019             :  *
    2020             :  * Fill in inode information in the entry.
    2021             :  *
    2022             :  * This turns negative dentries into productive full members
    2023             :  * of society.
    2024             :  *
    2025             :  * NOTE! This assumes that the inode count has been incremented
    2026             :  * (or otherwise set) by the caller to indicate that it is now
    2027             :  * in use by the dcache.
    2028             :  */
    2029             :  
    2030   597490730 : void d_instantiate(struct dentry *entry, struct inode * inode)
    2031             : {
    2032   597490730 :         BUG_ON(!hlist_unhashed(&entry->d_u.d_alias));
    2033   597490730 :         if (inode) {
    2034   597490730 :                 security_d_instantiate(entry, inode);
    2035   597490730 :                 spin_lock(&inode->i_lock);
    2036   598419505 :                 __d_instantiate(entry, inode);
    2037   598521873 :                 spin_unlock(&inode->i_lock);
    2038             :         }
    2039   598927393 : }
    2040             : EXPORT_SYMBOL(d_instantiate);
    2041             : 
    2042             : /*
    2043             :  * This should be equivalent to d_instantiate() + unlock_new_inode(),
    2044             :  * with lockdep-related part of unlock_new_inode() done before
    2045             :  * anything else.  Use that instead of open-coding d_instantiate()/
    2046             :  * unlock_new_inode() combinations.
    2047             :  */
    2048     5088871 : void d_instantiate_new(struct dentry *entry, struct inode *inode)
    2049             : {
    2050     5088871 :         BUG_ON(!hlist_unhashed(&entry->d_u.d_alias));
    2051     5088871 :         BUG_ON(!inode);
    2052     5088871 :         lockdep_annotate_inode_mutex_key(inode);
    2053     5088871 :         security_d_instantiate(entry, inode);
    2054     5088871 :         spin_lock(&inode->i_lock);
    2055     5089778 :         __d_instantiate(entry, inode);
    2056     5088913 :         WARN_ON(!(inode->i_state & I_NEW));
    2057     5088913 :         inode->i_state &= ~I_NEW & ~I_CREATING;
    2058     5088913 :         smp_mb();
    2059     5089977 :         wake_up_bit(&inode->i_state, __I_NEW);
    2060     5089027 :         spin_unlock(&inode->i_lock);
    2061     5089349 : }
    2062             : EXPORT_SYMBOL(d_instantiate_new);
    2063             : 
    2064      119410 : struct dentry *d_make_root(struct inode *root_inode)
    2065             : {
    2066      119410 :         struct dentry *res = NULL;
    2067             : 
    2068      119410 :         if (root_inode) {
    2069      119410 :                 res = d_alloc_anon(root_inode->i_sb);
    2070      119390 :                 if (res)
    2071      119390 :                         d_instantiate(res, root_inode);
    2072             :                 else
    2073           0 :                         iput(root_inode);
    2074             :         }
    2075      119417 :         return res;
    2076             : }
    2077             : EXPORT_SYMBOL(d_make_root);
    2078             : 
    2079   170351394 : static struct dentry *__d_instantiate_anon(struct dentry *dentry,
    2080             :                                            struct inode *inode,
    2081             :                                            bool disconnected)
    2082             : {
    2083   170351394 :         struct dentry *res;
    2084   170351394 :         unsigned add_flags;
    2085             : 
    2086   170351394 :         security_d_instantiate(dentry, inode);
    2087   170351394 :         spin_lock(&inode->i_lock);
    2088   175058861 :         res = __d_find_any_alias(inode);
    2089         192 :         if (res) {
    2090         192 :                 spin_unlock(&inode->i_lock);
    2091         192 :                 dput(dentry);
    2092         192 :                 goto out_iput;
    2093             :         }
    2094             : 
    2095             :         /* attach a disconnected dentry */
    2096   175058669 :         add_flags = d_flags_for_inode(inode);
    2097             : 
    2098   171890943 :         if (disconnected)
    2099   171320124 :                 add_flags |= DCACHE_DISCONNECTED;
    2100             : 
    2101   171890943 :         spin_lock(&dentry->d_lock);
    2102   175555243 :         __d_set_inode_and_type(dentry, inode, add_flags);
    2103   175571253 :         hlist_add_head(&dentry->d_u.d_alias, &inode->i_dentry);
    2104   175571253 :         if (!disconnected) {
    2105           0 :                 hlist_bl_lock(&dentry->d_sb->s_roots);
    2106           0 :                 hlist_bl_add_head(&dentry->d_hash, &dentry->d_sb->s_roots);
    2107           0 :                 hlist_bl_unlock(&dentry->d_sb->s_roots);
    2108             :         }
    2109   175571253 :         spin_unlock(&dentry->d_lock);
    2110   173305349 :         spin_unlock(&inode->i_lock);
    2111             : 
    2112   173305349 :         return dentry;
    2113             : 
    2114             :  out_iput:
    2115         192 :         iput(inode);
    2116         192 :         return res;
    2117             : }
    2118             : 
    2119           0 : struct dentry *d_instantiate_anon(struct dentry *dentry, struct inode *inode)
    2120             : {
    2121           0 :         return __d_instantiate_anon(dentry, inode, true);
    2122             : }
    2123             : EXPORT_SYMBOL(d_instantiate_anon);
    2124             : 
    2125   398192315 : static struct dentry *__d_obtain_alias(struct inode *inode, bool disconnected)
    2126             : {
    2127   398192315 :         struct dentry *tmp;
    2128   398192315 :         struct dentry *res;
    2129             : 
    2130   398192315 :         if (!inode)
    2131             :                 return ERR_PTR(-ESTALE);
    2132   398192315 :         if (IS_ERR(inode))
    2133             :                 return ERR_CAST(inode);
    2134             : 
    2135   398167976 :         res = d_find_any_alias(inode);
    2136   398603163 :         if (res)
    2137   226950980 :                 goto out_iput;
    2138             : 
    2139   171652183 :         tmp = d_alloc_anon(inode->i_sb);
    2140   170753002 :         if (!tmp) {
    2141           0 :                 res = ERR_PTR(-ENOMEM);
    2142           0 :                 goto out_iput;
    2143             :         }
    2144             : 
    2145   170753002 :         return __d_instantiate_anon(tmp, inode, disconnected);
    2146             : 
    2147   226950980 : out_iput:
    2148   226950980 :         iput(inode);
    2149   226950980 :         return res;
    2150             : }
    2151             : 
    2152             : /**
    2153             :  * d_obtain_alias - find or allocate a DISCONNECTED dentry for a given inode
    2154             :  * @inode: inode to allocate the dentry for
    2155             :  *
    2156             :  * Obtain a dentry for an inode resulting from NFS filehandle conversion or
    2157             :  * similar open by handle operations.  The returned dentry may be anonymous,
    2158             :  * or may have a full name (if the inode was already in the cache).
    2159             :  *
    2160             :  * When called on a directory inode, we must ensure that the inode only ever
    2161             :  * has one dentry.  If a dentry is found, that is returned instead of
    2162             :  * allocating a new one.
    2163             :  *
    2164             :  * On successful return, the reference to the inode has been transferred
    2165             :  * to the dentry.  In case of an error the reference on the inode is released.
    2166             :  * To make it easier to use in export operations a %NULL or IS_ERR inode may
    2167             :  * be passed in and the error will be propagated to the return value,
    2168             :  * with a %NULL @inode replaced by ERR_PTR(-ESTALE).
    2169             :  */
    2170   400919636 : struct dentry *d_obtain_alias(struct inode *inode)
    2171             : {
    2172   400919636 :         return __d_obtain_alias(inode, true);
    2173             : }
    2174             : EXPORT_SYMBOL(d_obtain_alias);
    2175             : 
    2176             : /**
    2177             :  * d_obtain_root - find or allocate a dentry for a given inode
    2178             :  * @inode: inode to allocate the dentry for
    2179             :  *
    2180             :  * Obtain an IS_ROOT dentry for the root of a filesystem.
    2181             :  *
    2182             :  * We must ensure that directory inodes only ever have one dentry.  If a
    2183             :  * dentry is found, that is returned instead of allocating a new one.
    2184             :  *
    2185             :  * On successful return, the reference to the inode has been transferred
    2186             :  * to the dentry.  In case of an error the reference on the inode is
    2187             :  * released.  A %NULL or IS_ERR inode may be passed in and the
    2188             :  * error will be propagated to the return value, with a %NULL @inode
    2189             :  * replaced by ERR_PTR(-ESTALE).
    2190             :  */
    2191           0 : struct dentry *d_obtain_root(struct inode *inode)
    2192             : {
    2193           0 :         return __d_obtain_alias(inode, false);
    2194             : }
    2195             : EXPORT_SYMBOL(d_obtain_root);
    2196             : 
    2197             : /**
    2198             :  * d_add_ci - lookup or allocate new dentry with case-exact name
    2199             :  * @inode:  the inode case-insensitive lookup has found
    2200             :  * @dentry: the negative dentry that was passed to the parent's lookup func
    2201             :  * @name:   the case-exact name to be associated with the returned dentry
    2202             :  *
    2203             :  * This is to avoid filling the dcache with case-insensitive names to the
    2204             :  * same inode, only the actual correct case is stored in the dcache for
    2205             :  * case-insensitive filesystems.
    2206             :  *
    2207             :  * If the case-insensitive lookup matched and a dentry with the case-exact
    2208             :  * name already exists in the dcache, use it and return it.
    2209             :  *
    2210             :  * If no entry exists with the exact case name, allocate new dentry with
    2211             :  * the exact case, and return the spliced entry.
    2212             :  */
    2213      484528 : struct dentry *d_add_ci(struct dentry *dentry, struct inode *inode,
    2214             :                         struct qstr *name)
    2215             : {
    2216      484528 :         struct dentry *found, *res;
    2217             : 
    2218             :         /*
    2219             :          * First check if a dentry matching the name already exists,
    2220             :          * if not go ahead and create it now.
    2221             :          */
    2222      484528 :         found = d_hash_and_lookup(dentry->d_parent, name);
    2223      484528 :         if (found) {
    2224      357324 :                 iput(inode);
    2225      357324 :                 return found;
    2226             :         }
    2227      127204 :         if (d_in_lookup(dentry)) {
    2228      126951 :                 found = d_alloc_parallel(dentry->d_parent, name,
    2229             :                                         dentry->d_wait);
    2230      126951 :                 if (IS_ERR(found) || !d_in_lookup(found)) {
    2231           0 :                         iput(inode);
    2232           0 :                         return found;
    2233             :                 }
    2234             :         } else {
    2235         253 :                 found = d_alloc(dentry->d_parent, name);
    2236         253 :                 if (!found) {
    2237           0 :                         iput(inode);
    2238           0 :                         return ERR_PTR(-ENOMEM);
    2239             :                 } 
    2240             :         }
    2241      127204 :         res = d_splice_alias(inode, found);
    2242      127204 :         if (res) {
    2243           0 :                 d_lookup_done(found);
    2244           0 :                 dput(found);
    2245           0 :                 return res;
    2246             :         }
    2247             :         return found;
    2248             : }
    2249             : EXPORT_SYMBOL(d_add_ci);
    2250             : 
    2251             : /**
    2252             :  * d_same_name - compare dentry name with case-exact name
    2253             :  * @dentry: the dentry whose name is compared
    2254             :  * @parent: parent dentry; its ->d_compare() is used if DCACHE_OP_COMPARE is set
    2255             :  * @name:   the name to compare the dentry's name against
    2256             :  *
    2257             :  * Return: true if the names are the same, false otherwise
    2258             :  */
    2259  1285471689 : bool d_same_name(const struct dentry *dentry, const struct dentry *parent,
    2260             :                  const struct qstr *name)
    2261             : {
    2262  1285471689 :         if (likely(!(parent->d_flags & DCACHE_OP_COMPARE))) {
    2263  1284968379 :                 if (dentry->d_name.len != name->len)
    2264             :                         return false;
    2265  1284873980 :                 return dentry_cmp(dentry, name->name, name->len) == 0;
    2266             :         }
    2267      503310 :         return parent->d_op->d_compare(dentry,
    2268      503310 :                                        dentry->d_name.len, dentry->d_name.name,
    2269      503310 :                                        name) == 0;
    2270             : }
    2271             : EXPORT_SYMBOL_GPL(d_same_name);
    2272             : 
    2273             : /*
    2274             :  * Slow-path variant of __d_lookup_rcu(), used when the parent dentry has
    2275             :  * DCACHE_OP_COMPARE set, so names must be matched through ->d_compare().
    2276             :  */
    2277        2777 : static noinline struct dentry *__d_lookup_rcu_op_compare(
    2278             :         const struct dentry *parent,
    2279             :         const struct qstr *name,
    2280             :         unsigned *seqp)
    2281             : {
    2282        2777 :         u64 hashlen = name->hash_len;
    2283        2777 :         struct hlist_bl_head *b = d_hash(hashlen_hash(hashlen));
    2284        2775 :         struct hlist_bl_node *node;
    2285        2775 :         struct dentry *dentry;
    2286             : 
    2287        2812 :         hlist_bl_for_each_entry_rcu(dentry, node, b, d_hash) {
    2288          38 :                 int tlen;
    2289          38 :                 const char *tname;
    2290          38 :                 unsigned seq;
    2291             : 
    2292          38 : seqretry:
    2293          38 :                 seq = raw_seqcount_begin(&dentry->d_seq);
    2294          38 :                 if (dentry->d_parent != parent)
    2295          37 :                         continue;
    2296           1 :                 if (d_unhashed(dentry))
    2297           0 :                         continue;
    2298           1 :                 if (dentry->d_name.hash != hashlen_hash(hashlen))       /* only the hash half of hash_len is compared here */
    2299           0 :                         continue;
    2300           1 :                 tlen = dentry->d_name.len;
    2301           1 :                 tname = dentry->d_name.name;
    2302             :                 /* we want a consistent (name,len) pair: resample d_seq if it moved while we read them */
    2303           1 :                 if (read_seqcount_retry(&dentry->d_seq, seq)) {
    2304           0 :                         cpu_relax();
    2305           0 :                         goto seqretry;
    2306             :                 }
    2307           1 :                 if (parent->d_op->d_compare(dentry, tlen, tname, name) != 0)    /* non-zero: not a match */
    2308           0 :                         continue;
    2309           1 :                 *seqp = seq;    /* hand back the d_seq sample the match was validated against */
    2310           1 :                 return dentry;
    2311             :         }
    2312             :         return NULL;
    2313             : }
    2314             : 
    2315             : /**
    2316             :  * __d_lookup_rcu - search for a dentry (racy, store-free)
    2317             :  * @parent: parent dentry
    2318             :  * @name: qstr of name we wish to find
    2319             :  * @seqp: returns d_seq value at the point where the dentry was found
    2320             :  * Returns: dentry, or NULL
    2321             :  *
    2322             :  * __d_lookup_rcu is the dcache lookup function for rcu-walk name
    2323             :  * resolution (store-free path walking) design described in
    2324             :  * Documentation/filesystems/path-lookup.txt.
    2325             :  *
    2326             :  * This is not to be used outside core vfs.
    2327             :  *
    2328             :  * __d_lookup_rcu must only be used in rcu-walk mode, i.e. with vfsmount lock
    2329             :  * held, and rcu_read_lock held. The returned dentry must not be stored into
    2330             :  * without taking d_lock and checking d_seq sequence count against the value
    2331             :  * returned in @seqp.
    2332             :  *
    2333             :  * A refcount may be taken on the found dentry with the d_rcu_to_refcount
    2334             :  * function.
    2335             :  *
    2336             :  * Alternatively, __d_lookup_rcu may be called again to look up the child of
    2337             :  * the returned dentry, so long as its parent's seqlock is checked after the
    2338             :  * child is looked up. Thus, an interlocking stepping of sequence lock checks
    2339             :  * is formed, giving integrity down the path walk.
    2340             :  *
    2341             :  * NOTE! The caller *has* to check the resulting dentry against the sequence
    2342             :  * number we've returned before using any of the resulting dentry state!
    2343             :  */
    2344 64775580717 : struct dentry *__d_lookup_rcu(const struct dentry *parent,
    2345             :                                 const struct qstr *name,
    2346             :                                 unsigned *seqp)
    2347             : {
    2348 64775580717 :         u64 hashlen = name->hash_len;
    2349 64775580717 :         const unsigned char *str = name->name;
    2350 64775580717 :         struct hlist_bl_head *b = d_hash(hashlen_hash(hashlen));
    2351 64744815793 :         struct hlist_bl_node *node;
    2352 64744815793 :         struct dentry *dentry;
    2353             : 
    2354             :         /*
    2355             :          * Note: There is significant duplication with __d_lookup() which is
    2356             :          * required to prevent single threaded performance regressions
    2357             :          * especially on architectures where smp_rmb (in seqcounts) is costly.
    2358             :          * Keep the two functions in sync.
    2359             :          */
    2360             : 
    2361 64744815793 :         if (unlikely(parent->d_flags & DCACHE_OP_COMPARE))
    2362        2779 :                 return __d_lookup_rcu_op_compare(parent, name, seqp);
    2363             : 
    2364             :         /*
    2365             :          * The hash list is protected using RCU.
    2366             :          *
    2367             :          * Carefully use d_seq when comparing a candidate dentry, to avoid
    2368             :          * races with d_move().
    2369             :          *
    2370             :          * It is possible that concurrent renames can mess up our list
    2371             :          * walk here and result in missing our dentry, resulting in the
    2372             :          * false-negative result. d_lookup() protects against concurrent
    2373             :          * renames using rename_lock seqlock.
    2374             :          *
    2375             :          * See Documentation/filesystems/path-lookup.txt for more details.
    2376             :          */
    2377 73586850925 :         hlist_bl_for_each_entry_rcu(dentry, node, b, d_hash) {
    2378 71795117834 :                 unsigned seq;
    2379             : 
    2380             :                 /*
    2381             :                  * The dentry sequence count protects us from concurrent
    2382             :                  * renames, and thus protects parent and name fields.
    2383             :                  *
    2384             :                  * The caller must perform a seqcount check in order
    2385             :                  * to do anything useful with the returned dentry.
    2386             :                  *
    2387             :                  * NOTE! We do a "raw" seqcount_begin here. That means that
    2388             :                  * we don't wait for the sequence count to stabilize if it
    2389             :                  * is in the middle of a sequence change. If we do the slow
    2390             :                  * dentry compare, we will do seqretries until it is stable,
    2391             :                  * and if we end up with a successful lookup, we actually
    2392             :                  * want to exit RCU lookup anyway.
    2393             :                  *
    2394             :                  * Note that raw_seqcount_begin still *does* smp_rmb(), so
    2395             :                  * we are still guaranteed NUL-termination of ->d_name.name.
    2396             :                  */
    2397 71795117834 :                 seq = raw_seqcount_begin(&dentry->d_seq);
    2398 71774640213 :                 if (dentry->d_parent != parent)
    2399  8810940509 :                         continue;
    2400 62963699704 :                 if (d_unhashed(dentry))
    2401       34759 :                         continue;
    2402 62963664945 :                 if (dentry->d_name.hash_len != hashlen)        /* hash and length are checked together in one compare */
    2403    31052586 :                         continue;
    2404 62932612359 :                 if (dentry_cmp(dentry, str, hashlen_len(hashlen)) != 0)
    2405       10057 :                         continue;
    2406 62935831996 :                 *seqp = seq;    /* the caller must validate the dentry against this sample */
    2407 62935831996 :                 return dentry;
    2408             :         }
    2409             :         return NULL;
    2410             : }
    2411             : 
    2412             : /**
    2413             :  * d_lookup - search for a dentry
    2414             :  * @parent: parent dentry
    2415             :  * @name: qstr of name we wish to find
    2416             :  * Returns: dentry, or NULL
    2417             :  *
    2418             :  * d_lookup searches the children of the parent dentry for the name in
    2419             :  * question. If the dentry is found its reference count is incremented and the
    2420             :  * dentry is returned. The caller must use dput to free the entry when it has
    2421             :  * finished using it. %NULL is returned if the dentry does not exist.
    2422             :  */
    2423   958543513 : struct dentry *d_lookup(const struct dentry *parent, const struct qstr *name)
    2424             : {
    2425   958558581 :         struct dentry *dentry;
    2426   958558581 :         unsigned seq;
    2427             : 
    2428   958558581 :         do {    /* a hit is returned at once; a miss is retried only if rename_lock changed meanwhile */
    2429   958558581 :                 seq = read_seqbegin(&rename_lock);
    2430   958317472 :                 dentry = __d_lookup(parent, name);
    2431   959274332 :                 if (dentry)
    2432             :                         break;
    2433   210574297 :         } while (read_seqretry(&rename_lock, seq));
    2434   959272011 :         return dentry;
    2435             : }
    2436             : EXPORT_SYMBOL(d_lookup);
    2437             : 
    2438             : /**
    2439             :  * __d_lookup - search for a dentry (racy)
    2440             :  * @parent: parent dentry
    2441             :  * @name: qstr of name we wish to find
    2442             :  * Returns: dentry, or NULL
    2443             :  *
    2444             :  * __d_lookup is like d_lookup, however it may (rarely) return a
    2445             :  * false-negative result due to unrelated rename activity.
    2446             :  *
    2447             :  * __d_lookup is slightly faster by avoiding rename_lock read seqlock,
    2448             :  * however it must be used carefully, e.g. with a following d_lookup in
    2449             :  * the case of failure.
    2450             :  *
    2451             :  * __d_lookup callers must be commented.
    2452             :  */
    2453  1509892440 : struct dentry *__d_lookup(const struct dentry *parent, const struct qstr *name)
    2454             : {
    2455  1509892440 :         unsigned int hash = name->hash;
    2456  1509892440 :         struct hlist_bl_head *b = d_hash(hash);
    2457  1509629523 :         struct hlist_bl_node *node;
    2458  1509629523 :         struct dentry *found = NULL;
    2459  1509629523 :         struct dentry *dentry;
    2460             : 
    2461             :         /*
    2462             :          * Note: There is significant duplication with __d_lookup_rcu which is
    2463             :          * required to prevent single threaded performance regressions
    2464             :          * especially on architectures where smp_rmb (in seqcounts) is costly.
    2465             :          * Keep the two functions in sync.
    2466             :          */
    2467             : 
    2468             :         /*
    2469             :          * The hash list is protected using RCU.
    2470             :          *
    2471             :          * Take d_lock when comparing a candidate dentry, to avoid races
    2472             :          * with d_move().
    2473             :          *
    2474             :          * It is possible that concurrent renames can mess up our list
    2475             :          * walk here and result in missing our dentry, resulting in the
    2476             :          * false-negative result. d_lookup() protects against concurrent
    2477             :          * renames using rename_lock seqlock.
    2478             :          *
    2479             :          * See Documentation/filesystems/path-lookup.txt for more details.
    2480             :          */
    2481  1509629523 :         rcu_read_lock();
    2482             :         
    2483  1600085582 :         hlist_bl_for_each_entry_rcu(dentry, node, b, d_hash) {
    2484             : 
    2485  1368798919 :                 if (dentry->d_name.hash != hash)       /* unlocked hash filter, done before taking d_lock */
    2486    89615376 :                         continue;
    2487             : 
    2488  1279183543 :                 spin_lock(&dentry->d_lock);
    2489  1279992380 :                 if (dentry->d_parent != parent)
    2490       28445 :                         goto next;
    2491  1279963935 :                 if (d_unhashed(dentry))
    2492         265 :                         goto next;
    2493             : 
    2494  1279963670 :                 if (!d_same_name(dentry, parent, name))
    2495        8556 :                         goto next;
    2496             : 
    2497  1279660697 :                 dentry->d_lockref.count++;     /* take the caller's reference while d_lock is still held */
    2498  1279660697 :                 found = dentry;
    2499  1279660697 :                 spin_unlock(&dentry->d_lock);
    2500             :                 break;
    2501       37266 : next:
    2502       37266 :                 spin_unlock(&dentry->d_lock);
    2503             :         }
    2504  1511203590 :         rcu_read_unlock();
    2505             : 
    2506  1511161643 :         return found;
    2507             : }
    2508             : 
    2509             : /**
    2510             :  * d_hash_and_lookup - hash the qstr then search for a dentry
    2511             :  * @dir: Directory to search in
    2512             :  * @name: qstr of name we wish to find; its ->hash is overwritten here
    2513             :  *
    2514             :  * On lookup failure NULL is returned; on bad name - ERR_PTR(-error)
    2515             :  */
    2516    23338805 : struct dentry *d_hash_and_lookup(struct dentry *dir, struct qstr *name)
    2517             : {
    2518             :         /*
    2519             :          * Check for a fs-specific hash function. Note that we must
    2520             :          * calculate the standard hash first, as the d_op->d_hash()
    2521             :          * routine may choose to leave the hash value unchanged.
    2522             :          */
    2523    23338805 :         name->hash = full_name_hash(dir, name->name, name->len);
    2524    23338805 :         if (dir->d_flags & DCACHE_OP_HASH) {
    2525           0 :                 int err = dir->d_op->d_hash(dir, name);
    2526           0 :                 if (unlikely(err < 0)) /* a negative return from ->d_hash() is passed back as ERR_PTR() */
    2527           0 :                         return ERR_PTR(err);
    2528             :         }
    2529    23338805 :         return d_lookup(dir, name);
    2530             : }
    2531             : EXPORT_SYMBOL(d_hash_and_lookup);
    2532             : 
    2533             : /*
    2534             :  * When a file is deleted, we have two options:
    2535             :  * - turn this dentry into a negative dentry
    2536             :  * - unhash this dentry and free it.
    2537             :  *
    2538             :  * Usually, we want to just turn this into
    2539             :  * a negative dentry, but if anybody else is
    2540             :  * currently using the dentry or the inode
    2541             :  * we can't do that and we fall back on removing
    2542             :  * it from the hash queues and waiting for
    2543             :  * it to be deleted later when it has no users.
    2544             :  */
    2545             :  
    2546             : /**
    2547             :  * d_delete - delete a dentry
    2548             :  * @dentry: The dentry to delete
    2549             :  *
    2550             :  * Turn the dentry into a negative dentry if possible, otherwise
    2551             :  * remove it from the hash queues so it can be deleted later.
    2552             :  */
    2553             :  
    2554    68559567 : void d_delete(struct dentry * dentry)
    2555             : {
    2556    68559567 :         struct inode *inode = dentry->d_inode; /* dereferenced below without a NULL check */
    2557             : 
    2558    68559567 :         spin_lock(&inode->i_lock);
    2559    68580158 :         spin_lock(&dentry->d_lock);
    2560             :         /*
    2561             :          * Are we the only user?
    2562             :          */
    2563    68564159 :         if (dentry->d_lockref.count == 1) {
    2564    68249187 :                 dentry->d_flags &= ~DCACHE_CANT_MOUNT;
    2565    68249187 :                 dentry_unlink_inode(dentry);   /* NOTE(review): no unlock on this path here; presumably the callee drops d_lock and i_lock - confirm */
    2566             :         } else {
    2567      314972 :                 __d_drop(dentry);      /* other users remain: just unhash it */
    2568      314970 :                 spin_unlock(&dentry->d_lock);
    2569      314978 :                 spin_unlock(&inode->i_lock);
    2570             :         }
    2571    68576568 : }
    2572             : EXPORT_SYMBOL(d_delete);
    2573             : /* Insert @entry at the head of the d_hash() bucket chosen by its d_name.hash, under that bucket's lock. */
    2574  1102684674 : static void __d_rehash(struct dentry *entry)
    2575             : {
    2576  1102684674 :         struct hlist_bl_head *b = d_hash(entry->d_name.hash);
    2577             : 
    2578  1102284578 :         hlist_bl_lock(b);
    2579  1102908235 :         hlist_bl_add_head_rcu(&entry->d_hash, b);
    2580  1102911184 :         hlist_bl_unlock(b);
    2581  1102818467 : }
    2582             : 
    2583             : /**
    2584             :  * d_rehash     - add an entry back to the hash
    2585             :  * @entry: dentry to add to the hash
    2586             :  *
    2587             :  * Adds a dentry to the hash according to its name, holding @entry->d_lock.
    2588             :  */
    2589             :  
    2590           0 : void d_rehash(struct dentry * entry)
    2591             : {
    2592           0 :         spin_lock(&entry->d_lock);
    2593           0 :         __d_rehash(entry);
    2594           0 :         spin_unlock(&entry->d_lock);
    2595           0 : }
    2596             : EXPORT_SYMBOL(d_rehash);
    2597             : /* Spin until dir->i_dir_seq is even and we bump it by one via cmpxchg(); returns the even value that was replaced. */
    2598   913344917 : static inline unsigned start_dir_add(struct inode *dir)
    2599             : {
    2600   913344917 :         preempt_disable_nested();      /* not undone here; end_dir_add() issues the matching preempt_enable_nested() */
    2601   918514058 :         for (;;) {
    2602   918514058 :                 unsigned n = dir->i_dir_seq;
    2603   918514058 :                 if (!(n & 1) && cmpxchg(&dir->i_dir_seq, n, n + 1) == n)       /* odd n: another add is in flight, keep spinning */
    2604   913778090 :                         return n;
    2605     5028789 :                 cpu_relax();
    2606             :         }
    2607             : }
    2608             : /* Finish an add begun by start_dir_add(): store n + 2 into dir->i_dir_seq, re-enable preemption, wake everyone on @d_wait. */
    2609   913791489 : static inline void end_dir_add(struct inode *dir, unsigned int n,
    2610             :                                wait_queue_head_t *d_wait)
    2611             : {
    2612   913791489 :         smp_store_release(&dir->i_dir_seq, n + 2);     /* n was even, so the published value is even again */
    2613   913775257 :         preempt_enable_nested();
    2614   913775257 :         wake_up_all(d_wait);
    2615   913317744 : }
    2616             : /* Sleep (uninterruptibly) on dentry->d_wait until d_in_lookup() is false; d_lock is dropped only around schedule(). */
    2617     2823033 : static void d_wait_lookup(struct dentry *dentry)
    2618             : {
    2619     2823033 :         if (d_in_lookup(dentry)) {
    2620      103238 :                 DECLARE_WAITQUEUE(wait, current);
    2621      103238 :                 add_wait_queue(dentry->d_wait, &wait);
    2622      103238 :                 do {
    2623      103238 :                         set_current_state(TASK_UNINTERRUPTIBLE);
    2624      103238 :                         spin_unlock(&dentry->d_lock);
    2625      103238 :                         schedule();
    2626      103220 :                         spin_lock(&dentry->d_lock);    /* retake d_lock before re-testing the in-lookup state */
    2627      103236 :                 } while (d_in_lookup(dentry));
    2628             :         }
    2629     2823031 : }
    2630             : /* Returns an existing hashed match with a reference taken, or a new dentry marked DCACHE_PAR_LOOKUP and queued in the in-lookup hash; ERR_PTR(-ENOMEM) if d_alloc() fails. */
    2631   922479729 : struct dentry *d_alloc_parallel(struct dentry *parent,
    2632             :                                 const struct qstr *name,
    2633             :                                 wait_queue_head_t *wq)
    2634             : {
    2635   922479729 :         unsigned int hash = name->hash;
    2636   922479729 :         struct hlist_bl_head *b = in_lookup_hash(parent, hash);
    2637   922479729 :         struct hlist_bl_node *node;
    2638   922479729 :         struct dentry *new = d_alloc(parent, name);    /* allocated up front; dropped with dput() if an existing dentry is returned instead */
    2639   922987027 :         struct dentry *dentry;
    2640   922987027 :         unsigned seq, r_seq, d_seq;
    2641             : 
    2642   922987027 :         if (unlikely(!new))
    2643             :                 return ERR_PTR(-ENOMEM);
    2644             : 
    2645   922987027 : retry:
    2646   951645902 :         rcu_read_lock();
    2647   951605212 :         seq = smp_load_acquire(&parent->d_inode->i_dir_seq);   /* sampled now, re-checked under the bucket lock below */
    2648   951605212 :         r_seq = read_seqbegin(&rename_lock);
    2649   951612655 :         dentry = __d_lookup_rcu(parent, name, &d_seq);
    2650   951537754 :         if (unlikely(dentry)) {        /* found in the dcache hash */
    2651     6559723 :                 if (!lockref_get_not_dead(&dentry->d_lockref)) {
    2652     1453569 :                         rcu_read_unlock();
    2653     1453567 :                         goto retry;
    2654             :                 }
    2655     5117323 :                 if (read_seqcount_retry(&dentry->d_seq, d_seq)) {      /* changed since the lookup: drop our reference and start over */
    2656           0 :                         rcu_read_unlock();
    2657           0 :                         dput(dentry);
    2658           0 :                         goto retry;
    2659             :                 }
    2660     5117274 :                 rcu_read_unlock();
    2661     5116473 :                 dput(new);
    2662     5116473 :                 return dentry;
    2663             :         }
    2664   944978031 :         if (unlikely(read_seqretry(&rename_lock, r_seq))) {    /* the miss raced with a rename, so it cannot be trusted */
    2665        2466 :                 rcu_read_unlock();
    2666        2466 :                 goto retry;
    2667             :         }
    2668             : 
    2669   944946348 :         if (unlikely(seq & 1)) {       /* odd i_dir_seq: start_dir_add() ran without its end_dir_add() yet */
    2670    25583662 :                 rcu_read_unlock();
    2671    25595304 :                 goto retry;
    2672             :         }
    2673             : 
    2674   919362686 :         hlist_bl_lock(b);
    2675   919562395 :         if (unlikely(READ_ONCE(parent->d_inode->i_dir_seq) != seq)) {
    2676     1605368 :                 hlist_bl_unlock(b);
    2677     1605942 :                 rcu_read_unlock();
    2678     1606021 :                 goto retry;
    2679             :         }
    2680             :         /*
    2681             :          * No changes for the parent since the beginning of d_lookup().
    2682             :          * Since all removals from the chain happen with hlist_bl_lock(),
    2683             :          * any potential in-lookup matches are going to stay here until
    2684             :          * we unlock the chain.  All fields are stable in everything
    2685             :          * we encounter.
    2686             :          */
    2687   917968499 :         hlist_bl_for_each_entry(dentry, node, b, d_u.d_in_lookup_hash) {
    2688     2843060 :                 if (dentry->d_name.hash != hash)
    2689       11461 :                         continue;
    2690     2831599 :                 if (dentry->d_parent != parent)
    2691           0 :                         continue;
    2692     2831599 :                 if (!d_same_name(dentry, parent, name))
    2693          11 :                         continue;
    2694     2823396 :                 hlist_bl_unlock(b);
    2695             :                 /* now we can try to grab a reference */
    2696     2823180 :                 if (!lockref_get_not_dead(&dentry->d_lockref)) {
    2697         363 :                         rcu_read_unlock();
    2698         363 :                         goto retry;
    2699             :                 }
    2700             : 
    2701     2823028 :                 rcu_read_unlock();
    2702             :                 /*
    2703             :                  * somebody is likely to be still doing lookup for it;
    2704             :                  * wait for them to finish
    2705             :                  */
    2706     2823027 :                 spin_lock(&dentry->d_lock);
    2707     2823033 :                 d_wait_lookup(dentry);
    2708             :                 /*
    2709             :                  * it's not in-lookup anymore; in principle we should repeat
    2710             :                  * everything from dcache lookup, but it's likely to be what
    2711             :                  * d_lookup() would've found anyway.  If it is, just return it;
    2712             :                  * otherwise we really have to repeat the whole thing.
    2713             :                  */
    2714     2823030 :                 if (unlikely(dentry->d_name.hash != hash))
    2715           0 :                         goto mismatch;
    2716     2823030 :                 if (unlikely(dentry->d_parent != parent))
    2717           0 :                         goto mismatch;
    2718     2823030 :                 if (unlikely(d_unhashed(dentry)))
    2719        1154 :                         goto mismatch;
    2720     2821876 :                 if (unlikely(!d_same_name(dentry, parent, name)))
    2721           0 :                         goto mismatch;
    2722             :                 /* OK, it *is* a hashed match; return it */
    2723     2821877 :                 spin_unlock(&dentry->d_lock);
    2724     2821878 :                 dput(new);
    2725     2821878 :                 return dentry;
    2726             :         }
    2727   915125439 :         rcu_read_unlock();
    2728             :         /* we can't take ->d_lock here; it's OK, though. */
    2729   915114842 :         new->d_flags |= DCACHE_PAR_LOOKUP;
    2730   915114842 :         new->d_wait = wq;      /* the queue d_wait_lookup() callers will sleep on */
    2731   915114842 :         hlist_bl_add_head_rcu(&new->d_u.d_in_lookup_hash, b);  /* the bucket lock taken above is still held */
    2732   914851386 :         hlist_bl_unlock(b);
    2733   914851386 :         return new;
    2734        1154 : mismatch:
    2735        1154 :         spin_unlock(&dentry->d_lock);
    2736        1154 :         dput(dentry);
    2737        1154 :         goto retry;
    2738             : }
    2739             : EXPORT_SYMBOL(d_alloc_parallel);
    2740             : 
    2741             : /*
    2742             :  * - Remove the dentry from the in-lookup hash and clear DCACHE_PAR_LOOKUP
    2743             :  * - Retrieve and clear the waitqueue head in dentry
    2744             :  * - Return the waitqueue head; the caller must hold dentry->d_lock
    2745             :  */
    2746   914988096 : static wait_queue_head_t *__d_lookup_unhash(struct dentry *dentry)
    2747             : {
    2748   914988096 :         wait_queue_head_t *d_wait;
    2749   914988096 :         struct hlist_bl_head *b;
    2750             : 
    2751   914988096 :         lockdep_assert_held(&dentry->d_lock);
    2752             : 
    2753   914988096 :         b = in_lookup_hash(dentry->d_parent, dentry->d_name.hash);
    2754   914988096 :         hlist_bl_lock(b);
    2755   915158712 :         dentry->d_flags &= ~DCACHE_PAR_LOOKUP;
    2756   915158712 :         __hlist_bl_del(&dentry->d_u.d_in_lookup_hash);
    2757   915069290 :         d_wait = dentry->d_wait;
    2758   915069290 :         dentry->d_wait = NULL;
    2759   915069290 :         hlist_bl_unlock(b);
    2760   915017155 :         INIT_HLIST_NODE(&dentry->d_u.d_alias); /* NOTE(review): presumably d_u is a union shared with d_in_lookup_hash - confirm against struct dentry */
    2761   915017155 :         INIT_LIST_HEAD(&dentry->d_lru);
    2762   915017155 :         return d_wait;
    2763             : }
    2764             : /* Take d_lock, run __d_lookup_unhash() on @dentry and wake every waiter on the waitqueue it returns. */
    2765     1250007 : void __d_lookup_unhash_wake(struct dentry *dentry)
    2766             : {
    2767     1250007 :         spin_lock(&dentry->d_lock);
    2768     1250001 :         wake_up_all(__d_lookup_unhash(dentry));
    2769     1249983 :         spin_unlock(&dentry->d_lock);
    2770     1249987 : }
    2771             : EXPORT_SYMBOL(__d_lookup_unhash_wake);
    2772             : 
    2773             : /* inode->i_lock held if inode is non-NULL; it is released here before returning */
    2774             : 
    2775  1034396901 : static inline void __d_add(struct dentry *dentry, struct inode *inode)
    2776             : {
    2777  1034396901 :         wait_queue_head_t *d_wait;
    2778  1034396901 :         struct inode *dir = NULL;
    2779  1034396901 :         unsigned n;
    2780  1034396901 :         spin_lock(&dentry->d_lock);
    2781  1034616334 :         if (unlikely(d_in_lookup(dentry))) {   /* n and d_wait are set only on this path; dir != NULL guards their use below */
    2782   909721955 :                 dir = dentry->d_parent->d_inode;
    2783   909721955 :                 n = start_dir_add(dir);
    2784   910060454 :                 d_wait = __d_lookup_unhash(dentry);
    2785             :         }
    2786  1034986340 :         if (inode) {
    2787    74972686 :                 unsigned add_flags = d_flags_for_inode(inode);
    2788    74966176 :                 hlist_add_head(&dentry->d_u.d_alias, &inode->i_dentry);
    2789    74966176 :                 raw_write_seqcount_begin(&dentry->d_seq);      /* inode and type are set inside a d_seq write section */
    2790    74966510 :                 __d_set_inode_and_type(dentry, inode, add_flags);
    2791    74966539 :                 raw_write_seqcount_end(&dentry->d_seq);
    2792    74966432 :                 fsnotify_update_flags(dentry);
    2793             :         }
    2794  1034978292 :         __d_rehash(dentry);
    2795  1035020539 :         if (dir)
    2796   910112372 :                 end_dir_add(dir, n, d_wait);
    2797  1034504256 :         spin_unlock(&dentry->d_lock);
    2798  1034708943 :         if (inode)
    2799    74973584 :                 spin_unlock(&inode->i_lock);   /* drops the lock the caller took */
    2800  1034699806 : }
    2801             : 
    2802             : /**
    2803             :  * d_add - add dentry to hash queues
    2804             :  * @entry: dentry to add
    2805             :  * @inode: The inode to attach to this dentry (may be NULL)
    2806             :  *
    2807             :  * This adds the entry to the hash queues and initializes @inode.
    2808             :  * The entry was actually filled in earlier during d_alloc().
    2809             :  */
    2810             : 
    2811   802790881 : void d_add(struct dentry *entry, struct inode *inode)
    2812             : {
    2813   802790881 :         if (inode) {
    2814         124 :                 security_d_instantiate(entry, inode);
    2815         124 :                 spin_lock(&inode->i_lock);     /* taken here, released inside __d_add() */
    2816             :         }
    2817   802790881 :         __d_add(entry, inode);
    2818   802901287 : }
    2819             : EXPORT_SYMBOL(d_add);
    2820             : 
    2821             : /**
    2822             :  * d_exact_alias - find and hash an exact unhashed alias
    2823             :  * @entry: dentry to add
    2824             :  * @inode: The inode to go with this dentry
    2825             :  *
    2826             :  * If an unhashed dentry with the same name/parent and desired
    2827             :  * inode already exists, hash and return it.  Otherwise, return
    2828             :  * NULL.
    2829             :  *
    2830             :  * Parent directory should be locked.
    2831             :  */
    2832       30206 : struct dentry *d_exact_alias(struct dentry *entry, struct inode *inode)
    2833             : {
    2834       30206 :         struct dentry *alias;
    2835       30206 :         unsigned int hash = entry->d_name.hash;
    2836             : 
    2837       30206 :         spin_lock(&inode->i_lock);
    2838       60412 :         hlist_for_each_entry(alias, &inode->i_dentry, d_u.d_alias) {
    2839             :                 /*
    2840             :                  * Don't need alias->d_lock here, because aliases with
    2841             :                  * d_parent == entry->d_parent are not subject to name or
    2842             :                  * parent changes, because the parent inode i_mutex is held.
    2843             :                  */
    2844           0 :                 if (alias->d_name.hash != hash)
    2845           0 :                         continue;
    2846           0 :                 if (alias->d_parent != entry->d_parent)
    2847           0 :                         continue;
    2848           0 :                 if (!d_same_name(alias, entry->d_parent, &entry->d_name))
    2849           0 :                         continue;
    2850           0 :                 spin_lock(&alias->d_lock);     /* only the first name/parent match is examined; we return right after */
    2851           0 :                 if (!d_unhashed(alias)) {
    2852           0 :                         spin_unlock(&alias->d_lock);
    2853           0 :                         alias = NULL;   /* the match is already hashed: report "none" */
    2854             :                 } else {
    2855           0 :                         __dget_dlock(alias);    /* reference for the caller, taken under d_lock */
    2856           0 :                         __d_rehash(alias);
    2857           0 :                         spin_unlock(&alias->d_lock);
    2858             :                 }
    2859           0 :                 spin_unlock(&inode->i_lock);
    2860           0 :                 return alias;
    2861             :         }
    2862       30206 :         spin_unlock(&inode->i_lock);
    2863       30206 :         return NULL;
    2864             : }
    2865             : EXPORT_SYMBOL(d_exact_alias);
    2866             : 
    2867    13158267 : static void swap_names(struct dentry *dentry, struct dentry *target)
    2868             : {
    2869    13158267 :         if (unlikely(dname_external(target))) {
    2870        1640 :                 if (unlikely(dname_external(dentry))) {
    2871             :                         /*
    2872             :                          * Both external: swap the pointers
    2873             :                          */
    2874         437 :                         swap(target->d_name.name, dentry->d_name.name);
    2875             :                 } else {
    2876             :                         /*
    2877             :                          * dentry:internal, target:external.  Steal target's
    2878             :                          * storage and make target internal.
    2879             :                          */
    2880        2406 :                         memcpy(target->d_iname, dentry->d_name.name,
    2881             :                                         dentry->d_name.len + 1);
    2882        1203 :                         dentry->d_name.name = target->d_name.name;
    2883        1203 :                         target->d_name.name = target->d_iname;
    2884             :                 }
    2885             :         } else {
    2886    13156627 :                 if (unlikely(dname_external(dentry))) {
    2887             :                         /*
    2888             :                          * dentry:external, target:internal.  Give dentry's
    2889             :                          * storage to target and make dentry internal
    2890             :                          */
    2891        2380 :                         memcpy(dentry->d_iname, target->d_name.name,
    2892             :                                         target->d_name.len + 1);
    2893        1190 :                         target->d_name.name = dentry->d_name.name;
    2894        1190 :                         dentry->d_name.name = dentry->d_iname;
    2895             :                 } else {
    2896             :                         /*
    2897             :                          * Both are internal.
    2898             :                          */
    2899             :                         unsigned int i;
    2900             :                         BUILD_BUG_ON(!IS_ALIGNED(DNAME_INLINE_LEN, sizeof(long)));
    2901    65777185 :                         for (i = 0; i < DNAME_INLINE_LEN / sizeof(long); i++) {
    2902    52621748 :                                 swap(((long *) &dentry->d_iname)[i],
    2903             :                                      ((long *) &target->d_iname)[i]);
    2904             :                         }
    2905             :                 }
    2906             :         }
    2907    13158267 :         swap(dentry->d_name.hash_len, target->d_name.hash_len);
    2908    13158267 : }
    2909             : 
    2910    41508905 : static void copy_name(struct dentry *dentry, struct dentry *target)
    2911             : {
    2912    41508905 :         struct external_name *old_name = NULL;
    2913    41508905 :         if (unlikely(dname_external(dentry)))
    2914     1122027 :                 old_name = external_name(dentry);
    2915    41508905 :         if (unlikely(dname_external(target))) {
    2916     1049071 :                 atomic_inc(&external_name(target)->u.count);
    2917     1049071 :                 dentry->d_name = target->d_name;
    2918             :         } else {
    2919    80919668 :                 memcpy(dentry->d_iname, target->d_name.name,
    2920             :                                 target->d_name.len + 1);
    2921    40459834 :                 dentry->d_name.name = dentry->d_iname;
    2922    40459834 :                 dentry->d_name.hash_len = target->d_name.hash_len;
    2923             :         }
    2924    41508905 :         if (old_name && likely(atomic_dec_and_test(&old_name->u.count)))
    2925           0 :                 kfree_rcu(old_name, u.head);
    2926    41508905 : }
    2927             : 
    2928             : /*
    2929             :  * __d_move - move a dentry
    2930             :  * @dentry: entry to move
    2931             :  * @target: new dentry
    2932             :  * @exchange: exchange the two dentries
    2933             :  *
    2934             :  * Update the dcache to reflect the move of a file name. Negative
    2935             :  * dcache entries should not be moved in this way. Caller must hold
    2936             :  * rename_lock, the i_rwsem of the source and target directories,
    2937             :  * and the sb->s_vfs_rename_mutex if they differ. See lock_rename().
    2938             :  */
    2939    54667172 : static void __d_move(struct dentry *dentry, struct dentry *target,
    2940             :                      bool exchange)
    2941             : {
    2942    54667172 :         struct dentry *old_parent, *p;
    2943    54667172 :         wait_queue_head_t *d_wait;
    2944    54667172 :         struct inode *dir = NULL;
    2945    54667172 :         unsigned n;
    2946             : 
    2947    54667172 :         WARN_ON(!dentry->d_inode);
    2948    54667172 :         if (WARN_ON(dentry == target))
    2949             :                 return;
    2950             : 
    2951    54667172 :         BUG_ON(d_ancestor(target, dentry));
    2952    54667172 :         old_parent = dentry->d_parent;
    2953    54667172 :         p = d_ancestor(old_parent, target);
    2954    54667172 :         if (IS_ROOT(dentry)) {
    2955     3704036 :                 BUG_ON(p);
    2956     3704036 :                 spin_lock(&target->d_parent->d_lock);
    2957    50963136 :         } else if (!p) {
    2958             :                 /* target is not a descendent of dentry->d_parent */
    2959    42441038 :                 spin_lock(&target->d_parent->d_lock);
    2960    42441038 :                 spin_lock_nested(&old_parent->d_lock, DENTRY_D_LOCK_NESTED);
    2961             :         } else {
    2962     8522098 :                 BUG_ON(p == dentry);
    2963     8522098 :                 spin_lock(&old_parent->d_lock);
    2964     8522098 :                 if (p != target)
    2965     1784556 :                         spin_lock_nested(&target->d_parent->d_lock,
    2966             :                                         DENTRY_D_LOCK_NESTED);
    2967             :         }
    2968    54667172 :         spin_lock_nested(&dentry->d_lock, 2);
    2969    54667172 :         spin_lock_nested(&target->d_lock, 3);
    2970             : 
    2971    54667172 :         if (unlikely(d_in_lookup(target))) {
    2972     3704036 :                 dir = target->d_parent->d_inode;
    2973     3704036 :                 n = start_dir_add(dir);
    2974     3704036 :                 d_wait = __d_lookup_unhash(target);
    2975             :         }
    2976             : 
    2977    54667172 :         write_seqcount_begin(&dentry->d_seq);
    2978    54667172 :         write_seqcount_begin_nested(&target->d_seq, DENTRY_D_LOCK_NESTED);
    2979             : 
    2980             :         /* unhash both */
    2981    54667172 :         if (!d_unhashed(dentry))
    2982    50963136 :                 ___d_drop(dentry);
    2983    54667172 :         if (!d_unhashed(target))
    2984    50963136 :                 ___d_drop(target);
    2985             : 
    2986             :         /* ... and switch them in the tree */
    2987    54667172 :         dentry->d_parent = target->d_parent;
    2988    54667172 :         if (!exchange) {
    2989    41508905 :                 copy_name(dentry, target);
    2990    41508905 :                 target->d_hash.pprev = NULL;
    2991    41508905 :                 dentry->d_parent->d_lockref.count++;
    2992    41508905 :                 if (dentry != old_parent) /* wasn't IS_ROOT */
    2993    37804869 :                         WARN_ON(!--old_parent->d_lockref.count);
    2994             :         } else {
    2995    13158267 :                 target->d_parent = old_parent;
    2996    13158267 :                 swap_names(dentry, target);
    2997    13158267 :                 list_move(&target->d_child, &target->d_parent->d_subdirs);
    2998    13158267 :                 __d_rehash(target);
    2999    13158267 :                 fsnotify_update_flags(target);
    3000             :         }
    3001    54667172 :         list_move(&dentry->d_child, &dentry->d_parent->d_subdirs);
    3002    54667172 :         __d_rehash(dentry);
    3003    54667172 :         fsnotify_update_flags(dentry);
    3004    54667172 :         fscrypt_handle_d_move(dentry);
    3005             : 
    3006    54667172 :         write_seqcount_end(&target->d_seq);
    3007    54667172 :         write_seqcount_end(&dentry->d_seq);
    3008             : 
    3009    54667172 :         if (dir)
    3010     3704036 :                 end_dir_add(dir, n, d_wait);
    3011             : 
    3012    54667172 :         if (dentry->d_parent != old_parent)
    3013    47929630 :                 spin_unlock(&dentry->d_parent->d_lock);
    3014    54667172 :         if (dentry != old_parent)
    3015    50963136 :                 spin_unlock(&old_parent->d_lock);
    3016    54667172 :         spin_unlock(&target->d_lock);
    3017    54667172 :         spin_unlock(&dentry->d_lock);
    3018             : }
    3019             : 
    3020             : /*
    3021             :  * d_move - move a dentry
    3022             :  * @dentry: entry to move
    3023             :  * @target: new dentry
    3024             :  *
    3025             :  * Update the dcache to reflect the move of a file name. Negative
    3026             :  * dcache entries should not be moved in this way. See the locking
    3027             :  * requirements for __d_move.
    3028             :  */
    3029    37804259 : void d_move(struct dentry *dentry, struct dentry *target)
    3030             : {
    3031    37804259 :         write_seqlock(&rename_lock);
    3032    37804869 :         __d_move(dentry, target, false);
    3033    37804869 :         write_sequnlock(&rename_lock);
    3034    37804869 : }
    3035             : EXPORT_SYMBOL(d_move);
    3036             : 
    3037             : /*
    3038             :  * d_exchange - exchange two dentries
    3039             :  * @dentry1: first dentry
    3040             :  * @dentry2: second dentry
    3041             :  */
    3042    13158223 : void d_exchange(struct dentry *dentry1, struct dentry *dentry2)
    3043             : {
    3044    13158223 :         write_seqlock(&rename_lock);
    3045             : 
    3046    13158267 :         WARN_ON(!dentry1->d_inode);
    3047    13158267 :         WARN_ON(!dentry2->d_inode);
    3048    13158267 :         WARN_ON(IS_ROOT(dentry1));
    3049    13158267 :         WARN_ON(IS_ROOT(dentry2));
    3050             : 
    3051    13158267 :         __d_move(dentry1, dentry2, true);
    3052             : 
    3053    13158267 :         write_sequnlock(&rename_lock);
    3054    13158267 : }
    3055             : 
    3056             : /**
    3057             :  * d_ancestor - search for an ancestor
    3058             :  * @p1: ancestor dentry
    3059             :  * @p2: child dentry
    3060             :  *
    3061             :  * Returns the ancestor dentry of p2 which is a child of p1, if p1 is
    3062             :  * an ancestor of p2, else NULL.
    3063             :  */
    3064    90428600 : struct dentry *d_ancestor(struct dentry *p1, struct dentry *p2)
    3065             : {
    3066   145095772 :         struct dentry *p;
    3067             : 
    3068 10619693829 :         for (p = p2; !IS_ROOT(p); p = p->d_parent) {
    3069 10428589952 :                 if (p->d_parent == p1)
    3070     4856518 :                         return p;
    3071             :         }
    3072             :         return NULL;
    3073             : }
    3074             : 
    3075             : /*
    3076             :  * This helper attempts to cope with remotely renamed directories
    3077             :  *
    3078             :  * It assumes that the caller is already holding
    3079             :  * dentry->d_parent->d_inode->i_rwsem, and rename_lock
    3080             :  *
    3081             :  * Note: If ever the locking in lock_rename() changes, then please
    3082             :  * remember to update this too...
    3083             :  */
    3084           0 : static int __d_unalias(struct inode *inode,
    3085             :                 struct dentry *dentry, struct dentry *alias)
    3086             : {
    3087           0 :         struct mutex *m1 = NULL;
    3088           0 :         struct rw_semaphore *m2 = NULL;
    3089           0 :         int ret = -ESTALE;
    3090             : 
    3091             :         /* If alias and dentry share a parent, then no extra locks required */
    3092           0 :         if (alias->d_parent == dentry->d_parent)
    3093           0 :                 goto out_unalias;
    3094             : 
    3095             :         /* See lock_rename() */
    3096           0 :         if (!mutex_trylock(&dentry->d_sb->s_vfs_rename_mutex))
    3097           0 :                 goto out_err;
    3098           0 :         m1 = &dentry->d_sb->s_vfs_rename_mutex;
    3099           0 :         if (!inode_trylock_shared(alias->d_parent->d_inode))
    3100           0 :                 goto out_err;
    3101           0 :         m2 = &alias->d_parent->d_inode->i_rwsem;
    3102           0 : out_unalias:
    3103           0 :         __d_move(alias, dentry, false);
    3104           0 :         ret = 0;
    3105           0 : out_err:
    3106           0 :         if (m2)
    3107           0 :                 up_read(m2);
    3108           0 :         if (m1)
    3109           0 :                 mutex_unlock(m1);
    3110           0 :         return ret;
    3111             : }
    3112             : 
    3113             : /**
    3114             :  * d_splice_alias - splice a disconnected dentry into the tree if one exists
    3115             :  * @inode:  the inode which may have a disconnected dentry
    3116             :  * @dentry: a negative dentry which we want to point to the inode.
    3117             :  *
    3118             :  * If inode is a directory and has an IS_ROOT alias, then d_move that in
    3119             :  * place of the given dentry and return it, else simply d_add the inode
    3120             :  * to the dentry and return NULL.
    3121             :  *
    3122             :  * If a non-IS_ROOT directory is found, the filesystem is corrupt, and
    3123             :  * we should error out: directories can't have multiple aliases.
    3124             :  *
    3125             :  * This is needed in the lookup routine of any filesystem that is exportable
    3126             :  * (via knfsd) so that we can build dcache paths to directories effectively.
    3127             :  *
    3128             :  * If a dentry was found and moved, then it is returned.  Otherwise NULL
    3129             :  * is returned.  This matches the expected return value of ->lookup.
    3130             :  *
    3131             :  * Cluster filesystems may call this function with a negative, hashed dentry.
    3132             :  * In that case, we know that the inode will be a regular file, and also this
    3133             :  * will only occur during atomic_open. So we need to check for the dentry
    3134             :  * being already hashed only in the final case.
    3135             :  */
    3136   235671416 : struct dentry *d_splice_alias(struct inode *inode, struct dentry *dentry)
    3137             : {
    3138   235671416 :         if (IS_ERR(inode))
    3139             :                 return ERR_CAST(inode);
    3140             : 
    3141   235606817 :         BUG_ON(!d_unhashed(dentry));
    3142             : 
    3143   235606817 :         if (!inode)
    3144   156954051 :                 goto out;
    3145             : 
    3146    78652766 :         security_d_instantiate(dentry, inode);
    3147    78652766 :         spin_lock(&inode->i_lock);
    3148    78662899 :         if (S_ISDIR(inode->i_mode)) {
    3149    25155529 :                 struct dentry *new = __d_find_any_alias(inode);
    3150    25155242 :                 if (unlikely(new)) {
    3151             :                         /* The reference to new ensures it remains an alias */
    3152     3701455 :                         spin_unlock(&inode->i_lock);
    3153     3701326 :                         write_seqlock(&rename_lock);
    3154     3704036 :                         if (unlikely(d_ancestor(new, dentry))) {
    3155           0 :                                 write_sequnlock(&rename_lock);
    3156           0 :                                 dput(new);
    3157           0 :                                 new = ERR_PTR(-ELOOP);
    3158           0 :                                 pr_warn_ratelimited(
    3159             :                                         "VFS: Lookup of '%s' in %s %s"
    3160             :                                         " would have caused loop\n",
    3161             :                                         dentry->d_name.name,
    3162             :                                         inode->i_sb->s_type->name,
    3163             :                                         inode->i_sb->s_id);
    3164     3704036 :                         } else if (!IS_ROOT(new)) {
    3165           0 :                                 struct dentry *old_parent = dget(new->d_parent);
    3166           0 :                                 int err = __d_unalias(inode, dentry, new);
    3167           0 :                                 write_sequnlock(&rename_lock);
    3168           0 :                                 if (err) {
    3169           0 :                                         dput(new);
    3170           0 :                                         new = ERR_PTR(err);
    3171             :                                 }
    3172           0 :                                 dput(old_parent);
    3173             :                         } else {
    3174     3704036 :                                 __d_move(new, dentry, false);
    3175     3704036 :                                 write_sequnlock(&rename_lock);
    3176             :                         }
    3177     3704036 :                         iput(inode);
    3178     3704036 :                         return new;
    3179             :                 }
    3180             :         }
    3181    74961157 : out:
    3182   231915208 :         __d_add(dentry, inode);
    3183   231915208 :         return NULL;
    3184             : }
    3185             : EXPORT_SYMBOL(d_splice_alias);
    3186             : 
    3187             : /*
    3188             :  * Test whether new_dentry is a subdirectory of old_dentry.
    3189             :  *
    3190             :  * Trivially implemented using the dcache structure
    3191             :  */
    3192             : 
    3193             : /**
    3194             :  * is_subdir - is new dentry a subdirectory of old_dentry
    3195             :  * @new_dentry: new dentry
    3196             :  * @old_dentry: old dentry
    3197             :  *
    3198             :  * Returns true if new_dentry is old_dentry or a subdirectory of it (at any depth).
    3199             :  * Returns false otherwise.
    3200             :  * Caller must ensure that "new_dentry" is pinned before calling is_subdir()
    3201             :  */
    3202             :   
    3203    14710432 : bool is_subdir(struct dentry *new_dentry, struct dentry *old_dentry)
    3204             : {
    3205    14710432 :         bool result;
    3206    14710432 :         unsigned seq;
    3207             : 
    3208    14710432 :         if (new_dentry == old_dentry)
    3209             :                 return true;
    3210             : 
    3211    14701998 :         do {
    3212             :                 /* for restarting inner loop in case of seq retry */
    3213    14701998 :                 seq = read_seqbegin(&rename_lock);
    3214             :                 /*
    3215             :                  * Need rcu_read_lock() to protect against the d_parent trashing
    3216             :                  * due to d_move
    3217             :                  */
    3218    14702716 :                 rcu_read_lock();
    3219    14702465 :                 if (d_ancestor(old_dentry, new_dentry))
    3220             :                         result = true;
    3221             :                 else
    3222     1015545 :                         result = false;
    3223    14702465 :                 rcu_read_unlock();
    3224    14702741 :         } while (read_seqretry(&rename_lock, seq));
    3225             : 
    3226             :         return result;
    3227             : }
    3228             : EXPORT_SYMBOL(is_subdir);
    3229             : 
    3230         960 : static enum d_walk_ret d_genocide_kill(void *data, struct dentry *dentry)
    3231             : {
    3232         960 :         struct dentry *root = data;
    3233         960 :         if (dentry != root) {
    3234         213 :                 if (d_unhashed(dentry) || !dentry->d_inode)
    3235             :                         return D_WALK_SKIP;
    3236             : 
    3237         213 :                 if (!(dentry->d_flags & DCACHE_GENOCIDE)) {
    3238         213 :                         dentry->d_flags |= DCACHE_GENOCIDE;
    3239         213 :                         dentry->d_lockref.count--;
    3240             :                 }
    3241             :         }
    3242             :         return D_WALK_CONTINUE;
    3243             : }
    3244             : 
    3245         747 : void d_genocide(struct dentry *parent)
    3246             : {
    3247         747 :         d_walk(parent, parent, d_genocide_kill);
    3248         747 : }
    3249             : 
    3250             : EXPORT_SYMBOL(d_genocide);
    3251             : 
    3252     8655616 : void d_tmpfile(struct file *file, struct inode *inode)
    3253             : {
    3254     8655616 :         struct dentry *dentry = file->f_path.dentry;
    3255             : 
    3256     8655616 :         inode_dec_link_count(inode);
    3257    17914656 :         BUG_ON(dentry->d_name.name != dentry->d_iname ||
    3258             :                 !hlist_unhashed(&dentry->d_u.d_alias) ||
    3259             :                 !d_unlinked(dentry));
    3260     8957328 :         spin_lock(&dentry->d_parent->d_lock);
    3261     9003617 :         spin_lock_nested(&dentry->d_lock, DENTRY_D_LOCK_NESTED);
    3262     9005166 :         dentry->d_name.len = sprintf(dentry->d_iname, "#%llu",
    3263     9005166 :                                 (unsigned long long)inode->i_ino);
    3264     9005166 :         spin_unlock(&dentry->d_lock);
    3265     8326284 :         spin_unlock(&dentry->d_parent->d_lock);
    3266     8607888 :         d_instantiate(dentry, inode);
    3267     8892461 : }
    3268             : EXPORT_SYMBOL(d_tmpfile);
    3269             : 
    3270             : static __initdata unsigned long dhash_entries;
    3271           0 : static int __init set_dhash_entries(char *str)
    3272             : {
    3273           0 :         if (!str)
    3274             :                 return 0;
    3275           0 :         dhash_entries = simple_strtoul(str, &str, 0);
    3276           0 :         return 1;
    3277             : }
    3278             : __setup("dhash_entries=", set_dhash_entries);
    3279             : 
    3280           0 : static void __init dcache_init_early(void)
    3281             : {
    3282             :         /* If hashes are distributed across NUMA nodes, defer
    3283             :          * hash allocation until vmalloc space is available.
    3284             :          */
    3285           0 :         if (hashdist)
    3286             :                 return;
    3287             : 
    3288           0 :         dentry_hashtable =
    3289           0 :                 alloc_large_system_hash("Dentry cache",
    3290             :                                         sizeof(struct hlist_bl_head),
    3291             :                                         dhash_entries,
    3292             :                                         13,
    3293             :                                         HASH_EARLY | HASH_ZERO,
    3294             :                                         &d_hash_shift,
    3295             :                                         NULL,
    3296             :                                         0,
    3297             :                                         0);
    3298           0 :         d_hash_shift = 32 - d_hash_shift;
    3299             : }
    3300             : 
    3301           0 : static void __init dcache_init(void)
    3302             : {
    3303             :         /*
    3304             :          * A constructor could be added for stable state like the lists,
    3305             :          * but it is probably not worth it because of the cache nature
    3306             :          * of the dcache.
    3307             :          */
    3308           0 :         dentry_cache = KMEM_CACHE_USERCOPY(dentry,
    3309             :                 SLAB_RECLAIM_ACCOUNT|SLAB_PANIC|SLAB_MEM_SPREAD|SLAB_ACCOUNT,
    3310             :                 d_iname);
    3311             : 
    3312             :         /* Hash may have been set up in dcache_init_early */
    3313           0 :         if (!hashdist)
    3314             :                 return;
    3315             : 
    3316           0 :         dentry_hashtable =
    3317           0 :                 alloc_large_system_hash("Dentry cache",
    3318             :                                         sizeof(struct hlist_bl_head),
    3319             :                                         dhash_entries,
    3320             :                                         13,
    3321             :                                         HASH_ZERO,
    3322             :                                         &d_hash_shift,
    3323             :                                         NULL,
    3324             :                                         0,
    3325             :                                         0);
    3326           0 :         d_hash_shift = 32 - d_hash_shift;
    3327             : }
    3328             : 
    3329             : /* SLAB cache for __getname() consumers */
    3330             : struct kmem_cache *names_cachep __read_mostly;
    3331             : EXPORT_SYMBOL(names_cachep);
    3332             : 
    3333           0 : void __init vfs_caches_init_early(void)
    3334             : {
    3335           0 :         int i;
    3336             : 
    3337           0 :         for (i = 0; i < ARRAY_SIZE(in_lookup_hashtable); i++)
    3338           0 :                 INIT_HLIST_BL_HEAD(&in_lookup_hashtable[i]);
    3339             : 
    3340           0 :         dcache_init_early();
    3341           0 :         inode_init_early();
    3342           0 : }
    3343             : 
    3344           0 : void __init vfs_caches_init(void)
    3345             : {
    3346           0 :         names_cachep = kmem_cache_create_usercopy("names_cache", PATH_MAX, 0,
    3347             :                         SLAB_HWCACHE_ALIGN|SLAB_PANIC, 0, PATH_MAX, NULL);
    3348             : 
    3349           0 :         dcache_init();
    3350           0 :         inode_init();
    3351           0 :         files_init();
    3352           0 :         files_maxfiles_init();
    3353           0 :         mnt_init();
    3354           0 :         bdev_cache_init();
    3355           0 :         chrdev_init();
    3356           0 : }

Generated by: LCOV version 1.14