hammer - Fix bugs, fix serious snapshot bug, flush adjustments
[dragonfly.git] / sys / vfs / hammer2 / hammer2_xops.c
1 /*
2  * Copyright (c) 2011-2018 The DragonFly Project.  All rights reserved.
3  *
4  * This code is derived from software contributed to The DragonFly Project
5  * by Matthew Dillon <dillon@dragonflybsd.org>
6  * by Venkatesh Srinivas <vsrinivas@dragonflybsd.org>
7  * by Daniel Flores (GSOC 2013 - mentored by Matthew Dillon, compression) 
8  *
9  * Redistribution and use in source and binary forms, with or without
10  * modification, are permitted provided that the following conditions
11  * are met:
12  *
13  * 1. Redistributions of source code must retain the above copyright
14  *    notice, this list of conditions and the following disclaimer.
15  * 2. Redistributions in binary form must reproduce the above copyright
16  *    notice, this list of conditions and the following disclaimer in
17  *    the documentation and/or other materials provided with the
18  *    distribution.
19  * 3. Neither the name of The DragonFly Project nor the names of its
20  *    contributors may be used to endorse or promote products derived
21  *    from this software without specific, prior written permission.
22  *
23  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
24  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
25  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
26  * FOR A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE
27  * COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
28  * INCIDENTAL, SPECIAL, EXEMPLARY OR CONSEQUENTIAL DAMAGES (INCLUDING,
29  * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
30  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
31  * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
32  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
33  * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
34  * SUCH DAMAGE.
35  */
36 /*
37  * Per-node backend for kernel filesystem interface.
38  *
39  * This executes a VOP concurrently on multiple nodes, each node via its own
40  * thread, and competes to advance the original request.  The original
41  * request is retired the moment all requirements are met, even if the
42  * operation is still in-progress on some nodes.
43  */
44 #include <sys/param.h>
45 #include <sys/systm.h>
46 #include <sys/kernel.h>
47 #include <sys/fcntl.h>
48 #include <sys/buf.h>
49 #include <sys/proc.h>
50 #include <sys/namei.h>
51 #include <sys/mount.h>
52 #include <sys/vnode.h>
53 #include <sys/mountctl.h>
54 #include <sys/dirent.h>
55 #include <sys/uio.h>
56 #include <sys/objcache.h>
57 #include <sys/event.h>
58 #include <sys/file.h>
59 #include <vfs/fifofs/fifo.h>
60
61 #include "hammer2.h"
62
63 /*
64  * Determine if the specified directory is empty.
65  *
66  *      Returns 0 on success.
67  *
68  *      Returns HAMMER_ERROR_EAGAIN if caller must re-lookup the entry and
69  *      retry. (occurs if we race a ripup on oparent or ochain).
70  *
71  *      Or returns a permanent HAMMER2_ERROR_* error mask.
72  *
73  * The caller must pass in an exclusively locked oparent and ochain.  This
74  * function will handle the case where the chain is a directory entry or
75  * the inode itself.  The original oparent,ochain will be locked upon return.
76  *
77  * This function will unlock the underlying oparent,ochain temporarily when
78  * doing an inode lookup to avoid deadlocks.  The caller MUST handle the EAGAIN
79  * result as this means that oparent is no longer the parent of ochain, or
80  * that ochain was destroyed while it was unlocked.
81  */
82 static
83 int
84 checkdirempty(hammer2_chain_t *oparent, hammer2_chain_t *ochain, int clindex)
85 {
86         hammer2_chain_t *parent;
87         hammer2_chain_t *chain;
88         hammer2_key_t key_next;
89         hammer2_key_t inum;
90         int error;
91         int didunlock;
92
93         error = 0;
94         didunlock = 0;
95
96         /*
97          * Find the inode, set it up as a locked 'chain'.  ochain can be the
98          * inode itself, or it can be a directory entry.
99          */
100         if (ochain->bref.type == HAMMER2_BREF_TYPE_DIRENT) {
101                 inum = ochain->bref.embed.dirent.inum;
102                 hammer2_chain_unlock(ochain);
103                 hammer2_chain_unlock(oparent);
104
105                 parent = NULL;
106                 chain = NULL;
107                 error = hammer2_chain_inode_find(ochain->pmp, inum,
108                                                  clindex, 0,
109                                                  &parent, &chain);
110                 if (parent) {
111                         hammer2_chain_unlock(parent);
112                         hammer2_chain_drop(parent);
113                 }
114                 didunlock = 1;
115         } else {
116                 /*
117                  * The directory entry *is* the directory inode
118                  */
119                 chain = hammer2_chain_lookup_init(ochain, 0);
120         }
121
122         /*
123          * Determine if the directory is empty or not by checking its
124          * visible namespace (the area which contains directory entries).
125          */
126         if (error == 0) {
127                 parent = chain;
128                 chain = NULL;
129                 if (parent) {
130                         chain = hammer2_chain_lookup(&parent, &key_next,
131                                                      HAMMER2_DIRHASH_VISIBLE,
132                                                      HAMMER2_KEY_MAX,
133                                                      &error, 0);
134                 }
135                 if (chain) {
136                         error = HAMMER2_ERROR_ENOTEMPTY;
137                         hammer2_chain_unlock(chain);
138                         hammer2_chain_drop(chain);
139                 }
140                 hammer2_chain_lookup_done(parent);
141         }
142
143         if (didunlock) {
144                 hammer2_chain_lock(oparent, HAMMER2_RESOLVE_ALWAYS);
145                 hammer2_chain_lock(ochain, HAMMER2_RESOLVE_ALWAYS);
146                 if ((ochain->flags & HAMMER2_CHAIN_DELETED) ||
147                     (oparent->flags & HAMMER2_CHAIN_DELETED) ||
148                     ochain->parent != oparent) {
149                         kprintf("hammer2: debug: CHECKDIR inum %jd RETRY\n",
150                                 inum);
151                         error = HAMMER2_ERROR_EAGAIN;
152                 }
153         }
154         return error;
155 }
156
157 /*
158  * Backend for hammer2_vfs_root()
159  *
160  * This is called when a newly mounted PFS has not yet synchronized
161  * to the inode_tid and modify_tid.
162  */
163 void
164 hammer2_xop_ipcluster(hammer2_thread_t *thr, hammer2_xop_t *arg)
165 {
166         hammer2_xop_ipcluster_t *xop = &arg->xop_ipcluster;
167         hammer2_chain_t *chain;
168         int error;
169
170         chain = hammer2_inode_chain(xop->head.ip1, thr->clindex,
171                                     HAMMER2_RESOLVE_ALWAYS |
172                                     HAMMER2_RESOLVE_SHARED);
173         if (chain)
174                 error = chain->error;
175         else
176                 error = HAMMER2_ERROR_EIO;
177                 
178         hammer2_xop_feed(&xop->head, chain, thr->clindex, error);
179         if (chain) {
180                 hammer2_chain_unlock(chain);
181                 hammer2_chain_drop(chain);
182         }
183 }
184
185 /*
186  * Backend for hammer2_vop_readdir()
187  */
188 void
189 hammer2_xop_readdir(hammer2_thread_t *thr, hammer2_xop_t *arg)
190 {
191         hammer2_xop_readdir_t *xop = &arg->xop_readdir;
192         hammer2_chain_t *parent;
193         hammer2_chain_t *chain;
194         hammer2_key_t key_next;
195         hammer2_key_t lkey;
196         int error = 0;
197
198         lkey = xop->lkey;
199         if (hammer2_debug & 0x0020)
200                 kprintf("xop_readdir %p lkey=%016jx\n", xop, lkey);
201
202         /*
203          * The inode's chain is the iterator.  If we cannot acquire it our
204          * contribution ends here.
205          */
206         parent = hammer2_inode_chain(xop->head.ip1, thr->clindex,
207                                      HAMMER2_RESOLVE_ALWAYS |
208                                      HAMMER2_RESOLVE_SHARED);
209         if (parent == NULL) {
210                 kprintf("xop_readdir: NULL parent\n");
211                 goto done;
212         }
213
214         /*
215          * Directory scan [re]start and loop, the feed inherits the chain's
216          * lock so do not unlock it on the iteration.
217          */
218         chain = hammer2_chain_lookup(&parent, &key_next, lkey, lkey,
219                                      &error, HAMMER2_LOOKUP_SHARED);
220         if (chain == NULL) {
221                 chain = hammer2_chain_lookup(&parent, &key_next,
222                                              lkey, HAMMER2_KEY_MAX,
223                                              &error, HAMMER2_LOOKUP_SHARED);
224         }
225         while (chain) {
226                 error = hammer2_xop_feed(&xop->head, chain, thr->clindex, 0);
227                 if (error)
228                         goto break2;
229                 chain = hammer2_chain_next(&parent, chain, &key_next,
230                                            key_next, HAMMER2_KEY_MAX,
231                                            &error, HAMMER2_LOOKUP_SHARED);
232         }
233 break2:
234         if (chain) {
235                 hammer2_chain_unlock(chain);
236                 hammer2_chain_drop(chain);
237         }
238         hammer2_chain_unlock(parent);
239         hammer2_chain_drop(parent);
240 done:
241         hammer2_xop_feed(&xop->head, NULL, thr->clindex, error);
242 }
243
244 /*
245  * Backend for hammer2_vop_nresolve()
246  */
247 void
248 hammer2_xop_nresolve(hammer2_thread_t *thr, hammer2_xop_t *arg)
249 {
250         hammer2_xop_nresolve_t *xop = &arg->xop_nresolve;
251         hammer2_chain_t *parent;
252         hammer2_chain_t *chain;
253         const char *name;
254         size_t name_len;
255         hammer2_key_t key_next;
256         hammer2_key_t lhc;
257         int error;
258
259         parent = hammer2_inode_chain(xop->head.ip1, thr->clindex,
260                                      HAMMER2_RESOLVE_ALWAYS |
261                                      HAMMER2_RESOLVE_SHARED);
262         if (parent == NULL) {
263                 kprintf("xop_nresolve: NULL parent\n");
264                 chain = NULL;
265                 error = HAMMER2_ERROR_EIO;
266                 goto done;
267         }
268         name = xop->head.name1;
269         name_len = xop->head.name1_len;
270
271         /*
272          * Lookup the directory entry
273          */
274         lhc = hammer2_dirhash(name, name_len);
275         chain = hammer2_chain_lookup(&parent, &key_next,
276                                      lhc, lhc + HAMMER2_DIRHASH_LOMASK,
277                                      &error,
278                                      HAMMER2_LOOKUP_ALWAYS |
279                                      HAMMER2_LOOKUP_SHARED);
280         while (chain) {
281                 if (hammer2_chain_dirent_test(chain, name, name_len))
282                         break;
283                 chain = hammer2_chain_next(&parent, chain, &key_next,
284                                            key_next,
285                                            lhc + HAMMER2_DIRHASH_LOMASK,
286                                            &error,
287                                            HAMMER2_LOOKUP_ALWAYS |
288                                            HAMMER2_LOOKUP_SHARED);
289         }
290
291         /*
292          * If the entry is a hardlink pointer, resolve it.
293          */
294         if (chain && chain->error == 0) {
295                 if (chain->bref.type == HAMMER2_BREF_TYPE_DIRENT) {
296                         lhc = chain->bref.embed.dirent.inum;
297                         error = hammer2_chain_inode_find(chain->pmp,
298                                                          lhc,
299                                                          thr->clindex,
300                                                          HAMMER2_LOOKUP_SHARED,
301                                                          &parent,
302                                                          &chain);
303                 }
304         } else if (chain && error == 0) {
305                 error = chain->error;
306         }
307 done:
308         error = hammer2_xop_feed(&xop->head, chain, thr->clindex, error);
309         if (chain) {
310                 hammer2_chain_unlock(chain);
311                 hammer2_chain_drop(chain);
312         }
313         if (parent) {
314                 hammer2_chain_unlock(parent);
315                 hammer2_chain_drop(parent);
316         }
317 }
318
319 /*
320  * Backend for hammer2_vop_nremove(), hammer2_vop_nrmdir(), and
321  * backend for pfs_delete.
322  *
323  * This function locates and removes a directory entry, and will lookup
324  * and return the underlying inode.  For directory entries the underlying
325  * inode is not removed.  If the directory entry is the actual inode itself,
326  * it may be conditonally removed and returned.
327  *
328  * WARNING!  Any target inode's nlinks may not be synchronized to the
329  *           in-memory inode.  The frontend's hammer2_inode_unlink_finisher()
330  *           is responsible for the final disposition of the actual inode.
331  */
332 void
333 hammer2_xop_unlink(hammer2_thread_t *thr, hammer2_xop_t *arg)
334 {
335         hammer2_xop_unlink_t *xop = &arg->xop_unlink;
336         hammer2_chain_t *parent;
337         hammer2_chain_t *chain;
338         const char *name;
339         size_t name_len;
340         hammer2_key_t key_next;
341         hammer2_key_t lhc;
342         int error;
343
344 again:
345         /*
346          * Requires exclusive lock
347          */
348         parent = hammer2_inode_chain(xop->head.ip1, thr->clindex,
349                                      HAMMER2_RESOLVE_ALWAYS);
350         chain = NULL;
351         if (parent == NULL) {
352                 kprintf("xop_nresolve: NULL parent\n");
353                 error = HAMMER2_ERROR_EIO;
354                 goto done;
355         }
356         name = xop->head.name1;
357         name_len = xop->head.name1_len;
358
359         /*
360          * Lookup the directory entry
361          */
362         lhc = hammer2_dirhash(name, name_len);
363         chain = hammer2_chain_lookup(&parent, &key_next,
364                                      lhc, lhc + HAMMER2_DIRHASH_LOMASK,
365                                      &error, HAMMER2_LOOKUP_ALWAYS);
366         while (chain) {
367                 if (hammer2_chain_dirent_test(chain, name, name_len))
368                         break;
369                 chain = hammer2_chain_next(&parent, chain, &key_next,
370                                            key_next,
371                                            lhc + HAMMER2_DIRHASH_LOMASK,
372                                            &error, HAMMER2_LOOKUP_ALWAYS);
373         }
374
375         /*
376          * The directory entry will either be a BREF_TYPE_DIRENT or a
377          * BREF_TYPE_INODE.  We always permanently delete DIRENTs, but
378          * must go by xop->dopermanent for BREF_TYPE_INODE.
379          *
380          * Note that the target chain's nlinks may not be synchronized with
381          * the in-memory hammer2_inode_t structure, so we don't try to do
382          * anything fancy here.  The frontend deals with nlinks
383          * synchronization.
384          */
385         if (chain && chain->error == 0) {
386                 int dopermanent = xop->dopermanent & H2DOPERM_PERMANENT;
387                 int doforce = xop->dopermanent & H2DOPERM_FORCE;
388                 uint8_t type;
389
390                 /*
391                  * If the directory entry is the actual inode then use its
392                  * type for the directory typing tests, otherwise if it is
393                  * a directory entry, pull the type field from the entry.
394                  *
395                  * Directory entries are always permanently deleted
396                  * (because they aren't the actual inode).
397                  */
398                 if (chain->bref.type == HAMMER2_BREF_TYPE_DIRENT) {
399                         type = chain->bref.embed.dirent.type;
400                         dopermanent |= HAMMER2_DELETE_PERMANENT;
401                 } else {
402                         type = chain->data->ipdata.meta.type;
403                 }
404
405                 /*
406                  * Check directory typing and delete the entry.  Note that
407                  * nlinks adjustments are made on the real inode by the
408                  * frontend, not here.
409                  *
410                  * Unfortunately, checkdirempty() may have to unlock (parent).
411                  * If it no longer matches chain->parent after re-locking,
412                  * EAGAIN is returned.
413                  */
414                 if (type == HAMMER2_OBJTYPE_DIRECTORY && doforce) {
415                         /*
416                          * If doforce then execute the operation even if
417                          * the directory is not empty or errored.  We
418                          * ignore chain->error here, allowing an errored
419                          * chain (aka directory entry) to still be deleted.
420                          */
421                         error = hammer2_chain_delete(parent, chain,
422                                              xop->head.mtid, dopermanent);
423                 } else if (type == HAMMER2_OBJTYPE_DIRECTORY &&
424                            (error = checkdirempty(parent, chain, thr->clindex)) != 0) {
425                         /*
426                          * error may be EAGAIN or ENOTEMPTY
427                          */
428                         if (error == HAMMER2_ERROR_EAGAIN) {
429                                 hammer2_chain_unlock(chain);
430                                 hammer2_chain_drop(chain);
431                                 hammer2_chain_unlock(parent);
432                                 hammer2_chain_drop(parent);
433                                 goto again;
434                         }
435                 } else if (type == HAMMER2_OBJTYPE_DIRECTORY &&
436                     xop->isdir == 0) {
437                         error = HAMMER2_ERROR_ENOTDIR;
438                 } else if (type != HAMMER2_OBJTYPE_DIRECTORY &&
439                            xop->isdir >= 1) {
440                         error = HAMMER2_ERROR_EISDIR;
441                 } else {
442                         /*
443                          * Delete the directory entry.  chain might also
444                          * be a directly-embedded inode.
445                          *
446                          * Allow the deletion to proceed even if the chain
447                          * is errored.  Give priority to error-on-delete over
448                          * chain->error.
449                          */
450                         error = hammer2_chain_delete(parent, chain,
451                                                      xop->head.mtid,
452                                                      dopermanent);
453                         if (error == 0)
454                                 error = chain->error;
455                 }
456         } else {
457                 if (chain && error == 0)
458                         error = chain->error;
459         }
460
461         /*
462          * If chain is a directory entry we must resolve it.  We do not try
463          * to manipulate the contents as it might not be synchronized with
464          * the frontend hammer2_inode_t, nor do we try to lookup the
465          * frontend hammer2_inode_t here (we are the backend!).
466          */
467         if (chain && chain->bref.type == HAMMER2_BREF_TYPE_DIRENT &&
468             (xop->dopermanent & H2DOPERM_IGNINO) == 0) {
469                 int error2;
470
471                 lhc = chain->bref.embed.dirent.inum;
472
473                 error2 = hammer2_chain_inode_find(chain->pmp, lhc,
474                                                   thr->clindex, 0,
475                                                   &parent, &chain);
476                 if (error2) {
477                         kprintf("inode_find: %016jx %p failed\n",
478                                 lhc, chain);
479                         error2 = 0;     /* silently ignore */
480                 }
481                 if (error == 0)
482                         error = error2;
483         }
484
485         /*
486          * Return the inode target for further action.  Typically used by
487          * hammer2_inode_unlink_finisher().
488          */
489 done:
490         hammer2_xop_feed(&xop->head, chain, thr->clindex, error);
491         if (chain) {
492                 hammer2_chain_unlock(chain);
493                 hammer2_chain_drop(chain);
494                 chain = NULL;
495         }
496         if (parent) {
497                 hammer2_chain_unlock(parent);
498                 hammer2_chain_drop(parent);
499                 parent = NULL;
500         }
501 }
502
503 /*
504  * Backend for hammer2_vop_nrename()
505  *
506  * This handles the backend rename operation.  Typically this renames
507  * directory entries but can also be used to rename embedded inodes.
508  *
509  * NOTE! The frontend is responsible for updating the inode meta-data in
510  *       the file being renamed and for decrementing the target-replaced
511  *       inode's nlinks, if present.
512  */
513 void
514 hammer2_xop_nrename(hammer2_thread_t *thr, hammer2_xop_t *arg)
515 {
516         hammer2_xop_nrename_t *xop = &arg->xop_nrename;
517         hammer2_pfs_t *pmp;
518         hammer2_chain_t *parent;
519         hammer2_chain_t *chain;
520         hammer2_chain_t *tmp;
521         hammer2_inode_t *ip;
522         hammer2_key_t key_next;
523         int error;
524
525         /*
526          * We need the precise parent chain to issue the deletion.
527          *
528          * If this is a directory entry we must locate the underlying
529          * inode.  If it is an embedded inode we can act directly on it.
530          */
531         ip = xop->head.ip2;
532         pmp = ip->pmp;
533         chain = NULL;
534         error = 0;
535
536         if (xop->ip_key & HAMMER2_DIRHASH_VISIBLE) {
537                 /*
538                  * Find ip's direct parent chain.
539                  */
540                 chain = hammer2_inode_chain(ip, thr->clindex,
541                                             HAMMER2_RESOLVE_ALWAYS);
542                 if (chain == NULL) {
543                         error = HAMMER2_ERROR_EIO;
544                         parent = NULL;
545                         goto done;
546                 }
547                 parent = hammer2_chain_getparent(chain, HAMMER2_RESOLVE_ALWAYS);
548                 if (parent == NULL) {
549                         error = HAMMER2_ERROR_EIO;
550                         goto done;
551                 }
552         } else {
553                 /*
554                  * The directory entry for the head.ip1 inode
555                  * is in fdip, do a namespace search.
556                  */
557                 hammer2_key_t lhc;
558                 const char *name;
559                 size_t name_len;
560
561                 parent = hammer2_inode_chain(xop->head.ip1, thr->clindex,
562                                              HAMMER2_RESOLVE_ALWAYS);
563                 if (parent == NULL) {
564                         kprintf("xop_nrename: NULL parent\n");
565                         error = HAMMER2_ERROR_EIO;
566                         goto done;
567                 }
568                 name = xop->head.name1;
569                 name_len = xop->head.name1_len;
570
571                 /*
572                  * Lookup the directory entry
573                  */
574                 lhc = hammer2_dirhash(name, name_len);
575                 chain = hammer2_chain_lookup(&parent, &key_next,
576                                              lhc, lhc + HAMMER2_DIRHASH_LOMASK,
577                                              &error, HAMMER2_LOOKUP_ALWAYS);
578                 while (chain) {
579                         if (hammer2_chain_dirent_test(chain, name, name_len))
580                                 break;
581                         chain = hammer2_chain_next(&parent, chain, &key_next,
582                                                    key_next,
583                                                    lhc + HAMMER2_DIRHASH_LOMASK,
584                                                    &error,
585                                                    HAMMER2_LOOKUP_ALWAYS);
586                 }
587         }
588
589         if (chain == NULL) {
590                 /* XXX shouldn't happen, but does under fsstress */
591                 kprintf("hammer2_xop_rename: \"%s\" -> \"%s\"  ENOENT\n",
592                         xop->head.name1,
593                         xop->head.name2);
594                 if (error == 0)
595                         error = HAMMER2_ERROR_ENOENT;
596                 goto done;
597         }
598
599         if (chain->error) {
600                 error = chain->error;
601                 goto done;
602         }
603
604         /*
605          * Delete it, then create it in the new namespace.
606          *
607          * An error can occur if the chain being deleted requires
608          * modification and the media is full.
609          */
610         error = hammer2_chain_delete(parent, chain, xop->head.mtid, 0);
611         hammer2_chain_unlock(parent);
612         hammer2_chain_drop(parent);
613         parent = NULL;          /* safety */
614         if (error)
615                 goto done;
616
617         /*
618          * Adjust fields in the deleted chain appropriate for the rename
619          * operation.
620          *
621          * NOTE! For embedded inodes, the frontend will officially replicate
622          *       the field adjustments, but we also do it here to maintain
623          *       consistency in case of a crash.
624          */
625         if (chain->bref.key != xop->lhc ||
626             xop->head.name1_len != xop->head.name2_len ||
627             bcmp(xop->head.name1, xop->head.name2, xop->head.name1_len) != 0) {
628                 if (chain->bref.type == HAMMER2_BREF_TYPE_INODE) {
629                         hammer2_inode_data_t *wipdata;
630
631                         error = hammer2_chain_modify(chain, xop->head.mtid,
632                                                      0, 0);
633                         if (error == 0) {
634                                 wipdata = &chain->data->ipdata;
635
636                                 bzero(wipdata->filename,
637                                       sizeof(wipdata->filename));
638                                 bcopy(xop->head.name2,
639                                       wipdata->filename,
640                                       xop->head.name2_len);
641                                 wipdata->meta.name_key = xop->lhc;
642                                 wipdata->meta.name_len = xop->head.name2_len;
643                         }
644                 }
645                 if (chain->bref.type == HAMMER2_BREF_TYPE_DIRENT) {
646                         if (xop->head.name2_len <=
647                             sizeof(chain->bref.check.buf)) {
648                                 /*
649                                  * Remove any related data buffer, we can
650                                  * embed the filename in the bref itself.
651                                  */
652                                 error = hammer2_chain_resize(
653                                                 chain, xop->head.mtid, 0, 0, 0);
654                                 if (error == 0) {
655                                         error = hammer2_chain_modify(
656                                                         chain, xop->head.mtid,
657                                                         0, 0);
658                                 }
659                                 if (error == 0) {
660                                         bzero(chain->bref.check.buf,
661                                               sizeof(chain->bref.check.buf));
662                                         bcopy(xop->head.name2,
663                                               chain->bref.check.buf,
664                                               xop->head.name2_len);
665                                 }
666                         } else {
667                                 /*
668                                  * Associate a data buffer with the bref.
669                                  * Zero it for consistency.  Note that the
670                                  * data buffer is not 64KB so use chain->bytes
671                                  * instead of sizeof().
672                                  */
673                                 error = hammer2_chain_resize(
674                                         chain, xop->head.mtid, 0,
675                                         hammer2_getradix(HAMMER2_ALLOC_MIN), 0);
676                                 if (error == 0) {
677                                         error = hammer2_chain_modify(
678                                                     chain, xop->head.mtid,
679                                                     0, 0);
680                                 }
681                                 if (error == 0) {
682                                         bzero(chain->data->buf, chain->bytes);
683                                         bcopy(xop->head.name2,
684                                               chain->data->buf,
685                                               xop->head.name2_len);
686                                 }
687                         }
688                         if (error == 0) {
689                                 chain->bref.embed.dirent.namlen =
690                                         xop->head.name2_len;
691                         }
692                 }
693         }
694
695         /*
696          * The frontend will replicate this operation and is the real final
697          * authority, but adjust the inode's iparent field too if the inode
698          * is embedded in the directory.
699          */
700         if (chain->bref.type == HAMMER2_BREF_TYPE_INODE &&
701             chain->data->ipdata.meta.iparent != xop->head.ip3->meta.inum) {
702                 hammer2_inode_data_t *wipdata;
703
704                 error = hammer2_chain_modify(chain, xop->head.mtid, 0, 0);
705                 if (error == 0) {
706                         wipdata = &chain->data->ipdata;
707                         wipdata->meta.iparent = xop->head.ip3->meta.inum;
708                 }
709         }
710
711         /*
712          * Destroy any matching target(s) before creating the new entry.
713          * This will result in some ping-ponging of the directory key
714          * iterator but that is ok.
715          */
716         parent = hammer2_inode_chain(xop->head.ip3, thr->clindex,
717                                      HAMMER2_RESOLVE_ALWAYS);
718         if (parent == NULL) {
719                 error = HAMMER2_ERROR_EIO;
720                 goto done;
721         }
722
723         /*
724          * Delete all matching directory entries.  That is, get rid of
725          * multiple duplicates if present, as a self-healing mechanism.
726          */
727         if (error == 0) {
728                 tmp = hammer2_chain_lookup(&parent, &key_next,
729                                            xop->lhc & ~HAMMER2_DIRHASH_LOMASK,
730                                            xop->lhc | HAMMER2_DIRHASH_LOMASK,
731                                            &error,
732                                            HAMMER2_LOOKUP_ALWAYS);
733                 while (tmp) {
734                         int e2;
735                         if (hammer2_chain_dirent_test(tmp, xop->head.name2,
736                                                       xop->head.name2_len)) {
737                                 e2 = hammer2_chain_delete(parent, tmp,
738                                                           xop->head.mtid, 0);
739                                 if (error == 0 && e2)
740                                         error = e2;
741                         }
742                         tmp = hammer2_chain_next(&parent, tmp, &key_next,
743                                                  key_next,
744                                                  xop->lhc |
745                                                   HAMMER2_DIRHASH_LOMASK,
746                                                  &error,
747                                                  HAMMER2_LOOKUP_ALWAYS);
748                 }
749         }
750         if (error == 0) {
751                 /*
752                  * A relookup is required before the create to properly
753                  * position the parent chain.
754                  */
755                 tmp = hammer2_chain_lookup(&parent, &key_next,
756                                            xop->lhc, xop->lhc,
757                                            &error, 0);
758                 KKASSERT(tmp == NULL);
759                 error = hammer2_chain_create(&parent, &chain,
760                                              pmp, HAMMER2_METH_DEFAULT,
761                                              xop->lhc, 0,
762                                              HAMMER2_BREF_TYPE_INODE,
763                                              HAMMER2_INODE_BYTES,
764                                              xop->head.mtid, 0, 0);
765         }
766 done:
767         hammer2_xop_feed(&xop->head, NULL, thr->clindex, error);
768         if (parent) {
769                 hammer2_chain_unlock(parent);
770                 hammer2_chain_drop(parent);
771         }
772         if (chain) {
773                 hammer2_chain_unlock(chain);
774                 hammer2_chain_drop(chain);
775         }
776 }
777
778 /*
779  * Directory collision resolver scan helper (backend, threaded).
780  *
781  * Used by the inode create code to locate an unused lhc.
782  */
783 void
784 hammer2_xop_scanlhc(hammer2_thread_t *thr, hammer2_xop_t *arg)
785 {
786         hammer2_xop_scanlhc_t *xop = &arg->xop_scanlhc;
787         hammer2_chain_t *parent;
788         hammer2_chain_t *chain;
789         hammer2_key_t key_next;
790         int error = 0;
791
792         parent = hammer2_inode_chain(xop->head.ip1, thr->clindex,
793                                      HAMMER2_RESOLVE_ALWAYS |
794                                      HAMMER2_RESOLVE_SHARED);
795         if (parent == NULL) {
796                 kprintf("xop_nresolve: NULL parent\n");
797                 chain = NULL;
798                 error = HAMMER2_ERROR_EIO;
799                 goto done;
800         }
801
802         /*
803          * Lookup all possibly conflicting directory entries, the feed
804          * inherits the chain's lock so do not unlock it on the iteration.
805          */
806         chain = hammer2_chain_lookup(&parent, &key_next,
807                                      xop->lhc,
808                                      xop->lhc + HAMMER2_DIRHASH_LOMASK,
809                                      &error,
810                                      HAMMER2_LOOKUP_ALWAYS |
811                                      HAMMER2_LOOKUP_SHARED);
812         while (chain) {
813                 error = hammer2_xop_feed(&xop->head, chain, thr->clindex, 0);
814                 if (error) {
815                         hammer2_chain_unlock(chain);
816                         hammer2_chain_drop(chain);
817                         chain = NULL;   /* safety */
818                         goto done;
819                 }
820                 chain = hammer2_chain_next(&parent, chain, &key_next,
821                                            key_next,
822                                            xop->lhc + HAMMER2_DIRHASH_LOMASK,
823                                            &error,
824                                            HAMMER2_LOOKUP_ALWAYS |
825                                            HAMMER2_LOOKUP_SHARED);
826         }
827 done:
828         hammer2_xop_feed(&xop->head, NULL, thr->clindex, error);
829         if (parent) {
830                 hammer2_chain_unlock(parent);
831                 hammer2_chain_drop(parent);
832         }
833 }
834
835 /*
836  * Generic lookup of a specific key.
837  *
838  * Used by the inode hidden directory code to find the hidden directory.
839  */
840 void
841 hammer2_xop_lookup(hammer2_thread_t *thr, hammer2_xop_t *arg)
842 {
843         hammer2_xop_scanlhc_t *xop = &arg->xop_scanlhc;
844         hammer2_chain_t *parent;
845         hammer2_chain_t *chain;
846         hammer2_key_t key_next;
847         int error = 0;
848
849         parent = hammer2_inode_chain(xop->head.ip1, thr->clindex,
850                                      HAMMER2_RESOLVE_ALWAYS |
851                                      HAMMER2_RESOLVE_SHARED);
852         chain = NULL;
853         if (parent == NULL) {
854                 error = HAMMER2_ERROR_EIO;
855                 goto done;
856         }
857
858         /*
859          * Lookup all possibly conflicting directory entries, the feed
860          * inherits the chain's lock so do not unlock it on the iteration.
861          */
862         chain = hammer2_chain_lookup(&parent, &key_next,
863                                      xop->lhc, xop->lhc,
864                                      &error,
865                                      HAMMER2_LOOKUP_ALWAYS |
866                                      HAMMER2_LOOKUP_SHARED);
867         if (error == 0) {
868                 if (chain)
869                         error = chain->error;
870                 else
871                         error = HAMMER2_ERROR_ENOENT;
872         }
873         hammer2_xop_feed(&xop->head, chain, thr->clindex, error);
874
875 done:
876         if (chain) {
877                 hammer2_chain_unlock(chain);
878                 hammer2_chain_drop(chain);
879         }
880         if (parent) {
881                 hammer2_chain_unlock(parent);
882                 hammer2_chain_drop(parent);
883         }
884 }
885
886 /*
887  * Generic scan
888  *
889  * WARNING! Fed chains must be locked shared so ownership can be transfered
890  *          and to prevent frontend/backend stalls that would occur with an
891  *          exclusive lock.  The shared lock also allows chain->data to be
892  *          retained.
893  */
894 void
895 hammer2_xop_scanall(hammer2_thread_t *thr, hammer2_xop_t *arg)
896 {
897         hammer2_xop_scanall_t *xop = &arg->xop_scanall;
898         hammer2_chain_t *parent;
899         hammer2_chain_t *chain;
900         hammer2_key_t key_next;
901         int error = 0;
902
903         /*
904          * Assert required flags.
905          */
906         KKASSERT(xop->resolve_flags & HAMMER2_RESOLVE_SHARED);
907         KKASSERT(xop->lookup_flags & HAMMER2_LOOKUP_SHARED);
908
909         /*
910          * The inode's chain is the iterator.  If we cannot acquire it our
911          * contribution ends here.
912          */
913         parent = hammer2_inode_chain(xop->head.ip1, thr->clindex,
914                                      xop->resolve_flags);
915         if (parent == NULL) {
916                 kprintf("xop_readdir: NULL parent\n");
917                 goto done;
918         }
919
920         /*
921          * Generic scan of exact records.  Note that indirect blocks are
922          * automatically recursed and will not be returned.
923          */
924         chain = hammer2_chain_lookup(&parent, &key_next,
925                                      xop->key_beg, xop->key_end,
926                                      &error, xop->lookup_flags);
927         while (chain) {
928                 error = hammer2_xop_feed(&xop->head, chain, thr->clindex, 0);
929                 if (error)
930                         goto break2;
931                 chain = hammer2_chain_next(&parent, chain, &key_next,
932                                            key_next, xop->key_end,
933                                            &error, xop->lookup_flags);
934         }
935 break2:
936         if (chain) {
937                 hammer2_chain_unlock(chain);
938                 hammer2_chain_drop(chain);
939         }
940         hammer2_chain_unlock(parent);
941         hammer2_chain_drop(parent);
942 done:
943         hammer2_xop_feed(&xop->head, NULL, thr->clindex, error);
944 }