4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License version 2 for more details (a copy is included
14 * in the LICENSE file that accompanied this code).
16 * You should have received a copy of the GNU General Public License
17 * version 2 along with this program; If not, see
18 * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf
20 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
21 * CA 95054 USA or visit www.sun.com if you need additional information or
27 * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved.
28 * Use is subject to license terms.
30 * Copyright (c) 2011, 2012, Intel Corporation.
33 * This file is part of Lustre, http://www.lustre.org/
34 * Lustre is a trademark of Sun Microsystems, Inc.
37 #ifndef __LUSTRE_DT_OBJECT_H
38 #define __LUSTRE_DT_OBJECT_H
41 * Sub-class of lu_object with methods common for "data" objects in OST stack.
43 * Data objects behave like regular files: you can read/write them, get and
44 * set their attributes. Implementation of dt interface is supposed to
45 * implement some form of garbage collection, normally reference counting
48 * Examples: osd (lustre/osd) is an implementation of dt interface.
54 * super-class definitions.
56 #include "lu_object.h"
58 #include "../../include/linux/libcfs/libcfs.h"
61 struct proc_dir_entry;
67 struct dt_index_features;
70 struct ldlm_enqueue_info;
73 MNTOPT_USERXATTR = 0x00000001,
74 MNTOPT_ACL = 0x00000002,
77 struct dt_device_param {
78 unsigned ddp_max_name_len;
79 unsigned ddp_max_nlink;
80 unsigned ddp_block_shift;
82 unsigned ddp_max_ea_size;
83 void *ddp_mnt; /* XXX: old code can retrieve mnt -bzzz */
85 unsigned long long ddp_maxbytes;
86 /* percentage of available space to reserve for grant error margin */
87 int ddp_grant_reserved;
88 /* per-inode space consumption */
90 /* per-fragment grant overhead to be used by client for grant
96 * Per-transaction commit callback function
98 struct dt_txn_commit_cb;
99 typedef void (*dt_cb_t)(struct lu_env *env, struct thandle *th,
100 struct dt_txn_commit_cb *cb, int err);
102 * Special per-transaction callback for cases when just commit callback
103 * is needed and per-device callback are not convenient to use
105 #define TRANS_COMMIT_CB_MAGIC 0xa0a00a0a
106 #define MAX_COMMIT_CB_STR_LEN 32
108 struct dt_txn_commit_cb {
109 struct list_head dcb_linkage;
112 char dcb_name[MAX_COMMIT_CB_STR_LEN];
116 * Operations on dt device.
118 struct dt_device_operations {
120 * Return device-wide statistics.
122 int (*dt_statfs)(const struct lu_env *env,
123 struct dt_device *dev, struct obd_statfs *osfs);
/**
 * Create a transaction handle on \a dev.
 */
127 struct thandle *(*dt_trans_create)(const struct lu_env *env,
128 struct dt_device *dev);
/**
 * Start the transaction \a th on \a dev.
 */
132 int (*dt_trans_start)(const struct lu_env *env,
133 struct dt_device *dev, struct thandle *th);
135 * Finish previously started transaction.
137 int (*dt_trans_stop)(const struct lu_env *env,
140 * Add commit callback to the transaction.
142 int (*dt_trans_cb_add)(struct thandle *th,
143 struct dt_txn_commit_cb *dcb);
145 * Return fid of root index object.
147 int (*dt_root_get)(const struct lu_env *env,
148 struct dt_device *dev, struct lu_fid *f);
150 * Return device configuration data.
152 void (*dt_conf_get)(const struct lu_env *env,
153 const struct dt_device *dev,
154 struct dt_device_param *param);
156 * handling device state, mostly for tests
158 int (*dt_sync)(const struct lu_env *env, struct dt_device *dev);
159 int (*dt_ro)(const struct lu_env *env, struct dt_device *dev);
161 * Start a transaction commit asynchronously
163 * \param env environment
164 * \param dev dt_device to start commit on
166 * \return 0 success, negative value if error
168 int (*dt_commit_async)(const struct lu_env *env,
169 struct dt_device *dev);
171 * Initialize capability context.
173 int (*dt_init_capa_ctxt)(const struct lu_env *env,
174 struct dt_device *dev,
175 int mode, unsigned long timeout,
176 __u32 alg, struct lustre_capa_key *keys);
179 struct dt_index_features {
180 /** required feature flags from enum dt_index_flags */
182 /** minimal required key size */
183 size_t dif_keysize_min;
184 /** maximal required key size, 0 if no limit */
185 size_t dif_keysize_max;
186 /** minimal required record size */
187 size_t dif_recsize_min;
188 /** maximal required record size, 0 if no limit */
189 size_t dif_recsize_max;
190 /** pointer size for record */
/**
 * Index capability flags. Every enumerator occupies its own bit, so a set
 * of capabilities is expressed by OR-ing enumerators together.
 */
enum dt_index_flags {
	/** keys may be of variable size */
	DT_IND_VARKEY = 0x01,
	/** records may be of variable size */
	DT_IND_VARREC = 0x02,
	/** the index can be modified */
	DT_IND_UPDATE = 0x04,
	/** several records may share the same (non-unique) key */
	DT_IND_NONUNQ = 0x08,
	/**
	 * the index supports fixed-size keys sorted in natural numerical
	 * order and is able to return the left-side value if no exact
	 * value is found
	 */
	DT_IND_RANGE = 0x10,
};
211 * Features, required from index to support file system directories (mapping
214 extern const struct dt_index_features dt_directory_features;
215 extern const struct dt_index_features dt_otable_features;
216 extern const struct dt_index_features dt_lfsck_features;
218 /* index features supported by the accounting objects */
219 extern const struct dt_index_features dt_acct_features;
221 /* index features supported by the quota global indexes */
222 extern const struct dt_index_features dt_quota_glb_features;
224 /* index features supported by the quota slave indexes */
225 extern const struct dt_index_features dt_quota_slv_features;
228 * This is a general purpose dt allocation hint.
229 * It now contains the parent object.
230 * It can contain any allocation hint in the future.
232 struct dt_allocation_hint {
233 struct dt_object *dah_parent;
238 * object type specifier.
241 enum dt_format_type {
246 /** for special index */
248 /** for symbolic link */
253 * object format specifier.
255 struct dt_object_format {
256 /** type for dt object */
257 enum dt_format_type dof_type;
267 * special index need feature as parameter to create
271 const struct dt_index_features *di_feat;
276 enum dt_format_type dt_mode_to_dft(__u32 mode);
278 typedef __u64 dt_obj_version_t;
281 * Per-dt-object operations.
283 struct dt_object_operations {
284 void (*do_read_lock)(const struct lu_env *env,
285 struct dt_object *dt, unsigned role);
286 void (*do_write_lock)(const struct lu_env *env,
287 struct dt_object *dt, unsigned role);
288 void (*do_read_unlock)(const struct lu_env *env,
289 struct dt_object *dt);
290 void (*do_write_unlock)(const struct lu_env *env,
291 struct dt_object *dt);
292 int (*do_write_locked)(const struct lu_env *env,
293 struct dt_object *dt);
295 * Note: following ->do_{x,}attr_{set,get}() operations are very
296 * similar to ->moo_{x,}attr_{set,get}() operations in struct
297 * md_object_operations (see md_object.h). These operations are not in
298 * lu_object_operations, because ->do_{x,}attr_set() versions take
299 * transaction handle as an argument (this transaction is started by
300 * caller). We might factor ->do_{x,}attr_get() into
301 * lu_object_operations, but that would break existing symmetry.
305 * Return standard attributes.
307 * precondition: lu_object_exists(&dt->do_lu);
309 int (*do_attr_get)(const struct lu_env *env,
310 struct dt_object *dt, struct lu_attr *attr,
311 struct lustre_capa *capa);
313 * Set standard attributes.
315 * precondition: dt_object_exists(dt);
317 int (*do_declare_attr_set)(const struct lu_env *env,
318 struct dt_object *dt,
319 const struct lu_attr *attr,
320 struct thandle *handle);
321 int (*do_attr_set)(const struct lu_env *env,
322 struct dt_object *dt,
323 const struct lu_attr *attr,
324 struct thandle *handle,
325 struct lustre_capa *capa);
327 * Return a value of an extended attribute.
329 * precondition: dt_object_exists(dt);
331 int (*do_xattr_get)(const struct lu_env *env, struct dt_object *dt,
332 struct lu_buf *buf, const char *name,
333 struct lustre_capa *capa);
335 * Set value of an extended attribute.
337 * \a fl - flags from enum lu_xattr_flags
339 * precondition: dt_object_exists(dt);
341 int (*do_declare_xattr_set)(const struct lu_env *env,
342 struct dt_object *dt,
343 const struct lu_buf *buf,
344 const char *name, int fl,
345 struct thandle *handle);
346 int (*do_xattr_set)(const struct lu_env *env,
347 struct dt_object *dt, const struct lu_buf *buf,
348 const char *name, int fl, struct thandle *handle,
349 struct lustre_capa *capa);
351 * Delete existing extended attribute.
353 * precondition: dt_object_exists(dt);
355 int (*do_declare_xattr_del)(const struct lu_env *env,
356 struct dt_object *dt,
357 const char *name, struct thandle *handle);
358 int (*do_xattr_del)(const struct lu_env *env,
359 struct dt_object *dt,
360 const char *name, struct thandle *handle,
361 struct lustre_capa *capa);
363 * Place list of existing extended attributes into \a buf (which has
366 * precondition: dt_object_exists(dt);
368 int (*do_xattr_list)(const struct lu_env *env,
369 struct dt_object *dt, struct lu_buf *buf,
370 struct lustre_capa *capa);
372 * Init allocation hint using parent object and child mode.
373 * (1) The \a parent might be NULL if this is a partial creation for
375 * (2) The type of child is in \a child_mode.
376 * (3) The result hint is stored in \a ah;
378 void (*do_ah_init)(const struct lu_env *env,
379 struct dt_allocation_hint *ah,
380 struct dt_object *parent,
381 struct dt_object *child,
384 * Create new object on this device.
386 * precondition: !dt_object_exists(dt);
387 * postcondition: ergo(result == 0, dt_object_exists(dt));
389 int (*do_declare_create)(const struct lu_env *env,
390 struct dt_object *dt,
391 struct lu_attr *attr,
392 struct dt_allocation_hint *hint,
393 struct dt_object_format *dof,
395 int (*do_create)(const struct lu_env *env, struct dt_object *dt,
396 struct lu_attr *attr,
397 struct dt_allocation_hint *hint,
398 struct dt_object_format *dof,
/**
 * Destroy object on this device.
 *
 * precondition: dt_object_exists(dt);
 * postcondition: ergo(result == 0, !dt_object_exists(dt));
 */
406 int (*do_declare_destroy)(const struct lu_env *env,
407 struct dt_object *dt,
409 int (*do_destroy)(const struct lu_env *env, struct dt_object *dt,
/**
 * Announce that this object is going to be used as an index. This
 * operation checks that the object supports indexing operations and
 * installs the appropriate dt_index_operations vector on success.
 *
 * Also probes for features. The operation is successful if all required
 * features are supported.
 */
420 int (*do_index_try)(const struct lu_env *env,
421 struct dt_object *dt,
422 const struct dt_index_features *feat);
424 * Add nlink of the object
425 * precondition: dt_object_exists(dt);
427 int (*do_declare_ref_add)(const struct lu_env *env,
428 struct dt_object *dt, struct thandle *th);
429 int (*do_ref_add)(const struct lu_env *env,
430 struct dt_object *dt, struct thandle *th);
432 * Del nlink of the object
433 * precondition: dt_object_exists(dt);
435 int (*do_declare_ref_del)(const struct lu_env *env,
436 struct dt_object *dt, struct thandle *th);
437 int (*do_ref_del)(const struct lu_env *env,
438 struct dt_object *dt, struct thandle *th);
440 struct obd_capa *(*do_capa_get)(const struct lu_env *env,
441 struct dt_object *dt,
442 struct lustre_capa *old,
444 int (*do_object_sync)(const struct lu_env *env, struct dt_object *obj,
445 __u64 start, __u64 end);
447 * Get object info of next level. Currently, only get inode from osd.
448 * This is only used by quota b=16542
449 * precondition: dt_object_exists(dt);
451 int (*do_data_get)(const struct lu_env *env, struct dt_object *dt,
457 int (*do_object_lock)(const struct lu_env *env, struct dt_object *dt,
458 struct lustre_handle *lh,
459 struct ldlm_enqueue_info *einfo,
464 * Per-dt-object operations on "file body".
466 struct dt_body_operations {
468 * precondition: dt_object_exists(dt);
470 ssize_t (*dbo_read)(const struct lu_env *env, struct dt_object *dt,
471 struct lu_buf *buf, loff_t *pos,
472 struct lustre_capa *capa);
474 * precondition: dt_object_exists(dt);
476 ssize_t (*dbo_declare_write)(const struct lu_env *env,
477 struct dt_object *dt,
478 const loff_t size, loff_t pos,
479 struct thandle *handle);
480 ssize_t (*dbo_write)(const struct lu_env *env, struct dt_object *dt,
481 const struct lu_buf *buf, loff_t *pos,
482 struct thandle *handle, struct lustre_capa *capa,
485 * methods for zero-copy IO
489 * precondition: dt_object_exists(dt);
493 * > 0 - number of local buffers prepared
495 int (*dbo_bufs_get)(const struct lu_env *env, struct dt_object *dt,
496 loff_t pos, ssize_t len, struct niobuf_local *lb,
497 int rw, struct lustre_capa *capa);
499 * precondition: dt_object_exists(dt);
501 int (*dbo_bufs_put)(const struct lu_env *env, struct dt_object *dt,
502 struct niobuf_local *lb, int nr);
504 * precondition: dt_object_exists(dt);
506 int (*dbo_write_prep)(const struct lu_env *env, struct dt_object *dt,
507 struct niobuf_local *lb, int nr);
509 * precondition: dt_object_exists(dt);
511 int (*dbo_declare_write_commit)(const struct lu_env *env,
512 struct dt_object *dt,
513 struct niobuf_local *,
514 int, struct thandle *);
516 * precondition: dt_object_exists(dt);
518 int (*dbo_write_commit)(const struct lu_env *env, struct dt_object *dt,
519 struct niobuf_local *, int, struct thandle *);
521 * precondition: dt_object_exists(dt);
523 int (*dbo_read_prep)(const struct lu_env *env, struct dt_object *dt,
524 struct niobuf_local *lnb, int nr);
525 int (*dbo_fiemap_get)(const struct lu_env *env, struct dt_object *dt,
526 struct ll_user_fiemap *fm);
528 * Punch object's content
529 * precondition: regular object, not index
531 int (*dbo_declare_punch)(const struct lu_env *, struct dt_object *,
532 __u64, __u64, struct thandle *th);
533 int (*dbo_punch)(const struct lu_env *env, struct dt_object *dt,
534 __u64 start, __u64 end, struct thandle *th,
535 struct lustre_capa *capa);
539 * Incomplete type of index record.
544 * Incomplete type of index key.
549 * Incomplete type of dt iterator.
554 * Per-dt-object operations on object as index.
556 struct dt_index_operations {
558 * precondition: dt_object_exists(dt);
560 int (*dio_lookup)(const struct lu_env *env, struct dt_object *dt,
561 struct dt_rec *rec, const struct dt_key *key,
562 struct lustre_capa *capa);
564 * precondition: dt_object_exists(dt);
566 int (*dio_declare_insert)(const struct lu_env *env,
567 struct dt_object *dt,
568 const struct dt_rec *rec,
569 const struct dt_key *key,
570 struct thandle *handle);
571 int (*dio_insert)(const struct lu_env *env, struct dt_object *dt,
572 const struct dt_rec *rec, const struct dt_key *key,
573 struct thandle *handle, struct lustre_capa *capa,
576 * precondition: dt_object_exists(dt);
578 int (*dio_declare_delete)(const struct lu_env *env,
579 struct dt_object *dt,
580 const struct dt_key *key,
581 struct thandle *handle);
582 int (*dio_delete)(const struct lu_env *env, struct dt_object *dt,
583 const struct dt_key *key, struct thandle *handle,
584 struct lustre_capa *capa);
590 * Allocate and initialize new iterator.
592 * precondition: dt_object_exists(dt);
594 struct dt_it *(*init)(const struct lu_env *env,
595 struct dt_object *dt,
597 struct lustre_capa *capa);
598 void (*fini)(const struct lu_env *env,
600 int (*get)(const struct lu_env *env,
602 const struct dt_key *key);
603 void (*put)(const struct lu_env *env,
605 int (*next)(const struct lu_env *env,
607 struct dt_key *(*key)(const struct lu_env *env,
608 const struct dt_it *di);
609 int (*key_size)(const struct lu_env *env,
610 const struct dt_it *di);
611 int (*rec)(const struct lu_env *env,
612 const struct dt_it *di,
615 __u64 (*store)(const struct lu_env *env,
616 const struct dt_it *di);
617 int (*load)(const struct lu_env *env,
618 const struct dt_it *di, __u64 hash);
619 int (*key_rec)(const struct lu_env *env,
620 const struct dt_it *di, void *key_rec);
624 enum dt_otable_it_valid {
625 DOIV_ERROR_HANDLE = 0x0001,
628 enum dt_otable_it_flags {
629 /* Exit when fail. */
630 DOIF_FAILOUT = 0x0001,
632 /* Reset iteration position to the device beginning. */
635 /* There is up layer component uses the iteration. */
636 DOIF_OUTUSED = 0x0004,
/*
 * otable based iteration needs to use the common DT iteration APIs.
 * To initialize the iteration, it needs to call dio_it::init() first.
 * Here is how the otable based iteration should prepare arguments to
 * call dt_it_ops::init().
 *
 * For otable based iteration, the 32-bit 'attr' for dt_it_ops::init()
 * is composed of two parts:
 * the low 16 bits are the valid bits, the high 16 bits are the flag bits.
 */
647 #define DT_OTABLE_IT_FLAGS_SHIFT 16
648 #define DT_OTABLE_IT_FLAGS_MASK 0xffff0000
651 struct lu_device dd_lu_dev;
652 const struct dt_device_operations *dd_ops;
655 * List of dt_txn_callback (see below). This is not protected in any
656 * way, because callbacks are supposed to be added/deleted only during
657 * single-threaded start-up shut-down procedures.
659 struct list_head dd_txn_callbacks;
662 int dt_device_init(struct dt_device *dev, struct lu_device_type *t);
663 void dt_device_fini(struct dt_device *dev);
665 static inline int lu_device_is_dt(const struct lu_device *d)
667 return ergo(d != NULL, d->ld_type->ldt_tags & LU_DEVICE_DT);
670 static inline struct dt_device *lu2dt_dev(struct lu_device *l)
672 LASSERT(lu_device_is_dt(l));
673 return container_of0(l, struct dt_device, dd_lu_dev);
677 struct lu_object do_lu;
678 const struct dt_object_operations *do_ops;
679 const struct dt_body_operations *do_body_ops;
680 const struct dt_index_operations *do_index_ops;
684 * In-core representation of per-device local object OID storage
686 struct local_oid_storage {
687 /* all initialized llog systems on this node linked by this */
688 struct list_head los_list;
690 /* how many handle's reference this los has */
691 atomic_t los_refcount;
692 struct dt_device *los_dev;
693 struct dt_object *los_obj;
695 /* data used to generate new fids */
696 struct mutex los_id_lock;
701 static inline struct dt_object *lu2dt(struct lu_object *l)
703 LASSERT(l == NULL || IS_ERR(l) || lu_device_is_dt(l->lo_dev));
704 return container_of0(l, struct dt_object, do_lu);
707 int dt_object_init(struct dt_object *obj,
708 struct lu_object_header *h, struct lu_device *d);
710 void dt_object_fini(struct dt_object *obj);
712 static inline int dt_object_exists(const struct dt_object *dt)
714 return lu_object_exists(&dt->do_lu);
717 static inline int dt_object_remote(const struct dt_object *dt)
719 return lu_object_remote(&dt->do_lu);
722 static inline struct dt_object *lu2dt_obj(struct lu_object *o)
724 LASSERT(ergo(o != NULL, lu_device_is_dt(o->lo_dev)));
725 return container_of0(o, struct dt_object, do_lu);
729 * This is the general purpose transaction handle.
730 * 1. Transaction Life Cycle
731 * This transaction handle is allocated upon starting a new transaction,
732 * and deallocated after this transaction is committed.
733 * 2. Transaction Nesting
734 * We do _NOT_ support nested transaction. So, every thread should only
735 * have one active transaction, and a transaction only belongs to one
736 * thread. Due to this, transaction handle need no reference count.
737 * 3. Transaction & dt_object locking
738 * dt_object locks should be taken inside transaction.
739 * 4. Transaction & RPC
740 * No RPC request should be issued inside transaction.
743 /** the dt device on which the transactions are executed */
744 struct dt_device *th_dev;
746 /** context for this transaction, tag is LCT_TX_HANDLE */
747 struct lu_context th_ctx;
749 /** additional tags (layers can add in declare) */
752 /** the last operation result in this transaction.
753 * this value is used in recovery */
756 /** whether we need sync commit */
757 unsigned int th_sync:1;
/* local transaction, no need to inform other layers */
760 unsigned int th_local:1;
/*
 * In DNE, one transaction can be disassembled into
 * updates on several different MDTs, and these updates
 * will be attached to th_remote_update_list per target.
 * Only a single thread will access the list, so no lock is needed.
 */
767 struct list_head th_remote_update_list;
768 struct update_request *th_current_request;
772 * Transaction call-backs.
774 * These are invoked by osd (or underlying transaction engine) when
775 * transaction changes state.
777 * Call-backs are used by upper layers to modify transaction parameters and to
778 * perform some actions on for each transaction state transition. Typical
779 * example is mdt registering call-back to write into last-received file
780 * before each transaction commit.
782 struct dt_txn_callback {
783 int (*dtc_txn_start)(const struct lu_env *env,
784 struct thandle *txn, void *cookie);
785 int (*dtc_txn_stop)(const struct lu_env *env,
786 struct thandle *txn, void *cookie);
787 void (*dtc_txn_commit)(struct thandle *txn, void *cookie);
790 struct list_head dtc_linkage;
793 void dt_txn_callback_add(struct dt_device *dev, struct dt_txn_callback *cb);
794 void dt_txn_callback_del(struct dt_device *dev, struct dt_txn_callback *cb);
796 int dt_txn_hook_start(const struct lu_env *env,
797 struct dt_device *dev, struct thandle *txn);
798 int dt_txn_hook_stop(const struct lu_env *env, struct thandle *txn);
799 void dt_txn_hook_commit(struct thandle *txn);
801 int dt_try_as_dir(const struct lu_env *env, struct dt_object *obj);
804 * Callback function used for parsing path.
805 * \see llo_store_resolve
807 typedef int (*dt_entry_func_t)(const struct lu_env *env,
811 #define DT_MAX_PATH 1024
813 int dt_path_parser(const struct lu_env *env,
814 char *local, dt_entry_func_t entry_func,
818 dt_store_resolve(const struct lu_env *env, struct dt_device *dt,
819 const char *path, struct lu_fid *fid);
821 struct dt_object *dt_store_open(const struct lu_env *env,
822 struct dt_device *dt,
824 const char *filename,
827 struct dt_object *dt_find_or_create(const struct lu_env *env,
828 struct dt_device *dt,
829 const struct lu_fid *fid,
830 struct dt_object_format *dof,
831 struct lu_attr *attr);
833 struct dt_object *dt_locate_at(const struct lu_env *env,
834 struct dt_device *dev,
835 const struct lu_fid *fid,
836 struct lu_device *top_dev);
837 static inline struct dt_object *
838 dt_locate(const struct lu_env *env, struct dt_device *dev,
839 const struct lu_fid *fid)
841 return dt_locate_at(env, dev, fid, dev->dd_lu_dev.ld_site->ls_top_dev);
845 int local_oid_storage_init(const struct lu_env *env, struct dt_device *dev,
846 const struct lu_fid *first_fid,
847 struct local_oid_storage **los);
848 void local_oid_storage_fini(const struct lu_env *env,
849 struct local_oid_storage *los);
850 int local_object_fid_generate(const struct lu_env *env,
851 struct local_oid_storage *los,
853 int local_object_declare_create(const struct lu_env *env,
854 struct local_oid_storage *los,
856 struct lu_attr *attr,
857 struct dt_object_format *dof,
859 int local_object_create(const struct lu_env *env,
860 struct local_oid_storage *los,
862 struct lu_attr *attr, struct dt_object_format *dof,
864 struct dt_object *local_file_find_or_create(const struct lu_env *env,
865 struct local_oid_storage *los,
866 struct dt_object *parent,
867 const char *name, __u32 mode);
868 struct dt_object *local_file_find_or_create_with_fid(const struct lu_env *env,
869 struct dt_device *dt,
870 const struct lu_fid *fid,
871 struct dt_object *parent,
875 local_index_find_or_create(const struct lu_env *env,
876 struct local_oid_storage *los,
877 struct dt_object *parent,
878 const char *name, __u32 mode,
879 const struct dt_index_features *ft);
881 local_index_find_or_create_with_fid(const struct lu_env *env,
882 struct dt_device *dt,
883 const struct lu_fid *fid,
884 struct dt_object *parent,
885 const char *name, __u32 mode,
886 const struct dt_index_features *ft);
887 int local_object_unlink(const struct lu_env *env, struct dt_device *dt,
888 struct dt_object *parent, const char *name);
890 static inline int dt_object_lock(const struct lu_env *env,
891 struct dt_object *o, struct lustre_handle *lh,
892 struct ldlm_enqueue_info *einfo,
897 LASSERT(o->do_ops->do_object_lock);
898 return o->do_ops->do_object_lock(env, o, lh, einfo, policy);
901 int dt_lookup_dir(const struct lu_env *env, struct dt_object *dir,
902 const char *name, struct lu_fid *fid);
904 static inline int dt_object_sync(const struct lu_env *env, struct dt_object *o,
905 __u64 start, __u64 end)
909 LASSERT(o->do_ops->do_object_sync);
910 return o->do_ops->do_object_sync(env, o, start, end);
913 int dt_declare_version_set(const struct lu_env *env, struct dt_object *o,
915 void dt_version_set(const struct lu_env *env, struct dt_object *o,
916 dt_obj_version_t version, struct thandle *th);
917 dt_obj_version_t dt_version_get(const struct lu_env *env, struct dt_object *o);
920 int dt_read(const struct lu_env *env, struct dt_object *dt,
921 struct lu_buf *buf, loff_t *pos);
922 int dt_record_read(const struct lu_env *env, struct dt_object *dt,
923 struct lu_buf *buf, loff_t *pos);
924 int dt_record_write(const struct lu_env *env, struct dt_object *dt,
925 const struct lu_buf *buf, loff_t *pos, struct thandle *th);
926 typedef int (*dt_index_page_build_t)(const struct lu_env *env,
927 union lu_page *lp, int nob,
928 const struct dt_it_ops *iops,
929 struct dt_it *it, __u32 attr, void *arg);
930 int dt_index_walk(const struct lu_env *env, struct dt_object *obj,
931 const struct lu_rdpg *rdpg, dt_index_page_build_t filler,
933 int dt_index_read(const struct lu_env *env, struct dt_device *dev,
934 struct idx_info *ii, const struct lu_rdpg *rdpg);
936 static inline struct thandle *dt_trans_create(const struct lu_env *env,
939 LASSERT(d->dd_ops->dt_trans_create);
940 return d->dd_ops->dt_trans_create(env, d);
943 static inline int dt_trans_start(const struct lu_env *env,
944 struct dt_device *d, struct thandle *th)
946 LASSERT(d->dd_ops->dt_trans_start);
947 return d->dd_ops->dt_trans_start(env, d, th);
950 /* for this transaction hooks shouldn't be called */
951 static inline int dt_trans_start_local(const struct lu_env *env,
952 struct dt_device *d, struct thandle *th)
954 LASSERT(d->dd_ops->dt_trans_start);
956 return d->dd_ops->dt_trans_start(env, d, th);
959 static inline int dt_trans_stop(const struct lu_env *env,
960 struct dt_device *d, struct thandle *th)
962 LASSERT(d->dd_ops->dt_trans_stop);
963 return d->dd_ops->dt_trans_stop(env, th);
966 static inline int dt_trans_cb_add(struct thandle *th,
967 struct dt_txn_commit_cb *dcb)
969 LASSERT(th->th_dev->dd_ops->dt_trans_cb_add);
970 dcb->dcb_magic = TRANS_COMMIT_CB_MAGIC;
971 return th->th_dev->dd_ops->dt_trans_cb_add(th, dcb);
976 static inline int dt_declare_record_write(const struct lu_env *env,
977 struct dt_object *dt,
978 int size, loff_t pos,
983 LASSERTF(dt != NULL, "dt is NULL when we want to write record\n");
985 LASSERT(dt->do_body_ops);
986 LASSERT(dt->do_body_ops->dbo_declare_write);
987 rc = dt->do_body_ops->dbo_declare_write(env, dt, size, pos, th);
991 static inline int dt_declare_create(const struct lu_env *env,
992 struct dt_object *dt,
993 struct lu_attr *attr,
994 struct dt_allocation_hint *hint,
995 struct dt_object_format *dof,
1000 LASSERT(dt->do_ops->do_declare_create);
1001 return dt->do_ops->do_declare_create(env, dt, attr, hint, dof, th);
1004 static inline int dt_create(const struct lu_env *env,
1005 struct dt_object *dt,
1006 struct lu_attr *attr,
1007 struct dt_allocation_hint *hint,
1008 struct dt_object_format *dof,
1012 LASSERT(dt->do_ops);
1013 LASSERT(dt->do_ops->do_create);
1014 return dt->do_ops->do_create(env, dt, attr, hint, dof, th);
1017 static inline int dt_declare_destroy(const struct lu_env *env,
1018 struct dt_object *dt,
1022 LASSERT(dt->do_ops);
1023 LASSERT(dt->do_ops->do_declare_destroy);
1024 return dt->do_ops->do_declare_destroy(env, dt, th);
1027 static inline int dt_destroy(const struct lu_env *env,
1028 struct dt_object *dt,
1032 LASSERT(dt->do_ops);
1033 LASSERT(dt->do_ops->do_destroy);
1034 return dt->do_ops->do_destroy(env, dt, th);
1037 static inline void dt_read_lock(const struct lu_env *env,
1038 struct dt_object *dt,
1042 LASSERT(dt->do_ops);
1043 LASSERT(dt->do_ops->do_read_lock);
1044 dt->do_ops->do_read_lock(env, dt, role);
1047 static inline void dt_write_lock(const struct lu_env *env,
1048 struct dt_object *dt,
1052 LASSERT(dt->do_ops);
1053 LASSERT(dt->do_ops->do_write_lock);
1054 dt->do_ops->do_write_lock(env, dt, role);
1057 static inline void dt_read_unlock(const struct lu_env *env,
1058 struct dt_object *dt)
1061 LASSERT(dt->do_ops);
1062 LASSERT(dt->do_ops->do_read_unlock);
1063 dt->do_ops->do_read_unlock(env, dt);
1066 static inline void dt_write_unlock(const struct lu_env *env,
1067 struct dt_object *dt)
1070 LASSERT(dt->do_ops);
1071 LASSERT(dt->do_ops->do_write_unlock);
1072 dt->do_ops->do_write_unlock(env, dt);
1075 static inline int dt_write_locked(const struct lu_env *env,
1076 struct dt_object *dt)
1079 LASSERT(dt->do_ops);
1080 LASSERT(dt->do_ops->do_write_locked);
1081 return dt->do_ops->do_write_locked(env, dt);
1084 static inline int dt_attr_get(const struct lu_env *env, struct dt_object *dt,
1085 struct lu_attr *la, void *arg)
1088 LASSERT(dt->do_ops);
1089 LASSERT(dt->do_ops->do_attr_get);
1090 return dt->do_ops->do_attr_get(env, dt, la, arg);
1093 static inline int dt_declare_attr_set(const struct lu_env *env,
1094 struct dt_object *dt,
1095 const struct lu_attr *la,
1099 LASSERT(dt->do_ops);
1100 LASSERT(dt->do_ops->do_declare_attr_set);
1101 return dt->do_ops->do_declare_attr_set(env, dt, la, th);
1104 static inline int dt_attr_set(const struct lu_env *env, struct dt_object *dt,
1105 const struct lu_attr *la, struct thandle *th,
1106 struct lustre_capa *capa)
1109 LASSERT(dt->do_ops);
1110 LASSERT(dt->do_ops->do_attr_set);
1111 return dt->do_ops->do_attr_set(env, dt, la, th, capa);
1114 static inline int dt_declare_ref_add(const struct lu_env *env,
1115 struct dt_object *dt, struct thandle *th)
1118 LASSERT(dt->do_ops);
1119 LASSERT(dt->do_ops->do_declare_ref_add);
1120 return dt->do_ops->do_declare_ref_add(env, dt, th);
1123 static inline int dt_ref_add(const struct lu_env *env,
1124 struct dt_object *dt, struct thandle *th)
1127 LASSERT(dt->do_ops);
1128 LASSERT(dt->do_ops->do_ref_add);
1129 return dt->do_ops->do_ref_add(env, dt, th);
1132 static inline int dt_declare_ref_del(const struct lu_env *env,
1133 struct dt_object *dt, struct thandle *th)
1136 LASSERT(dt->do_ops);
1137 LASSERT(dt->do_ops->do_declare_ref_del);
1138 return dt->do_ops->do_declare_ref_del(env, dt, th);
1141 static inline int dt_ref_del(const struct lu_env *env,
1142 struct dt_object *dt, struct thandle *th)
1145 LASSERT(dt->do_ops);
1146 LASSERT(dt->do_ops->do_ref_del);
1147 return dt->do_ops->do_ref_del(env, dt, th);
1150 static inline struct obd_capa *dt_capa_get(const struct lu_env *env,
1151 struct dt_object *dt,
1152 struct lustre_capa *old, __u64 opc)
1155 LASSERT(dt->do_ops);
1156 LASSERT(dt->do_ops->do_ref_del);
1157 return dt->do_ops->do_capa_get(env, dt, old, opc);
1160 static inline int dt_bufs_get(const struct lu_env *env, struct dt_object *d,
1161 struct niobuf_remote *rnb,
1162 struct niobuf_local *lnb, int rw,
1163 struct lustre_capa *capa)
1166 LASSERT(d->do_body_ops);
1167 LASSERT(d->do_body_ops->dbo_bufs_get);
1168 return d->do_body_ops->dbo_bufs_get(env, d, rnb->offset,
1169 rnb->len, lnb, rw, capa);
1172 static inline int dt_bufs_put(const struct lu_env *env, struct dt_object *d,
1173 struct niobuf_local *lnb, int n)
1176 LASSERT(d->do_body_ops);
1177 LASSERT(d->do_body_ops->dbo_bufs_put);
1178 return d->do_body_ops->dbo_bufs_put(env, d, lnb, n);
1181 static inline int dt_write_prep(const struct lu_env *env, struct dt_object *d,
1182 struct niobuf_local *lnb, int n)
1185 LASSERT(d->do_body_ops);
1186 LASSERT(d->do_body_ops->dbo_write_prep);
1187 return d->do_body_ops->dbo_write_prep(env, d, lnb, n);
1190 static inline int dt_declare_write_commit(const struct lu_env *env,
1191 struct dt_object *d,
1192 struct niobuf_local *lnb,
1193 int n, struct thandle *th)
1195 LASSERTF(d != NULL, "dt is NULL when we want to declare write\n");
1196 LASSERT(th != NULL);
1197 return d->do_body_ops->dbo_declare_write_commit(env, d, lnb, n, th);
1201 static inline int dt_write_commit(const struct lu_env *env,
1202 struct dt_object *d, struct niobuf_local *lnb,
1203 int n, struct thandle *th)
1206 LASSERT(d->do_body_ops);
1207 LASSERT(d->do_body_ops->dbo_write_commit);
1208 return d->do_body_ops->dbo_write_commit(env, d, lnb, n, th);
1211 static inline int dt_read_prep(const struct lu_env *env, struct dt_object *d,
1212 struct niobuf_local *lnb, int n)
1215 LASSERT(d->do_body_ops);
1216 LASSERT(d->do_body_ops->dbo_read_prep);
1217 return d->do_body_ops->dbo_read_prep(env, d, lnb, n);
1220 static inline int dt_declare_punch(const struct lu_env *env,
1221 struct dt_object *dt, __u64 start,
1222 __u64 end, struct thandle *th)
1225 LASSERT(dt->do_body_ops);
1226 LASSERT(dt->do_body_ops->dbo_declare_punch);
1227 return dt->do_body_ops->dbo_declare_punch(env, dt, start, end, th);
1230 static inline int dt_punch(const struct lu_env *env, struct dt_object *dt,
1231 __u64 start, __u64 end, struct thandle *th,
1232 struct lustre_capa *capa)
1235 LASSERT(dt->do_body_ops);
1236 LASSERT(dt->do_body_ops->dbo_punch);
1237 return dt->do_body_ops->dbo_punch(env, dt, start, end, th, capa);
/**
 * Invoke the dbo_fiemap_get method of \a d's body operations, passing
 * \a env, \a d and \a fm through unchanged.
 *
 * Unlike the neighbouring wrappers, a NULL do_body_ops table or a NULL
 * dbo_fiemap_get pointer is tested with a plain "if" rather than with
 * LASSERT.
 * NOTE(review): the statements guarded by the two "if" tests are not
 * visible here - confirm what is returned in each case.
 *
 * \retval the value returned by dbo_fiemap_get when both tests pass
 */
1240 static inline int dt_fiemap_get(const struct lu_env *env, struct dt_object *d,
1241 struct ll_user_fiemap *fm)
1244 if (d->do_body_ops == NULL)
1246 if (d->do_body_ops->dbo_fiemap_get == NULL)
1248 return d->do_body_ops->dbo_fiemap_get(env, d, fm);
1251 static inline int dt_statfs(const struct lu_env *env, struct dt_device *dev,
1252 struct obd_statfs *osfs)
1255 LASSERT(dev->dd_ops);
1256 LASSERT(dev->dd_ops->dt_statfs);
1257 return dev->dd_ops->dt_statfs(env, dev, osfs);
/**
 * Invoke the dt_root_get method of \a dev's device operations (dd_ops),
 * passing \a env, \a dev and \a f through unchanged.
 *
 * Both dd_ops and the method pointer are checked with LASSERT first.
 * NOTE(review): the declaration of \a f is not visible here - confirm
 * its type against the full header.
 *
 * \retval the value returned by the dt_root_get method
 */
1260 static inline int dt_root_get(const struct lu_env *env, struct dt_device *dev,
1264 LASSERT(dev->dd_ops);
1265 LASSERT(dev->dd_ops->dt_root_get);
1266 return dev->dd_ops->dt_root_get(env, dev, f);
1269 static inline void dt_conf_get(const struct lu_env *env,
1270 const struct dt_device *dev,
1271 struct dt_device_param *param)
1274 LASSERT(dev->dd_ops);
1275 LASSERT(dev->dd_ops->dt_conf_get);
1276 return dev->dd_ops->dt_conf_get(env, dev, param);
1279 static inline int dt_sync(const struct lu_env *env, struct dt_device *dev)
1282 LASSERT(dev->dd_ops);
1283 LASSERT(dev->dd_ops->dt_sync);
1284 return dev->dd_ops->dt_sync(env, dev);
1287 static inline int dt_ro(const struct lu_env *env, struct dt_device *dev)
1290 LASSERT(dev->dd_ops);
1291 LASSERT(dev->dd_ops->dt_ro);
1292 return dev->dd_ops->dt_ro(env, dev);
/**
 * Invoke the dio_declare_insert method of \a dt's index operations
 * (do_index_ops), passing \a env, \a dt, \a rec, \a key and \a th
 * through unchanged.
 *
 * Both do_index_ops and the method pointer are checked with LASSERT
 * first.
 * NOTE(review): the declaration of \a th is not visible here - confirm
 * it against the full header.
 *
 * \retval the value returned by dio_declare_insert
 */
1295 static inline int dt_declare_insert(const struct lu_env *env,
1296 struct dt_object *dt,
1297 const struct dt_rec *rec,
1298 const struct dt_key *key,
1302 LASSERT(dt->do_index_ops);
1303 LASSERT(dt->do_index_ops->dio_declare_insert);
1304 return dt->do_index_ops->dio_declare_insert(env, dt, rec, key, th);
/**
 * Invoke the dio_insert method of \a dt's index operations
 * (do_index_ops).  \a env, \a dt, \a rec, \a key and \a th are the
 * leading arguments of the call.
 *
 * Both do_index_ops and the method pointer are checked with LASSERT
 * first.
 * NOTE(review): the declaration of \a th, any parameter following
 * \a capa, and the trailing arguments of the dio_insert call are not
 * visible here - confirm them against the full header.
 *
 * \retval the value returned by dio_insert
 */
1307 static inline int dt_insert(const struct lu_env *env,
1308 struct dt_object *dt,
1309 const struct dt_rec *rec,
1310 const struct dt_key *key,
1312 struct lustre_capa *capa,
1316 LASSERT(dt->do_index_ops);
1317 LASSERT(dt->do_index_ops->dio_insert);
1318 return dt->do_index_ops->dio_insert(env, dt, rec, key, th,
/**
 * Invoke the do_declare_xattr_del method of \a dt's object operations
 * (do_ops), passing \a env, \a dt, \a name and \a th through unchanged.
 *
 * Both do_ops and the method pointer are checked with LASSERT first.
 * NOTE(review): the declarations of \a name and \a th are not visible
 * here - confirm them against the full header.
 *
 * \retval the value returned by do_declare_xattr_del
 */
1322 static inline int dt_declare_xattr_del(const struct lu_env *env,
1323 struct dt_object *dt,
1328 LASSERT(dt->do_ops);
1329 LASSERT(dt->do_ops->do_declare_xattr_del);
1330 return dt->do_ops->do_declare_xattr_del(env, dt, name, th);
/**
 * Invoke the do_xattr_del method of \a dt's object operations (do_ops),
 * passing \a env, \a dt, \a name, \a th and \a capa through unchanged.
 *
 * Both do_ops and the method pointer are checked with LASSERT first.
 * NOTE(review): the declaration of \a th is not visible here - confirm
 * it against the full header.
 *
 * \retval the value returned by do_xattr_del
 */
1333 static inline int dt_xattr_del(const struct lu_env *env,
1334 struct dt_object *dt, const char *name,
1336 struct lustre_capa *capa)
1339 LASSERT(dt->do_ops);
1340 LASSERT(dt->do_ops->do_xattr_del);
1341 return dt->do_ops->do_xattr_del(env, dt, name, th, capa);
/**
 * Invoke the do_declare_xattr_set method of \a dt's object operations
 * (do_ops), passing \a env, \a dt, \a buf, \a name, \a fl and \a th
 * through unchanged.
 *
 * Both do_ops and the method pointer are checked with LASSERT first.
 * NOTE(review): the declaration of \a th is not visible here - confirm
 * it against the full header.
 *
 * \retval the value returned by do_declare_xattr_set
 */
1344 static inline int dt_declare_xattr_set(const struct lu_env *env,
1345 struct dt_object *dt,
1346 const struct lu_buf *buf,
1347 const char *name, int fl,
1351 LASSERT(dt->do_ops);
1352 LASSERT(dt->do_ops->do_declare_xattr_set);
1353 return dt->do_ops->do_declare_xattr_set(env, dt, buf, name, fl, th);
1356 static inline int dt_xattr_set(const struct lu_env *env,
1357 struct dt_object *dt, const struct lu_buf *buf,
1358 const char *name, int fl, struct thandle *th,
1359 struct lustre_capa *capa)
1362 LASSERT(dt->do_ops);
1363 LASSERT(dt->do_ops->do_xattr_set);
1364 return dt->do_ops->do_xattr_set(env, dt, buf, name, fl, th, capa);
1367 static inline int dt_xattr_get(const struct lu_env *env,
1368 struct dt_object *dt, struct lu_buf *buf,
1369 const char *name, struct lustre_capa *capa)
1372 LASSERT(dt->do_ops);
1373 LASSERT(dt->do_ops->do_xattr_get);
1374 return dt->do_ops->do_xattr_get(env, dt, buf, name, capa);
1377 static inline int dt_xattr_list(const struct lu_env *env,
1378 struct dt_object *dt, struct lu_buf *buf,
1379 struct lustre_capa *capa)
1382 LASSERT(dt->do_ops);
1383 LASSERT(dt->do_ops->do_xattr_list);
1384 return dt->do_ops->do_xattr_list(env, dt, buf, capa);
/**
 * Invoke the dio_declare_delete method of \a dt's index operations
 * (do_index_ops), passing \a env, \a dt, \a key and \a th through
 * unchanged.
 *
 * Both do_index_ops and the method pointer are checked with LASSERT
 * first.
 * NOTE(review): the declaration of \a th is not visible here - confirm
 * it against the full header.
 *
 * \retval the value returned by dio_declare_delete
 */
1387 static inline int dt_declare_delete(const struct lu_env *env,
1388 struct dt_object *dt,
1389 const struct dt_key *key,
1393 LASSERT(dt->do_index_ops);
1394 LASSERT(dt->do_index_ops->dio_declare_delete);
1395 return dt->do_index_ops->dio_declare_delete(env, dt, key, th);
/**
 * Invoke the dio_delete method of \a dt's index operations
 * (do_index_ops), passing \a env, \a dt, \a key, \a th and \a capa
 * through unchanged.
 *
 * Both do_index_ops and the method pointer are checked with LASSERT
 * first.
 * NOTE(review): the declaration of \a th is not visible here - confirm
 * it against the full header.
 *
 * \retval the value returned by dio_delete
 */
1398 static inline int dt_delete(const struct lu_env *env,
1399 struct dt_object *dt,
1400 const struct dt_key *key,
1402 struct lustre_capa *capa)
1405 LASSERT(dt->do_index_ops);
1406 LASSERT(dt->do_index_ops->dio_delete);
1407 return dt->do_index_ops->dio_delete(env, dt, key, th, capa);
1410 static inline int dt_commit_async(const struct lu_env *env,
1411 struct dt_device *dev)
1414 LASSERT(dev->dd_ops);
1415 LASSERT(dev->dd_ops->dt_commit_async);
1416 return dev->dd_ops->dt_commit_async(env, dev);
1419 static inline int dt_init_capa_ctxt(const struct lu_env *env,
1420 struct dt_device *dev,
1421 int mode, unsigned long timeout,
1422 __u32 alg, struct lustre_capa_key *keys)
1425 LASSERT(dev->dd_ops);
1426 LASSERT(dev->dd_ops->dt_init_capa_ctxt);
1427 return dev->dd_ops->dt_init_capa_ctxt(env, dev, mode,
1428 timeout, alg, keys);
/**
 * Call the dio_lookup method of \a dt's index operations (do_index_ops)
 * with \a env, \a dt, \a rec, \a key and \a capa, storing the result in
 * the local "ret".
 *
 * Both do_index_ops and the method pointer are checked with LASSERT
 * first.
 * NOTE(review): the declarations of \a rec and "ret", and whatever is
 * done with "ret" after the call (including the value finally returned),
 * are not visible here - confirm them against the full header.
 */
1431 static inline int dt_lookup(const struct lu_env *env,
1432 struct dt_object *dt,
1434 const struct dt_key *key,
1435 struct lustre_capa *capa)
1440 LASSERT(dt->do_index_ops);
1441 LASSERT(dt->do_index_ops->dio_lookup);
1443 ret = dt->do_index_ops->dio_lookup(env, dt, rec, key, capa);
/*
 * Unsigned constant: 0x80000000U plus 24 * 3600 (= 86400).
 * NOTE(review): presumably a timestamp threshold in seconds (2^31 plus
 * one day) tied to ticket LU-221 - confirm the intended meaning with the
 * code that uses it.
 */
1451 #define LU221_BAD_TIME (0x80000000U + 24 * 3600)
/**
 * Bundle of three pointers: a fid (dfh_fid), a dt device (dfh_dt) and a
 * dt object (dfh_o).  Embedded in struct dt_thread_info as dti_dfh.
 * NOTE(review): presumably input (fid, device) and output (object) of an
 * object search - confirm against the code that fills it in.
 */
1453 struct dt_find_hint {
1454 struct lu_fid *dfh_fid;
1455 struct dt_device *dfh_dt;
1456 struct dt_object *dfh_o;
/**
 * Data block that dt_info() obtains from an lu_env context under dt_key.
 * It holds a DT_MAX_PATH-sized character buffer plus one instance each
 * of the find hint, attribute, fid, object format, LMA and lu_buf types.
 * NOTE(review): the member list may be incomplete in this excerpt -
 * confirm against the full header before relying on the layout.
 */
1459 struct dt_thread_info {
1460 char dti_buf[DT_MAX_PATH];
1461 struct dt_find_hint dti_dfh;
1462 struct lu_attr dti_attr;
1463 struct lu_fid dti_fid;
1464 struct dt_object_format dti_dof;
1465 struct lustre_mdt_attrs dti_lma;
1466 struct lu_buf dti_lb;
/* Context key that dt_info() passes to lu_context_key_get(); defined elsewhere. */
1470 extern struct lu_context_key dt_key;
/**
 * Look up the struct dt_thread_info stored in \a env's context
 * (env->le_ctx) under dt_key, using lu_context_key_get().
 * NOTE(review): the rest of the body (any check on the result and the
 * return statement) is not visible here - confirm against the full
 * header.
 */
1472 static inline struct dt_thread_info *dt_info(const struct lu_env *env)
1474 struct dt_thread_info *dti;
1476 dti = lu_context_key_get(&env->le_ctx, &dt_key);
/*
 * Global setup/teardown entry points, defined elsewhere.
 * dt_global_init() takes no arguments and returns an int;
 * dt_global_fini() takes no arguments and returns nothing.
 * NOTE(review): presumably 0 / negative errno on init - confirm in the
 * implementation.
 */
1481 int dt_global_init(void);
1482 void dt_global_fini(void);
/*
 * Read handlers declared only when CONFIG_PROC_FS is defined.  All six
 * share one signature: (page, start, off, count, eof, data) -> int.
 * NOTE(review): going by the names, they report block size, total/free/
 * available kilobytes and total/free file counts of a dt device -
 * confirm against the implementations.
 */
1484 #if defined (CONFIG_PROC_FS)
1485 int lprocfs_dt_rd_blksize(char *page, char **start, off_t off,
1486 int count, int *eof, void *data);
1487 int lprocfs_dt_rd_kbytestotal(char *page, char **start, off_t off,
1488 int count, int *eof, void *data);
1489 int lprocfs_dt_rd_kbytesfree(char *page, char **start, off_t off,
1490 int count, int *eof, void *data);
1491 int lprocfs_dt_rd_kbytesavail(char *page, char **start, off_t off,
1492 int count, int *eof, void *data);
1493 int lprocfs_dt_rd_filestotal(char *page, char **start, off_t off,
1494 int count, int *eof, void *data);
1495 int lprocfs_dt_rd_filesfree(char *page, char **start, off_t off,
1496 int count, int *eof, void *data);
1497 #endif /* CONFIG_PROC_FS */
1499 #endif /* __LUSTRE_DT_OBJECT_H */