xref: /linux/fs/ceph/export.c (revision 71901cc4109b3794b863884e348aff3c71e693cc)
1 #include "ceph_debug.h"
2 
3 #include <linux/exportfs.h>
4 #include <linux/slab.h>
5 #include <asm/unaligned.h>
6 
7 #include "super.h"
8 
/*
 * NFS export support
 *
 * NFS re-export of a ceph mount is, at present, only semireliable.
 * The basic issue is that the Ceph architecture doesn't lend itself
 * well to generating filehandles that will remain valid forever.
 *
 * So, we do our best.  If you're lucky, your inode will be in the
 * client's cache.  If it's not, and you have a connectable fh, then
 * the MDS server may be able to find it for you.  Otherwise, you get
 * ESTALE.
 *
 * There are ways to make this more reliable, but in the non-connectable
 * fh case, it won't ever work perfectly, and in the connectable case,
 * some changes are needed on the MDS side to work better.
 */
25 
/*
 * Basic fh
 *
 * Carries only the inode number.  ceph_encode_fh() emits this form
 * (fh type 1) when the caller's buffer is too small for the
 * connectable variant.  Packed, so the handle is exactly
 * sizeof(u64) bytes (two 32-bit words).
 */
struct ceph_nfs_fh {
	u64 ino;
} __attribute__ ((packed));
32 
33 /*
34  * Larger 'connectable' fh that includes parent ino and name hash.
35  * Use this whenever possible, as it works more reliably.
36  */
37 struct ceph_nfs_confh {
38 	u64 ino, parent_ino;
39 	u32 parent_name_hash;
40 } __attribute__ ((packed));
41 
42 static int ceph_encode_fh(struct dentry *dentry, u32 *rawfh, int *max_len,
43 			  int connectable)
44 {
45 	int type;
46 	struct ceph_nfs_fh *fh = (void *)rawfh;
47 	struct ceph_nfs_confh *cfh = (void *)rawfh;
48 	struct dentry *parent = dentry->d_parent;
49 	struct inode *inode = dentry->d_inode;
50 	int connected_handle_length = sizeof(*cfh)/4;
51 	int handle_length = sizeof(*fh)/4;
52 
53 	/* don't re-export snaps */
54 	if (ceph_snap(inode) != CEPH_NOSNAP)
55 		return -EINVAL;
56 
57 	if (*max_len >= connected_handle_length) {
58 		dout("encode_fh %p connectable\n", dentry);
59 		cfh->ino = ceph_ino(dentry->d_inode);
60 		cfh->parent_ino = ceph_ino(parent->d_inode);
61 		cfh->parent_name_hash = parent->d_name.hash;
62 		*max_len = connected_handle_length;
63 		type = 2;
64 	} else if (*max_len >= handle_length) {
65 		if (connectable) {
66 			*max_len = connected_handle_length;
67 			return 255;
68 		}
69 		dout("encode_fh %p\n", dentry);
70 		fh->ino = ceph_ino(dentry->d_inode);
71 		*max_len = handle_length;
72 		type = 1;
73 	} else {
74 		*max_len = handle_length;
75 		return 255;
76 	}
77 	return type;
78 }
79 
80 /*
81  * convert regular fh to dentry
82  *
83  * FIXME: we should try harder by querying the mds for the ino.
84  */
85 static struct dentry *__fh_to_dentry(struct super_block *sb,
86 				     struct ceph_nfs_fh *fh)
87 {
88 	struct inode *inode;
89 	struct dentry *dentry;
90 	struct ceph_vino vino;
91 	int err;
92 
93 	dout("__fh_to_dentry %llx\n", fh->ino);
94 	vino.ino = fh->ino;
95 	vino.snap = CEPH_NOSNAP;
96 	inode = ceph_find_inode(sb, vino);
97 	if (!inode)
98 		return ERR_PTR(-ESTALE);
99 
100 	dentry = d_obtain_alias(inode);
101 	if (IS_ERR(dentry)) {
102 		pr_err("fh_to_dentry %llx -- inode %p but ENOMEM\n",
103 		       fh->ino, inode);
104 		iput(inode);
105 		return dentry;
106 	}
107 	err = ceph_init_dentry(dentry);
108 
109 	if (err < 0) {
110 		iput(inode);
111 		return ERR_PTR(err);
112 	}
113 	dout("__fh_to_dentry %llx %p dentry %p\n", fh->ino, inode, dentry);
114 	return dentry;
115 }
116 
117 /*
118  * convert connectable fh to dentry
119  */
120 static struct dentry *__cfh_to_dentry(struct super_block *sb,
121 				      struct ceph_nfs_confh *cfh)
122 {
123 	struct ceph_mds_client *mdsc = &ceph_sb_to_client(sb)->mdsc;
124 	struct inode *inode;
125 	struct dentry *dentry;
126 	struct ceph_vino vino;
127 	int err;
128 
129 	dout("__cfh_to_dentry %llx (%llx/%x)\n",
130 	     cfh->ino, cfh->parent_ino, cfh->parent_name_hash);
131 
132 	vino.ino = cfh->ino;
133 	vino.snap = CEPH_NOSNAP;
134 	inode = ceph_find_inode(sb, vino);
135 	if (!inode) {
136 		struct ceph_mds_request *req;
137 
138 		req = ceph_mdsc_create_request(mdsc, CEPH_MDS_OP_LOOKUPHASH,
139 					       USE_ANY_MDS);
140 		if (IS_ERR(req))
141 			return ERR_CAST(req);
142 
143 		req->r_ino1 = vino;
144 		req->r_ino2.ino = cfh->parent_ino;
145 		req->r_ino2.snap = CEPH_NOSNAP;
146 		req->r_path2 = kmalloc(16, GFP_NOFS);
147 		snprintf(req->r_path2, 16, "%d", cfh->parent_name_hash);
148 		req->r_num_caps = 1;
149 		err = ceph_mdsc_do_request(mdsc, NULL, req);
150 		ceph_mdsc_put_request(req);
151 		inode = ceph_find_inode(sb, vino);
152 		if (!inode)
153 			return ERR_PTR(err ? err : -ESTALE);
154 	}
155 
156 	dentry = d_obtain_alias(inode);
157 	if (IS_ERR(dentry)) {
158 		pr_err("cfh_to_dentry %llx -- inode %p but ENOMEM\n",
159 		       cfh->ino, inode);
160 		iput(inode);
161 		return dentry;
162 	}
163 	err = ceph_init_dentry(dentry);
164 	if (err < 0) {
165 		iput(inode);
166 		return ERR_PTR(err);
167 	}
168 	dout("__cfh_to_dentry %llx %p dentry %p\n", cfh->ino, inode, dentry);
169 	return dentry;
170 }
171 
172 static struct dentry *ceph_fh_to_dentry(struct super_block *sb, struct fid *fid,
173 					int fh_len, int fh_type)
174 {
175 	if (fh_type == 1)
176 		return __fh_to_dentry(sb, (struct ceph_nfs_fh *)fid->raw);
177 	else
178 		return __cfh_to_dentry(sb, (struct ceph_nfs_confh *)fid->raw);
179 }
180 
181 /*
182  * get parent, if possible.
183  *
184  * FIXME: we could do better by querying the mds to discover the
185  * parent.
186  */
187 static struct dentry *ceph_fh_to_parent(struct super_block *sb,
188 					 struct fid *fid,
189 					int fh_len, int fh_type)
190 {
191 	struct ceph_nfs_confh *cfh = (void *)fid->raw;
192 	struct ceph_vino vino;
193 	struct inode *inode;
194 	struct dentry *dentry;
195 	int err;
196 
197 	if (fh_type == 1)
198 		return ERR_PTR(-ESTALE);
199 
200 	pr_debug("fh_to_parent %llx/%d\n", cfh->parent_ino,
201 		 cfh->parent_name_hash);
202 
203 	vino.ino = cfh->ino;
204 	vino.snap = CEPH_NOSNAP;
205 	inode = ceph_find_inode(sb, vino);
206 	if (!inode)
207 		return ERR_PTR(-ESTALE);
208 
209 	dentry = d_obtain_alias(inode);
210 	if (IS_ERR(dentry)) {
211 		pr_err("fh_to_parent %llx -- inode %p but ENOMEM\n",
212 		       cfh->ino, inode);
213 		iput(inode);
214 		return dentry;
215 	}
216 	err = ceph_init_dentry(dentry);
217 	if (err < 0) {
218 		iput(inode);
219 		return ERR_PTR(err);
220 	}
221 	dout("fh_to_parent %llx %p dentry %p\n", cfh->ino, inode, dentry);
222 	return dentry;
223 }
224 
225 const struct export_operations ceph_export_ops = {
226 	.encode_fh = ceph_encode_fh,
227 	.fh_to_dentry = ceph_fh_to_dentry,
228 	.fh_to_parent = ceph_fh_to_parent,
229 };
230