blob: 58558e37fb8ab9ab09ab168fb4a7deb002d26ed3 [file] [log] [blame]
/*
 * (C) 2001 Clemson University and The University of Chicago
 *
 * See COPYING in top-level directory.
 */
6
7#include "protocol.h"
Mike Marshall575e9462015-12-04 12:56:14 -05008#include "orangefs-kernel.h"
9#include "orangefs-bufmap.h"
Mike Marshall5db11c22015-07-17 10:38:12 -040010
11struct readdir_handle_s {
12 int buffer_index;
Yi Liu8bb8aef2015-11-24 15:12:14 -050013 struct orangefs_readdir_response_s readdir_response;
Mike Marshall5db11c22015-07-17 10:38:12 -040014 void *dents_buf;
15};
16
17/*
18 * decode routine needed by kmod to make sense of the shared page for readdirs.
19 */
Al Viro80928952015-10-09 18:11:10 -040020static long decode_dirents(char *ptr, size_t size,
Yi Liu8bb8aef2015-11-24 15:12:14 -050021 struct orangefs_readdir_response_s *readdir)
Mike Marshall5db11c22015-07-17 10:38:12 -040022{
23 int i;
Yi Liu8bb8aef2015-11-24 15:12:14 -050024 struct orangefs_readdir_response_s *rd =
25 (struct orangefs_readdir_response_s *) ptr;
Mike Marshall5db11c22015-07-17 10:38:12 -040026 char *buf = ptr;
Mike Marshall5db11c22015-07-17 10:38:12 -040027
Yi Liu8bb8aef2015-11-24 15:12:14 -050028 if (size < offsetof(struct orangefs_readdir_response_s, dirent_array))
Al Viro80928952015-10-09 18:11:10 -040029 return -EINVAL;
30
Mike Marshall5db11c22015-07-17 10:38:12 -040031 readdir->token = rd->token;
Yi Liu8bb8aef2015-11-24 15:12:14 -050032 readdir->orangefs_dirent_outcount = rd->orangefs_dirent_outcount;
33 readdir->dirent_array = kcalloc(readdir->orangefs_dirent_outcount,
Mike Marshall5db11c22015-07-17 10:38:12 -040034 sizeof(*readdir->dirent_array),
35 GFP_KERNEL);
36 if (readdir->dirent_array == NULL)
37 return -ENOMEM;
Al Viro80928952015-10-09 18:11:10 -040038
Yi Liu8bb8aef2015-11-24 15:12:14 -050039 buf += offsetof(struct orangefs_readdir_response_s, dirent_array);
40 size -= offsetof(struct orangefs_readdir_response_s, dirent_array);
Al Viro80928952015-10-09 18:11:10 -040041
Yi Liu8bb8aef2015-11-24 15:12:14 -050042 for (i = 0; i < readdir->orangefs_dirent_outcount; i++) {
Al Viro80928952015-10-09 18:11:10 -040043 __u32 len;
44
45 if (size < 4)
46 goto Einval;
47
48 len = *(__u32 *)buf;
49 if (len >= (unsigned)-24)
50 goto Einval;
51
Al Viro9be68b02015-10-09 17:43:15 -040052 readdir->dirent_array[i].d_name = buf + 4;
Al Viro9be68b02015-10-09 17:43:15 -040053 readdir->dirent_array[i].d_length = len;
Al Viro80928952015-10-09 18:11:10 -040054
Martin Brandenburg7d221482016-01-04 15:05:28 -050055 /*
56 * Round 4 + len + 1, which is the encoded size plus the string
57 * plus the null terminator to the nearest eight byte boundry.
58 */
59 len = ((4 + len + 1) + 7) & ~7;
Al Viro80928952015-10-09 18:11:10 -040060 if (size < len + 16)
61 goto Einval;
62 size -= len + 16;
63
64 buf += len;
65
Mike Marshall5db11c22015-07-17 10:38:12 -040066 readdir->dirent_array[i].khandle =
Yi Liu8bb8aef2015-11-24 15:12:14 -050067 *(struct orangefs_khandle *) buf;
Al Viro9be68b02015-10-09 17:43:15 -040068 buf += 16;
Mike Marshall5db11c22015-07-17 10:38:12 -040069 }
Al Viro9be68b02015-10-09 17:43:15 -040070 return buf - ptr;
Al Viro80928952015-10-09 18:11:10 -040071Einval:
72 kfree(readdir->dirent_array);
73 readdir->dirent_array = NULL;
74 return -EINVAL;
Mike Marshall5db11c22015-07-17 10:38:12 -040075}
76
77static long readdir_handle_ctor(struct readdir_handle_s *rhandle, void *buf,
Al Viro80928952015-10-09 18:11:10 -040078 size_t size, int buffer_index)
Mike Marshall5db11c22015-07-17 10:38:12 -040079{
80 long ret;
81
82 if (buf == NULL) {
83 gossip_err
84 ("Invalid NULL buffer specified in readdir_handle_ctor\n");
85 return -ENOMEM;
86 }
87 if (buffer_index < 0) {
88 gossip_err
89 ("Invalid buffer index specified in readdir_handle_ctor\n");
90 return -EINVAL;
91 }
92 rhandle->buffer_index = buffer_index;
93 rhandle->dents_buf = buf;
Al Viro80928952015-10-09 18:11:10 -040094 ret = decode_dirents(buf, size, &rhandle->readdir_response);
Mike Marshall5db11c22015-07-17 10:38:12 -040095 if (ret < 0) {
96 gossip_err("Could not decode readdir from buffer %ld\n", ret);
97 rhandle->buffer_index = -1;
98 gossip_debug(GOSSIP_DIR_DEBUG, "vfree %p\n", buf);
99 vfree(buf);
100 rhandle->dents_buf = NULL;
101 }
102 return ret;
103}
104
Yi Liu8bb8aef2015-11-24 15:12:14 -0500105static void readdir_handle_dtor(struct orangefs_bufmap *bufmap,
Mike Marshall5db11c22015-07-17 10:38:12 -0400106 struct readdir_handle_s *rhandle)
107{
108 if (rhandle == NULL)
109 return;
110
111 /* kfree(NULL) is safe */
112 kfree(rhandle->readdir_response.dirent_array);
113 rhandle->readdir_response.dirent_array = NULL;
114
115 if (rhandle->buffer_index >= 0) {
Martin Brandenburg7d221482016-01-04 15:05:28 -0500116 orangefs_readdir_index_put(bufmap, rhandle->buffer_index);
Mike Marshall5db11c22015-07-17 10:38:12 -0400117 rhandle->buffer_index = -1;
118 }
119 if (rhandle->dents_buf) {
120 gossip_debug(GOSSIP_DIR_DEBUG, "vfree %p\n",
121 rhandle->dents_buf);
122 vfree(rhandle->dents_buf);
123 rhandle->dents_buf = NULL;
124 }
125}
126
127/*
128 * Read directory entries from an instance of an open directory.
Mike Marshall5db11c22015-07-17 10:38:12 -0400129 */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500130static int orangefs_readdir(struct file *file, struct dir_context *ctx)
Mike Marshall5db11c22015-07-17 10:38:12 -0400131{
Yi Liu8bb8aef2015-11-24 15:12:14 -0500132 struct orangefs_bufmap *bufmap = NULL;
Mike Marshall5db11c22015-07-17 10:38:12 -0400133 int ret = 0;
134 int buffer_index;
Mike Marshall88309aa2015-09-23 16:48:40 -0400135 /*
136 * ptoken supports Orangefs' distributed directory logic, added
137 * in 2.9.2.
138 */
Mike Marshall5db11c22015-07-17 10:38:12 -0400139 __u64 *ptoken = file->private_data;
140 __u64 pos = 0;
141 ino_t ino = 0;
142 struct dentry *dentry = file->f_path.dentry;
Yi Liu8bb8aef2015-11-24 15:12:14 -0500143 struct orangefs_kernel_op_s *new_op = NULL;
144 struct orangefs_inode_s *orangefs_inode = ORANGEFS_I(dentry->d_inode);
Mike Marshall5db11c22015-07-17 10:38:12 -0400145 int buffer_full = 0;
146 struct readdir_handle_s rhandle;
147 int i = 0;
148 int len = 0;
149 ino_t current_ino = 0;
150 char *current_entry = NULL;
151 long bytes_decoded;
152
Mike Marshall88309aa2015-09-23 16:48:40 -0400153 gossip_debug(GOSSIP_DIR_DEBUG,
154 "%s: ctx->pos:%lld, ptoken = %llu\n",
155 __func__,
156 lld(ctx->pos),
157 llu(*ptoken));
Mike Marshall5db11c22015-07-17 10:38:12 -0400158
159 pos = (__u64) ctx->pos;
160
161 /* are we done? */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500162 if (pos == ORANGEFS_READDIR_END) {
Mike Marshall5db11c22015-07-17 10:38:12 -0400163 gossip_debug(GOSSIP_DIR_DEBUG,
164 "Skipping to termination path\n");
165 return 0;
166 }
167
168 gossip_debug(GOSSIP_DIR_DEBUG,
Yi Liu8bb8aef2015-11-24 15:12:14 -0500169 "orangefs_readdir called on %s (pos=%llu)\n",
Mike Marshall5db11c22015-07-17 10:38:12 -0400170 dentry->d_name.name, llu(pos));
171
172 rhandle.buffer_index = -1;
173 rhandle.dents_buf = NULL;
174 memset(&rhandle.readdir_response, 0, sizeof(rhandle.readdir_response));
175
Yi Liu8bb8aef2015-11-24 15:12:14 -0500176 new_op = op_alloc(ORANGEFS_VFS_OP_READDIR);
Mike Marshall5db11c22015-07-17 10:38:12 -0400177 if (!new_op)
178 return -ENOMEM;
179
180 new_op->uses_shared_memory = 1;
Yi Liu8bb8aef2015-11-24 15:12:14 -0500181 new_op->upcall.req.readdir.refn = orangefs_inode->refn;
Martin Brandenburg7d221482016-01-04 15:05:28 -0500182 new_op->upcall.req.readdir.max_dirent_count =
183 ORANGEFS_MAX_DIRENT_COUNT_READDIR;
Mike Marshall5db11c22015-07-17 10:38:12 -0400184
185 gossip_debug(GOSSIP_DIR_DEBUG,
186 "%s: upcall.req.readdir.refn.khandle: %pU\n",
187 __func__,
188 &new_op->upcall.req.readdir.refn.khandle);
189
Mike Marshall5db11c22015-07-17 10:38:12 -0400190 new_op->upcall.req.readdir.token = *ptoken;
191
192get_new_buffer_index:
Martin Brandenburg7d221482016-01-04 15:05:28 -0500193 ret = orangefs_readdir_index_get(&bufmap, &buffer_index);
Mike Marshall5db11c22015-07-17 10:38:12 -0400194 if (ret < 0) {
Martin Brandenburg7d221482016-01-04 15:05:28 -0500195 gossip_lerr("orangefs_readdir: orangefs_readdir_index_get() failure (%d)\n",
Mike Marshall5db11c22015-07-17 10:38:12 -0400196 ret);
197 goto out_free_op;
198 }
199 new_op->upcall.req.readdir.buf_index = buffer_index;
200
201 ret = service_operation(new_op,
Yi Liu8bb8aef2015-11-24 15:12:14 -0500202 "orangefs_readdir",
Mike Marshall5db11c22015-07-17 10:38:12 -0400203 get_interruptible_flag(dentry->d_inode));
204
205 gossip_debug(GOSSIP_DIR_DEBUG,
206 "Readdir downcall status is %d. ret:%d\n",
207 new_op->downcall.status,
208 ret);
209
210 if (ret == -EAGAIN && op_state_purged(new_op)) {
211 /*
212 * readdir shared memory aread has been wiped due to
213 * pvfs2-client-core restarting, so we must get a new
214 * index into the shared memory.
215 */
216 gossip_debug(GOSSIP_DIR_DEBUG,
217 "%s: Getting new buffer_index for retry of readdir..\n",
218 __func__);
Martin Brandenburg7d221482016-01-04 15:05:28 -0500219 orangefs_readdir_index_put(bufmap, buffer_index);
Mike Marshall5db11c22015-07-17 10:38:12 -0400220 goto get_new_buffer_index;
221 }
222
223 if (ret == -EIO && op_state_purged(new_op)) {
224 gossip_err("%s: Client is down. Aborting readdir call.\n",
225 __func__);
Martin Brandenburg7d221482016-01-04 15:05:28 -0500226 orangefs_readdir_index_put(bufmap, buffer_index);
Mike Marshall5db11c22015-07-17 10:38:12 -0400227 goto out_free_op;
228 }
229
230 if (ret < 0 || new_op->downcall.status != 0) {
231 gossip_debug(GOSSIP_DIR_DEBUG,
232 "Readdir request failed. Status:%d\n",
233 new_op->downcall.status);
Martin Brandenburg7d221482016-01-04 15:05:28 -0500234 orangefs_readdir_index_put(bufmap, buffer_index);
Mike Marshall5db11c22015-07-17 10:38:12 -0400235 if (ret >= 0)
236 ret = new_op->downcall.status;
237 goto out_free_op;
238 }
239
240 bytes_decoded =
241 readdir_handle_ctor(&rhandle,
242 new_op->downcall.trailer_buf,
Al Viro80928952015-10-09 18:11:10 -0400243 new_op->downcall.trailer_size,
Mike Marshall5db11c22015-07-17 10:38:12 -0400244 buffer_index);
245 if (bytes_decoded < 0) {
Yi Liu8bb8aef2015-11-24 15:12:14 -0500246 gossip_err("orangefs_readdir: Could not decode trailer buffer into a readdir response %d\n",
Mike Marshall5db11c22015-07-17 10:38:12 -0400247 ret);
248 ret = bytes_decoded;
Martin Brandenburg7d221482016-01-04 15:05:28 -0500249 orangefs_readdir_index_put(bufmap, buffer_index);
Mike Marshall5db11c22015-07-17 10:38:12 -0400250 goto out_free_op;
251 }
252
253 if (bytes_decoded != new_op->downcall.trailer_size) {
Yi Liu8bb8aef2015-11-24 15:12:14 -0500254 gossip_err("orangefs_readdir: # bytes decoded (%ld) "
Mike Marshall88309aa2015-09-23 16:48:40 -0400255 "!= trailer size (%ld)\n",
256 bytes_decoded,
257 (long)new_op->downcall.trailer_size);
Mike Marshall5db11c22015-07-17 10:38:12 -0400258 ret = -EINVAL;
259 goto out_destroy_handle;
260 }
261
Mike Marshall88309aa2015-09-23 16:48:40 -0400262 /*
Yi Liu8bb8aef2015-11-24 15:12:14 -0500263 * orangefs doesn't actually store dot and dot-dot, but
Mike Marshall88309aa2015-09-23 16:48:40 -0400264 * we need to have them represented.
265 */
Mike Marshall5db11c22015-07-17 10:38:12 -0400266 if (pos == 0) {
267 ino = get_ino_from_khandle(dentry->d_inode);
268 gossip_debug(GOSSIP_DIR_DEBUG,
269 "%s: calling dir_emit of \".\" with pos = %llu\n",
270 __func__,
271 llu(pos));
272 ret = dir_emit(ctx, ".", 1, ino, DT_DIR);
Mike Marshall88309aa2015-09-23 16:48:40 -0400273 pos += 1;
Mike Marshall5db11c22015-07-17 10:38:12 -0400274 }
275
276 if (pos == 1) {
277 ino = get_parent_ino_from_dentry(dentry);
278 gossip_debug(GOSSIP_DIR_DEBUG,
279 "%s: calling dir_emit of \"..\" with pos = %llu\n",
280 __func__,
281 llu(pos));
282 ret = dir_emit(ctx, "..", 2, ino, DT_DIR);
Mike Marshall88309aa2015-09-23 16:48:40 -0400283 pos += 1;
Mike Marshall5db11c22015-07-17 10:38:12 -0400284 }
285
Mike Marshall88309aa2015-09-23 16:48:40 -0400286 /*
Yi Liu8bb8aef2015-11-24 15:12:14 -0500287 * we stored ORANGEFS_ITERATE_NEXT in ctx->pos last time around
Mike Marshall88309aa2015-09-23 16:48:40 -0400288 * to prevent "finding" dot and dot-dot on any iteration
289 * other than the first.
290 */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500291 if (ctx->pos == ORANGEFS_ITERATE_NEXT)
Mike Marshall88309aa2015-09-23 16:48:40 -0400292 ctx->pos = 0;
293
294 for (i = ctx->pos;
Yi Liu8bb8aef2015-11-24 15:12:14 -0500295 i < rhandle.readdir_response.orangefs_dirent_outcount;
Mike Marshall88309aa2015-09-23 16:48:40 -0400296 i++) {
Mike Marshall5db11c22015-07-17 10:38:12 -0400297 len = rhandle.readdir_response.dirent_array[i].d_length;
298 current_entry = rhandle.readdir_response.dirent_array[i].d_name;
Yi Liu8bb8aef2015-11-24 15:12:14 -0500299 current_ino = orangefs_khandle_to_ino(
Mike Marshall5db11c22015-07-17 10:38:12 -0400300 &(rhandle.readdir_response.dirent_array[i].khandle));
301
302 gossip_debug(GOSSIP_DIR_DEBUG,
Mike Marshall88309aa2015-09-23 16:48:40 -0400303 "calling dir_emit for %s with len %d"
304 ", ctx->pos %ld\n",
Mike Marshall5db11c22015-07-17 10:38:12 -0400305 current_entry,
306 len,
Mike Marshall88309aa2015-09-23 16:48:40 -0400307 (unsigned long)ctx->pos);
308 /*
309 * type is unknown. We don't return object type
310 * in the dirent_array. This leaves getdents
311 * clueless about type.
312 */
Mike Marshall5db11c22015-07-17 10:38:12 -0400313 ret =
314 dir_emit(ctx, current_entry, len, current_ino, DT_UNKNOWN);
Mike Marshall88309aa2015-09-23 16:48:40 -0400315 if (!ret)
316 break;
Mike Marshall5db11c22015-07-17 10:38:12 -0400317 ctx->pos++;
Mike Marshall88309aa2015-09-23 16:48:40 -0400318 gossip_debug(GOSSIP_DIR_DEBUG,
Mike Marshall5db11c22015-07-17 10:38:12 -0400319 "%s: ctx->pos:%lld\n",
320 __func__,
321 lld(ctx->pos));
322
Mike Marshall5db11c22015-07-17 10:38:12 -0400323 }
324
Mike Marshall54804942015-10-05 13:44:24 -0400325 /*
Mike Marshall88309aa2015-09-23 16:48:40 -0400326 * we ran all the way through the last batch, set up for
327 * getting another batch...
328 */
329 if (ret) {
Mike Marshall5db11c22015-07-17 10:38:12 -0400330 *ptoken = rhandle.readdir_response.token;
Yi Liu8bb8aef2015-11-24 15:12:14 -0500331 ctx->pos = ORANGEFS_ITERATE_NEXT;
Mike Marshall5db11c22015-07-17 10:38:12 -0400332 }
333
334 /*
335 * Did we hit the end of the directory?
336 */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500337 if (rhandle.readdir_response.token == ORANGEFS_READDIR_END &&
Mike Marshall5db11c22015-07-17 10:38:12 -0400338 !buffer_full) {
Mike Marshall88309aa2015-09-23 16:48:40 -0400339 gossip_debug(GOSSIP_DIR_DEBUG,
Yi Liu8bb8aef2015-11-24 15:12:14 -0500340 "End of dir detected; setting ctx->pos to ORANGEFS_READDIR_END.\n");
341 ctx->pos = ORANGEFS_READDIR_END;
Mike Marshall5db11c22015-07-17 10:38:12 -0400342 }
343
Mike Marshall5db11c22015-07-17 10:38:12 -0400344out_destroy_handle:
345 readdir_handle_dtor(bufmap, &rhandle);
346out_free_op:
347 op_release(new_op);
Yi Liu8bb8aef2015-11-24 15:12:14 -0500348 gossip_debug(GOSSIP_DIR_DEBUG, "orangefs_readdir returning %d\n", ret);
Mike Marshall5db11c22015-07-17 10:38:12 -0400349 return ret;
350}
351
Yi Liu8bb8aef2015-11-24 15:12:14 -0500352static int orangefs_dir_open(struct inode *inode, struct file *file)
Mike Marshall5db11c22015-07-17 10:38:12 -0400353{
354 __u64 *ptoken;
355
356 file->private_data = kmalloc(sizeof(__u64), GFP_KERNEL);
357 if (!file->private_data)
358 return -ENOMEM;
359
360 ptoken = file->private_data;
Yi Liu8bb8aef2015-11-24 15:12:14 -0500361 *ptoken = ORANGEFS_READDIR_START;
Mike Marshall5db11c22015-07-17 10:38:12 -0400362 return 0;
363}
364
Yi Liu8bb8aef2015-11-24 15:12:14 -0500365static int orangefs_dir_release(struct inode *inode, struct file *file)
Mike Marshall5db11c22015-07-17 10:38:12 -0400366{
Yi Liu8bb8aef2015-11-24 15:12:14 -0500367 orangefs_flush_inode(inode);
Mike Marshall5db11c22015-07-17 10:38:12 -0400368 kfree(file->private_data);
369 return 0;
370}
371
Yi Liu8bb8aef2015-11-24 15:12:14 -0500372/** ORANGEFS implementation of VFS directory operations */
373const struct file_operations orangefs_dir_operations = {
Mike Marshall5db11c22015-07-17 10:38:12 -0400374 .read = generic_read_dir,
Yi Liu8bb8aef2015-11-24 15:12:14 -0500375 .iterate = orangefs_readdir,
376 .open = orangefs_dir_open,
377 .release = orangefs_dir_release,
Mike Marshall5db11c22015-07-17 10:38:12 -0400378};