blob: 5a9c53eb115f7496daa5adf6ff769d2acb61a2a0 [file] [log] [blame]
Mike Marshall5db11c22015-07-17 10:38:12 -04001/*
2 * (C) 2001 Clemson University and The University of Chicago
3 *
4 * Changes by Acxiom Corporation to add protocol version to kernel
5 * communication, Copyright Acxiom Corporation, 2005.
6 *
7 * See COPYING in top-level directory.
8 */
9
10#include "protocol.h"
Mike Marshall575e9462015-12-04 12:56:14 -050011#include "orangefs-kernel.h"
12#include "orangefs-dev-proto.h"
13#include "orangefs-bufmap.h"
Mike Marshall5db11c22015-07-17 10:38:12 -040014
15#include <linux/debugfs.h>
16#include <linux/slab.h>
17
18/* this file implements the /dev/pvfs2-req device node */
19
/*
 * Count of opens currently held on the request device.
 * orangefs_devreq_open() only admits an opener while this is zero and
 * orangefs_devreq_release() decrements it again.
 */
static int open_access_count;

/*
 * Emit a multi-line error banner explaining that the request device was
 * opened a second time, together with the current open_access_count.
 */
#define DUMP_DEVICE_ERROR()						\
do {									\
	gossip_err("*****************************************************\n");\
	gossip_err("ORANGEFS Device Error: You cannot open the device file "); \
	gossip_err("\n/dev/%s more than once. Please make sure that\n"	\
		   "there are no ",					\
		   ORANGEFS_REQDEVICE_NAME);				\
	gossip_err("instances of a program using this device\n"	\
		   "currently running. (You must verify this!)\n");	\
	gossip_err("For example, you can use the lsof program as follows:\n");\
	gossip_err("'lsof | grep %s' (run this as root)\n",		\
		   ORANGEFS_REQDEVICE_NAME);				\
	gossip_err(" open_access_count = %d\n", open_access_count);	\
	gossip_err("*****************************************************\n");\
} while (0)
36
37static int hash_func(__u64 tag, int table_size)
38{
Mike Marshall2c590d52015-07-24 10:37:15 -040039 return do_div(tag, (unsigned int)table_size);
Mike Marshall5db11c22015-07-17 10:38:12 -040040}
41
Yi Liu8bb8aef2015-11-24 15:12:14 -050042static void orangefs_devreq_add_op(struct orangefs_kernel_op_s *op)
Mike Marshall5db11c22015-07-17 10:38:12 -040043{
44 int index = hash_func(op->tag, hash_table_size);
45
46 spin_lock(&htable_ops_in_progress_lock);
47 list_add_tail(&op->list, &htable_ops_in_progress[index]);
48 spin_unlock(&htable_ops_in_progress_lock);
49}
50
Yi Liu8bb8aef2015-11-24 15:12:14 -050051static struct orangefs_kernel_op_s *orangefs_devreq_remove_op(__u64 tag)
Mike Marshall5db11c22015-07-17 10:38:12 -040052{
Yi Liu8bb8aef2015-11-24 15:12:14 -050053 struct orangefs_kernel_op_s *op, *next;
Mike Marshall5db11c22015-07-17 10:38:12 -040054 int index;
55
56 index = hash_func(tag, hash_table_size);
57
58 spin_lock(&htable_ops_in_progress_lock);
59 list_for_each_entry_safe(op,
60 next,
61 &htable_ops_in_progress[index],
62 list) {
63 if (op->tag == tag) {
64 list_del(&op->list);
65 spin_unlock(&htable_ops_in_progress_lock);
66 return op;
67 }
68 }
69
70 spin_unlock(&htable_ops_in_progress_lock);
71 return NULL;
72}
73
Yi Liu8bb8aef2015-11-24 15:12:14 -050074static int orangefs_devreq_open(struct inode *inode, struct file *file)
Mike Marshall5db11c22015-07-17 10:38:12 -040075{
76 int ret = -EINVAL;
77
78 if (!(file->f_flags & O_NONBLOCK)) {
Mike Marshall97f10022015-12-11 16:45:03 -050079 gossip_err("%s: device cannot be opened in blocking mode\n",
80 __func__);
Mike Marshall5db11c22015-07-17 10:38:12 -040081 goto out;
82 }
83 ret = -EACCES;
Mike Marshall97f10022015-12-11 16:45:03 -050084 gossip_debug(GOSSIP_DEV_DEBUG, "client-core: opening device\n");
Mike Marshall5db11c22015-07-17 10:38:12 -040085 mutex_lock(&devreq_mutex);
86
87 if (open_access_count == 0) {
88 ret = generic_file_open(inode, file);
89 if (ret == 0)
90 open_access_count++;
91 } else {
92 DUMP_DEVICE_ERROR();
93 }
94 mutex_unlock(&devreq_mutex);
95
96out:
97
98 gossip_debug(GOSSIP_DEV_DEBUG,
99 "pvfs2-client-core: open device complete (ret = %d)\n",
100 ret);
101 return ret;
102}
103
Mike Marshall97f10022015-12-11 16:45:03 -0500104/* Function for read() callers into the device */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500105static ssize_t orangefs_devreq_read(struct file *file,
Mike Marshall5db11c22015-07-17 10:38:12 -0400106 char __user *buf,
107 size_t count, loff_t *offset)
108{
Yi Liu8bb8aef2015-11-24 15:12:14 -0500109 struct orangefs_kernel_op_s *op, *temp;
110 __s32 proto_ver = ORANGEFS_KERNEL_PROTO_VERSION;
111 static __s32 magic = ORANGEFS_DEVREQ_MAGIC;
112 struct orangefs_kernel_op_s *cur_op = NULL;
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500113 unsigned long ret;
Mike Marshall5db11c22015-07-17 10:38:12 -0400114
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500115 /* We do not support blocking IO. */
Mike Marshall5db11c22015-07-17 10:38:12 -0400116 if (!(file->f_flags & O_NONBLOCK)) {
Mike Marshall97f10022015-12-11 16:45:03 -0500117 gossip_err("%s: blocking read from client-core.\n",
118 __func__);
Mike Marshall5db11c22015-07-17 10:38:12 -0400119 return -EINVAL;
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500120 }
121
122 /*
Martin Brandenburga762ae62015-12-15 14:22:06 -0500123 * The client will do an ioctl to find MAX_DEV_REQ_UPSIZE, then
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500124 * always read with that size buffer.
125 */
Martin Brandenburga762ae62015-12-15 14:22:06 -0500126 if (count != MAX_DEV_REQ_UPSIZE) {
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500127 gossip_err("orangefs: client-core tried to read wrong size\n");
128 return -EINVAL;
129 }
130
131 /* Get next op (if any) from top of list. */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500132 spin_lock(&orangefs_request_list_lock);
133 list_for_each_entry_safe(op, temp, &orangefs_request_list, list) {
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500134 __s32 fsid;
135 /* This lock is held past the end of the loop when we break. */
136 spin_lock(&op->lock);
137
138 fsid = fsid_of_op(op);
Yi Liu8bb8aef2015-11-24 15:12:14 -0500139 if (fsid != ORANGEFS_FS_ID_NULL) {
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500140 int ret;
141 /* Skip ops whose filesystem needs to be mounted. */
142 ret = fs_mount_pending(fsid);
143 if (ret == 1) {
Mike Marshall5db11c22015-07-17 10:38:12 -0400144 gossip_debug(GOSSIP_DEV_DEBUG,
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500145 "orangefs: skipping op tag %llu %s\n",
146 llu(op->tag), get_opname_string(op));
147 spin_unlock(&op->lock);
Mike Marshall5db11c22015-07-17 10:38:12 -0400148 continue;
Mike Marshall97f10022015-12-11 16:45:03 -0500149 /*
150 * Skip ops whose filesystem we don't know about unless
151 * it is being mounted.
152 */
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500153 /* XXX: is there a better way to detect this? */
154 } else if (ret == -1 &&
Mike Marshall97f10022015-12-11 16:45:03 -0500155 !(op->upcall.type ==
156 ORANGEFS_VFS_OP_FS_MOUNT ||
157 op->upcall.type ==
158 ORANGEFS_VFS_OP_GETATTR)) {
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500159 gossip_debug(GOSSIP_DEV_DEBUG,
160 "orangefs: skipping op tag %llu %s\n",
161 llu(op->tag), get_opname_string(op));
162 gossip_err(
163 "orangefs: ERROR: fs_mount_pending %d\n",
164 fsid);
165 spin_unlock(&op->lock);
166 continue;
Mike Marshall5db11c22015-07-17 10:38:12 -0400167 }
168 }
Mike Marshall5db11c22015-07-17 10:38:12 -0400169 /*
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500170 * Either this op does not pertain to a filesystem, is mounting
171 * a filesystem, or pertains to a mounted filesystem. Let it
172 * through.
Mike Marshall5db11c22015-07-17 10:38:12 -0400173 */
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500174 cur_op = op;
175 break;
Mike Marshall5db11c22015-07-17 10:38:12 -0400176 }
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500177
178 /*
179 * At this point we either have a valid op and can continue or have not
180 * found an op and must ask the client to try again later.
181 */
182 if (!cur_op) {
Yi Liu8bb8aef2015-11-24 15:12:14 -0500183 spin_unlock(&orangefs_request_list_lock);
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500184 return -EAGAIN;
185 }
186
187 gossip_debug(GOSSIP_DEV_DEBUG, "orangefs: reading op tag %llu %s\n",
188 llu(cur_op->tag), get_opname_string(cur_op));
189
190 /*
191 * Such an op should never be on the list in the first place. If so, we
192 * will abort.
193 */
194 if (op_state_in_progress(cur_op) || op_state_serviced(cur_op)) {
195 gossip_err("orangefs: ERROR: Current op already queued.\n");
196 list_del(&cur_op->list);
197 spin_unlock(&cur_op->lock);
Yi Liu8bb8aef2015-11-24 15:12:14 -0500198 spin_unlock(&orangefs_request_list_lock);
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500199 return -EAGAIN;
200 }
201
202 /*
203 * Set the operation to be in progress and move it between lists since
204 * it has been sent to the client.
205 */
206 set_op_state_inprogress(cur_op);
207
208 list_del(&cur_op->list);
Yi Liu8bb8aef2015-11-24 15:12:14 -0500209 spin_unlock(&orangefs_request_list_lock);
210 orangefs_devreq_add_op(cur_op);
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500211 spin_unlock(&cur_op->lock);
212
213 /* Push the upcall out. */
214 ret = copy_to_user(buf, &proto_ver, sizeof(__s32));
215 if (ret != 0)
216 goto error;
217 ret = copy_to_user(buf+sizeof(__s32), &magic, sizeof(__s32));
218 if (ret != 0)
219 goto error;
220 ret = copy_to_user(buf+2 * sizeof(__s32), &cur_op->tag, sizeof(__u64));
221 if (ret != 0)
222 goto error;
223 ret = copy_to_user(buf+2*sizeof(__s32)+sizeof(__u64), &cur_op->upcall,
Yi Liu8bb8aef2015-11-24 15:12:14 -0500224 sizeof(struct orangefs_upcall_s));
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500225 if (ret != 0)
226 goto error;
227
228 /* The client only asks to read one size buffer. */
Martin Brandenburga762ae62015-12-15 14:22:06 -0500229 return MAX_DEV_REQ_UPSIZE;
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500230error:
231 /*
232 * We were unable to copy the op data to the client. Put the op back in
233 * list. If client has crashed, the op will be purged later when the
234 * device is released.
235 */
236 gossip_err("orangefs: Failed to copy data to user space\n");
Yi Liu8bb8aef2015-11-24 15:12:14 -0500237 spin_lock(&orangefs_request_list_lock);
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500238 spin_lock(&cur_op->lock);
239 set_op_state_waiting(cur_op);
Yi Liu8bb8aef2015-11-24 15:12:14 -0500240 orangefs_devreq_remove_op(cur_op->tag);
241 list_add(&cur_op->list, &orangefs_request_list);
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500242 spin_unlock(&cur_op->lock);
Yi Liu8bb8aef2015-11-24 15:12:14 -0500243 spin_unlock(&orangefs_request_list_lock);
Martin Brandenburg24c8d082015-11-13 14:26:10 -0500244 return -EFAULT;
Mike Marshall5db11c22015-07-17 10:38:12 -0400245}
246
Mike Marshall97f10022015-12-11 16:45:03 -0500247/*
248 * Function for writev() callers into the device. Readdir related
249 * operations have an extra iovec containing info about objects
250 * contained in directories.
251 */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500252static ssize_t orangefs_devreq_writev(struct file *file,
Mike Marshall5db11c22015-07-17 10:38:12 -0400253 const struct iovec *iov,
254 size_t count,
255 loff_t *offset)
256{
Yi Liu8bb8aef2015-11-24 15:12:14 -0500257 struct orangefs_kernel_op_s *op = NULL;
Mike Marshall5db11c22015-07-17 10:38:12 -0400258 void *buffer = NULL;
259 void *ptr = NULL;
260 unsigned long i = 0;
Martin Brandenburga762ae62015-12-15 14:22:06 -0500261 int num_remaining = MAX_DEV_REQ_DOWNSIZE;
Mike Marshall97f10022015-12-11 16:45:03 -0500262 int ret = 0;
263 /* num elements in iovec without trailer */
264 int notrailer_count = 4;
265 /*
266 * If there's a trailer, its iov index will be equal to
267 * notrailer_count.
268 */
269 int trailer_index = notrailer_count;
Mike Marshall5db11c22015-07-17 10:38:12 -0400270 int payload_size = 0;
Mike Marshall97f10022015-12-11 16:45:03 -0500271 int returned_downcall_size = 0;
Mike Marshall5db11c22015-07-17 10:38:12 -0400272 __s32 magic = 0;
273 __s32 proto_ver = 0;
274 __u64 tag = 0;
275 ssize_t total_returned_size = 0;
276
Mike Marshall97f10022015-12-11 16:45:03 -0500277 /*
278 * There will always be at least notrailer_count iovecs, and
279 * when there's a trailer, one more than notrailer_count. Check
280 * count's sanity.
281 */
Mike Marshall5db11c22015-07-17 10:38:12 -0400282 if (count != notrailer_count && count != (notrailer_count + 1)) {
Mike Marshall97f10022015-12-11 16:45:03 -0500283 gossip_err("%s: count:%zu: notrailer_count :%d:\n",
284 __func__,
Mike Marshall5db11c22015-07-17 10:38:12 -0400285 count,
286 notrailer_count);
287 return -EPROTO;
288 }
Mike Marshall5db11c22015-07-17 10:38:12 -0400289
Mike Marshall97f10022015-12-11 16:45:03 -0500290
291 /* Copy the non-trailer iovec data into a device request buffer. */
292 buffer = dev_req_alloc();
293 if (!buffer) {
294 gossip_err("%s: dev_req_alloc failed.\n", __func__);
295 return -ENOMEM;
296 }
297 ptr = buffer;
Mike Marshall5db11c22015-07-17 10:38:12 -0400298 for (i = 0; i < notrailer_count; i++) {
299 if (iov[i].iov_len > num_remaining) {
300 gossip_err
301 ("writev error: Freeing buffer and returning\n");
302 dev_req_release(buffer);
303 return -EMSGSIZE;
304 }
305 ret = copy_from_user(ptr, iov[i].iov_base, iov[i].iov_len);
306 if (ret) {
307 gossip_err("Failed to copy data from user space\n");
308 dev_req_release(buffer);
309 return -EIO;
310 }
311 num_remaining -= iov[i].iov_len;
312 ptr += iov[i].iov_len;
313 payload_size += iov[i].iov_len;
314 }
315 total_returned_size = payload_size;
316
317 /* these elements are currently 8 byte aligned (8 bytes for (version +
318 * magic) 8 bytes for tag). If you add another element, either
319 * make it 8 bytes big, or use get_unaligned when asigning.
320 */
321 ptr = buffer;
Mike Marshall97f10022015-12-11 16:45:03 -0500322 proto_ver = *((__s32 *) ptr); /* unused */
Mike Marshall5db11c22015-07-17 10:38:12 -0400323 ptr += sizeof(__s32);
324
325 magic = *((__s32 *) ptr);
326 ptr += sizeof(__s32);
327
328 tag = *((__u64 *) ptr);
329 ptr += sizeof(__u64);
330
Yi Liu8bb8aef2015-11-24 15:12:14 -0500331 if (magic != ORANGEFS_DEVREQ_MAGIC) {
Mike Marshall5db11c22015-07-17 10:38:12 -0400332 gossip_err("Error: Device magic number does not match.\n");
333 dev_req_release(buffer);
334 return -EPROTO;
335 }
336
Yi Liu8bb8aef2015-11-24 15:12:14 -0500337 op = orangefs_devreq_remove_op(tag);
Mike Marshall5db11c22015-07-17 10:38:12 -0400338 if (op) {
339 /* Increase ref count! */
340 get_op(op);
Mike Marshall97f10022015-12-11 16:45:03 -0500341
342 /* calculate the size of the returned downcall. */
343 returned_downcall_size =
344 payload_size - (2 * sizeof(__s32) + sizeof(__u64));
345
346 /* copy the passed in downcall into the op */
347 if (returned_downcall_size ==
348 sizeof(struct orangefs_downcall_s)) {
Mike Marshall5db11c22015-07-17 10:38:12 -0400349 memcpy(&op->downcall,
350 ptr,
Yi Liu8bb8aef2015-11-24 15:12:14 -0500351 sizeof(struct orangefs_downcall_s));
Mike Marshall97f10022015-12-11 16:45:03 -0500352 } else {
353 gossip_err("%s: returned downcall size:%d: \n",
354 __func__,
355 returned_downcall_size);
356 dev_req_release(buffer);
357 put_op(op);
358 return -EMSGSIZE;
Mike Marshall5db11c22015-07-17 10:38:12 -0400359 }
360
Mike Marshall97f10022015-12-11 16:45:03 -0500361 /* Don't tolerate an unexpected trailer iovec. */
362 if ((op->downcall.trailer_size == 0) &&
363 (count != notrailer_count)) {
364 gossip_err("%s: unexpected trailer iovec.\n",
365 __func__);
366 dev_req_release(buffer);
367 put_op(op);
368 return -EPROTO;
369 }
370
371 /* Don't consider the trailer if there's a bad status. */
372 if (op->downcall.status != 0)
373 goto no_trailer;
374
375 /* get the trailer if there is one. */
376 if (op->downcall.trailer_size == 0)
377 goto no_trailer;
378
379 gossip_debug(GOSSIP_DEV_DEBUG,
380 "%s: op->downcall.trailer_size %lld\n",
381 __func__,
382 op->downcall.trailer_size);
383
384 /*
385 * Bail if we think think there should be a trailer, but
386 * there's no iovec for it.
387 */
388 if (count != (notrailer_count + 1)) {
389 gossip_err("%s: trailer_size:%lld: count:%zu:\n",
390 __func__,
391 op->downcall.trailer_size,
392 count);
393 dev_req_release(buffer);
394 put_op(op);
395 return -EPROTO;
396 }
397
398 /* Verify that trailer_size is accurate. */
399 if (op->downcall.trailer_size != iov[trailer_index].iov_len) {
400 gossip_err("%s: trailer_size:%lld: != iov_len:%zd:\n",
401 __func__,
402 op->downcall.trailer_size,
403 iov[trailer_index].iov_len);
404 dev_req_release(buffer);
405 put_op(op);
406 return -EMSGSIZE;
407 }
408
409 total_returned_size += iov[trailer_index].iov_len;
410
411 /*
412 * Allocate a buffer, copy the trailer bytes into it and
413 * attach it to the downcall.
414 */
415 op->downcall.trailer_buf = vmalloc(iov[trailer_index].iov_len);
416 if (op->downcall.trailer_buf != NULL) {
417 gossip_debug(GOSSIP_DEV_DEBUG, "vmalloc: %p\n",
418 op->downcall.trailer_buf);
419 ret = copy_from_user(op->downcall.trailer_buf,
420 iov[trailer_index].iov_base,
421 iov[trailer_index].iov_len);
422 if (ret) {
423 gossip_err("%s: Failed to copy trailer.\n",
424 __func__);
425 dev_req_release(buffer);
426 gossip_debug(GOSSIP_DEV_DEBUG,
427 "vfree: %p\n",
428 op->downcall.trailer_buf);
429 vfree(op->downcall.trailer_buf);
430 op->downcall.trailer_buf = NULL;
431 put_op(op);
432 return -EIO;
433 }
434 } else {
Mike Marshall97f10022015-12-11 16:45:03 -0500435 gossip_err("writev: could not vmalloc for trailer!\n");
436 dev_req_release(buffer);
437 put_op(op);
438 return -ENOMEM;
439 }
440
441no_trailer:
442
443 /* if this operation is an I/O operation we need to wait
Mike Marshall5db11c22015-07-17 10:38:12 -0400444 * for all data to be copied before we can return to avoid
445 * buffer corruption and races that can pull the buffers
446 * out from under us.
447 *
448 * Essentially we're synchronizing with other parts of the
449 * vfs implicitly by not allowing the user space
450 * application reading/writing this device to return until
451 * the buffers are done being used.
452 */
Mike Marshall97f10022015-12-11 16:45:03 -0500453 if (op->upcall.type == ORANGEFS_VFS_OP_FILE_IO) {
Mike Marshall5db11c22015-07-17 10:38:12 -0400454 int timed_out = 0;
Mike Marshallce6c4142015-12-14 14:54:46 -0500455 DEFINE_WAIT(wait_entry);
Mike Marshall5db11c22015-07-17 10:38:12 -0400456
Mike Marshall97f10022015-12-11 16:45:03 -0500457 /*
458 * tell the vfs op waiting on a waitqueue
Mike Marshall5db11c22015-07-17 10:38:12 -0400459 * that this op is done
460 */
461 spin_lock(&op->lock);
462 set_op_state_serviced(op);
463 spin_unlock(&op->lock);
464
Mike Marshall5db11c22015-07-17 10:38:12 -0400465 wake_up_interruptible(&op->waitq);
466
467 while (1) {
Mike Marshall5db11c22015-07-17 10:38:12 -0400468 spin_lock(&op->lock);
Mike Marshallce6c4142015-12-14 14:54:46 -0500469 prepare_to_wait_exclusive(
470 &op->io_completion_waitq,
471 &wait_entry,
472 TASK_INTERRUPTIBLE);
Mike Marshall5db11c22015-07-17 10:38:12 -0400473 if (op->io_completed) {
474 spin_unlock(&op->lock);
475 break;
476 }
477 spin_unlock(&op->lock);
478
479 if (!signal_pending(current)) {
480 int timeout =
481 MSECS_TO_JIFFIES(1000 *
482 op_timeout_secs);
483 if (!schedule_timeout(timeout)) {
Mike Marshall97f10022015-12-11 16:45:03 -0500484 gossip_debug(GOSSIP_DEV_DEBUG,
485 "%s: timed out.\n",
486 __func__);
Mike Marshall5db11c22015-07-17 10:38:12 -0400487 timed_out = 1;
488 break;
489 }
490 continue;
491 }
492
Mike Marshall97f10022015-12-11 16:45:03 -0500493 gossip_debug(GOSSIP_DEV_DEBUG,
494 "%s: signal on I/O wait, aborting\n",
495 __func__);
Mike Marshall5db11c22015-07-17 10:38:12 -0400496 break;
497 }
498
Mike Marshallce6c4142015-12-14 14:54:46 -0500499 spin_lock(&op->lock);
500 finish_wait(&op->io_completion_waitq, &wait_entry);
501 spin_unlock(&op->lock);
Mike Marshall5db11c22015-07-17 10:38:12 -0400502
503 /* NOTE: for I/O operations we handle releasing the op
504 * object except in the case of timeout. the reason we
505 * can't free the op in timeout cases is that the op
506 * service logic in the vfs retries operations using
507 * the same op ptr, thus it can't be freed.
508 */
509 if (!timed_out)
510 op_release(op);
511 } else {
512
513 /*
514 * tell the vfs op waiting on a waitqueue that
515 * this op is done
516 */
517 spin_lock(&op->lock);
518 set_op_state_serviced(op);
519 spin_unlock(&op->lock);
520 /*
Mike Marshall54804942015-10-05 13:44:24 -0400521 * for every other operation (i.e. non-I/O), we need to
522 * wake up the callers for downcall completion
523 * notification
Mike Marshall5db11c22015-07-17 10:38:12 -0400524 */
525 wake_up_interruptible(&op->waitq);
526 }
527 } else {
528 /* ignore downcalls that we're not interested in */
529 gossip_debug(GOSSIP_DEV_DEBUG,
530 "WARNING: No one's waiting for tag %llu\n",
531 llu(tag));
532 }
Mike Marshall97f10022015-12-11 16:45:03 -0500533 /* put_op? */
Mike Marshall5db11c22015-07-17 10:38:12 -0400534 dev_req_release(buffer);
535
536 return total_returned_size;
537}
538
Yi Liu8bb8aef2015-11-24 15:12:14 -0500539static ssize_t orangefs_devreq_write_iter(struct kiocb *iocb,
Mike Marshall5db11c22015-07-17 10:38:12 -0400540 struct iov_iter *iter)
541{
Yi Liu8bb8aef2015-11-24 15:12:14 -0500542 return orangefs_devreq_writev(iocb->ki_filp,
Mike Marshall5db11c22015-07-17 10:38:12 -0400543 iter->iov,
544 iter->nr_segs,
545 &iocb->ki_pos);
546}
547
548/* Returns whether any FS are still pending remounted */
549static int mark_all_pending_mounts(void)
550{
551 int unmounted = 1;
Yi Liu8bb8aef2015-11-24 15:12:14 -0500552 struct orangefs_sb_info_s *orangefs_sb = NULL;
Mike Marshall5db11c22015-07-17 10:38:12 -0400553
Yi Liu8bb8aef2015-11-24 15:12:14 -0500554 spin_lock(&orangefs_superblocks_lock);
555 list_for_each_entry(orangefs_sb, &orangefs_superblocks, list) {
Mike Marshall5db11c22015-07-17 10:38:12 -0400556 /* All of these file system require a remount */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500557 orangefs_sb->mount_pending = 1;
Mike Marshall5db11c22015-07-17 10:38:12 -0400558 unmounted = 0;
559 }
Yi Liu8bb8aef2015-11-24 15:12:14 -0500560 spin_unlock(&orangefs_superblocks_lock);
Mike Marshall5db11c22015-07-17 10:38:12 -0400561 return unmounted;
562}
563
564/*
565 * Determine if a given file system needs to be remounted or not
566 * Returns -1 on error
567 * 0 if already mounted
568 * 1 if needs remount
569 */
570int fs_mount_pending(__s32 fsid)
571{
572 int mount_pending = -1;
Yi Liu8bb8aef2015-11-24 15:12:14 -0500573 struct orangefs_sb_info_s *orangefs_sb = NULL;
Mike Marshall5db11c22015-07-17 10:38:12 -0400574
Yi Liu8bb8aef2015-11-24 15:12:14 -0500575 spin_lock(&orangefs_superblocks_lock);
576 list_for_each_entry(orangefs_sb, &orangefs_superblocks, list) {
577 if (orangefs_sb->fs_id == fsid) {
578 mount_pending = orangefs_sb->mount_pending;
Mike Marshall5db11c22015-07-17 10:38:12 -0400579 break;
580 }
581 }
Yi Liu8bb8aef2015-11-24 15:12:14 -0500582 spin_unlock(&orangefs_superblocks_lock);
Mike Marshall5db11c22015-07-17 10:38:12 -0400583 return mount_pending;
584}
585
586/*
587 * NOTE: gets called when the last reference to this device is dropped.
588 * Using the open_access_count variable, we enforce a reference count
589 * on this file so that it can be opened by only one process at a time.
590 * the devreq_mutex is used to make sure all i/o has completed
Yi Liu8bb8aef2015-11-24 15:12:14 -0500591 * before we call orangefs_bufmap_finalize, and similar such tricky
Mike Marshall5db11c22015-07-17 10:38:12 -0400592 * situations
593 */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500594static int orangefs_devreq_release(struct inode *inode, struct file *file)
Mike Marshall5db11c22015-07-17 10:38:12 -0400595{
596 int unmounted = 0;
597
598 gossip_debug(GOSSIP_DEV_DEBUG,
599 "%s:pvfs2-client-core: exiting, closing device\n",
600 __func__);
601
602 mutex_lock(&devreq_mutex);
Martin Brandenburg90d26aa2015-12-14 15:26:38 -0500603 if (get_bufmap_init())
604 orangefs_bufmap_finalize();
Mike Marshall5db11c22015-07-17 10:38:12 -0400605
606 open_access_count--;
607
608 unmounted = mark_all_pending_mounts();
Yi Liu8bb8aef2015-11-24 15:12:14 -0500609 gossip_debug(GOSSIP_DEV_DEBUG, "ORANGEFS Device Close: Filesystem(s) %s\n",
Mike Marshall5db11c22015-07-17 10:38:12 -0400610 (unmounted ? "UNMOUNTED" : "MOUNTED"));
611 mutex_unlock(&devreq_mutex);
612
613 /*
614 * Walk through the list of ops in the request list, mark them
615 * as purged and wake them up.
616 */
617 purge_waiting_ops();
618 /*
619 * Walk through the hash table of in progress operations; mark
620 * them as purged and wake them up
621 */
622 purge_inprogress_ops();
623 gossip_debug(GOSSIP_DEV_DEBUG,
624 "pvfs2-client-core: device close complete\n");
625 return 0;
626}
627
628int is_daemon_in_service(void)
629{
630 int in_service;
631
632 /*
633 * What this function does is checks if client-core is alive
634 * based on the access count we maintain on the device.
635 */
636 mutex_lock(&devreq_mutex);
637 in_service = open_access_count == 1 ? 0 : -EIO;
638 mutex_unlock(&devreq_mutex);
639 return in_service;
640}
641
642static inline long check_ioctl_command(unsigned int command)
643{
644 /* Check for valid ioctl codes */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500645 if (_IOC_TYPE(command) != ORANGEFS_DEV_MAGIC) {
Mike Marshall5db11c22015-07-17 10:38:12 -0400646 gossip_err("device ioctl magic numbers don't match! Did you rebuild pvfs2-client-core/libpvfs2? [cmd %x, magic %x != %x]\n",
647 command,
648 _IOC_TYPE(command),
Yi Liu8bb8aef2015-11-24 15:12:14 -0500649 ORANGEFS_DEV_MAGIC);
Mike Marshall5db11c22015-07-17 10:38:12 -0400650 return -EINVAL;
651 }
652 /* and valid ioctl commands */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500653 if (_IOC_NR(command) >= ORANGEFS_DEV_MAXNR || _IOC_NR(command) <= 0) {
Mike Marshall5db11c22015-07-17 10:38:12 -0400654 gossip_err("Invalid ioctl command number [%d >= %d]\n",
Yi Liu8bb8aef2015-11-24 15:12:14 -0500655 _IOC_NR(command), ORANGEFS_DEV_MAXNR);
Mike Marshall5db11c22015-07-17 10:38:12 -0400656 return -ENOIOCTLCMD;
657 }
658 return 0;
659}
660
661static long dispatch_ioctl_command(unsigned int command, unsigned long arg)
662{
Yi Liu8bb8aef2015-11-24 15:12:14 -0500663 static __s32 magic = ORANGEFS_DEVREQ_MAGIC;
Martin Brandenburga762ae62015-12-15 14:22:06 -0500664 static __s32 max_up_size = MAX_DEV_REQ_UPSIZE;
665 static __s32 max_down_size = MAX_DEV_REQ_DOWNSIZE;
Yi Liu8bb8aef2015-11-24 15:12:14 -0500666 struct ORANGEFS_dev_map_desc user_desc;
Mike Marshall5db11c22015-07-17 10:38:12 -0400667 int ret = 0;
668 struct dev_mask_info_s mask_info = { 0 };
669 struct dev_mask2_info_s mask2_info = { 0, 0 };
670 int upstream_kmod = 1;
671 struct list_head *tmp = NULL;
Yi Liu8bb8aef2015-11-24 15:12:14 -0500672 struct orangefs_sb_info_s *orangefs_sb = NULL;
Mike Marshall5db11c22015-07-17 10:38:12 -0400673
674 /* mtmoore: add locking here */
675
676 switch (command) {
Yi Liu8bb8aef2015-11-24 15:12:14 -0500677 case ORANGEFS_DEV_GET_MAGIC:
Mike Marshall5db11c22015-07-17 10:38:12 -0400678 return ((put_user(magic, (__s32 __user *) arg) == -EFAULT) ?
679 -EIO :
680 0);
Yi Liu8bb8aef2015-11-24 15:12:14 -0500681 case ORANGEFS_DEV_GET_MAX_UPSIZE:
Mike Marshall5db11c22015-07-17 10:38:12 -0400682 return ((put_user(max_up_size,
683 (__s32 __user *) arg) == -EFAULT) ?
684 -EIO :
685 0);
Yi Liu8bb8aef2015-11-24 15:12:14 -0500686 case ORANGEFS_DEV_GET_MAX_DOWNSIZE:
Mike Marshall5db11c22015-07-17 10:38:12 -0400687 return ((put_user(max_down_size,
688 (__s32 __user *) arg) == -EFAULT) ?
689 -EIO :
690 0);
Yi Liu8bb8aef2015-11-24 15:12:14 -0500691 case ORANGEFS_DEV_MAP:
Mike Marshall5db11c22015-07-17 10:38:12 -0400692 ret = copy_from_user(&user_desc,
Yi Liu8bb8aef2015-11-24 15:12:14 -0500693 (struct ORANGEFS_dev_map_desc __user *)
Mike Marshall5db11c22015-07-17 10:38:12 -0400694 arg,
Yi Liu8bb8aef2015-11-24 15:12:14 -0500695 sizeof(struct ORANGEFS_dev_map_desc));
Martin Brandenburg90d26aa2015-12-14 15:26:38 -0500696 if (get_bufmap_init()) {
697 return -EINVAL;
698 } else {
699 return ret ?
700 -EIO :
701 orangefs_bufmap_initialize(&user_desc);
702 }
Yi Liu8bb8aef2015-11-24 15:12:14 -0500703 case ORANGEFS_DEV_REMOUNT_ALL:
Mike Marshall5db11c22015-07-17 10:38:12 -0400704 gossip_debug(GOSSIP_DEV_DEBUG,
Mike Marshall97f10022015-12-11 16:45:03 -0500705 "%s: got ORANGEFS_DEV_REMOUNT_ALL\n",
706 __func__);
Mike Marshall5db11c22015-07-17 10:38:12 -0400707
708 /*
Yi Liu8bb8aef2015-11-24 15:12:14 -0500709 * remount all mounted orangefs volumes to regain the lost
Mike Marshall5db11c22015-07-17 10:38:12 -0400710 * dynamic mount tables (if any) -- NOTE: this is done
711 * without keeping the superblock list locked due to the
712 * upcall/downcall waiting. also, the request semaphore is
713 * used to ensure that no operations will be serviced until
714 * all of the remounts are serviced (to avoid ops between
715 * mounts to fail)
716 */
717 ret = mutex_lock_interruptible(&request_mutex);
718 if (ret < 0)
719 return ret;
720 gossip_debug(GOSSIP_DEV_DEBUG,
Mike Marshall97f10022015-12-11 16:45:03 -0500721 "%s: priority remount in progress\n",
722 __func__);
Yi Liu8bb8aef2015-11-24 15:12:14 -0500723 list_for_each(tmp, &orangefs_superblocks) {
724 orangefs_sb =
Mike Marshall97f10022015-12-11 16:45:03 -0500725 list_entry(tmp,
726 struct orangefs_sb_info_s,
727 list);
Yi Liu8bb8aef2015-11-24 15:12:14 -0500728 if (orangefs_sb && (orangefs_sb->sb)) {
Mike Marshall5db11c22015-07-17 10:38:12 -0400729 gossip_debug(GOSSIP_DEV_DEBUG,
Mike Marshall97f10022015-12-11 16:45:03 -0500730 "%s: Remounting SB %p\n",
731 __func__,
Yi Liu8bb8aef2015-11-24 15:12:14 -0500732 orangefs_sb);
Mike Marshall5db11c22015-07-17 10:38:12 -0400733
Yi Liu8bb8aef2015-11-24 15:12:14 -0500734 ret = orangefs_remount(orangefs_sb->sb);
Mike Marshall5db11c22015-07-17 10:38:12 -0400735 if (ret) {
736 gossip_debug(GOSSIP_DEV_DEBUG,
737 "SB %p remount failed\n",
Yi Liu8bb8aef2015-11-24 15:12:14 -0500738 orangefs_sb);
Mike Marshall97f10022015-12-11 16:45:03 -0500739 break;
Mike Marshall5db11c22015-07-17 10:38:12 -0400740 }
741 }
742 }
743 gossip_debug(GOSSIP_DEV_DEBUG,
Mike Marshall97f10022015-12-11 16:45:03 -0500744 "%s: priority remount complete\n",
745 __func__);
Mike Marshall5db11c22015-07-17 10:38:12 -0400746 mutex_unlock(&request_mutex);
747 return ret;
748
Yi Liu8bb8aef2015-11-24 15:12:14 -0500749 case ORANGEFS_DEV_UPSTREAM:
Mike Marshall5db11c22015-07-17 10:38:12 -0400750 ret = copy_to_user((void __user *)arg,
751 &upstream_kmod,
752 sizeof(upstream_kmod));
753
754 if (ret != 0)
755 return -EIO;
756 else
757 return ret;
758
Yi Liu8bb8aef2015-11-24 15:12:14 -0500759 case ORANGEFS_DEV_CLIENT_MASK:
Mike Marshall5db11c22015-07-17 10:38:12 -0400760 ret = copy_from_user(&mask2_info,
761 (void __user *)arg,
762 sizeof(struct dev_mask2_info_s));
763
764 if (ret != 0)
765 return -EIO;
766
767 client_debug_mask.mask1 = mask2_info.mask1_value;
768 client_debug_mask.mask2 = mask2_info.mask2_value;
769
770 pr_info("%s: client debug mask has been been received "
771 ":%llx: :%llx:\n",
772 __func__,
773 (unsigned long long)client_debug_mask.mask1,
774 (unsigned long long)client_debug_mask.mask2);
775
776 return ret;
777
Yi Liu8bb8aef2015-11-24 15:12:14 -0500778 case ORANGEFS_DEV_CLIENT_STRING:
Mike Marshall5db11c22015-07-17 10:38:12 -0400779 ret = copy_from_user(&client_debug_array_string,
780 (void __user *)arg,
Yi Liu8bb8aef2015-11-24 15:12:14 -0500781 ORANGEFS_MAX_DEBUG_STRING_LEN);
Mike Marshall5db11c22015-07-17 10:38:12 -0400782 if (ret != 0) {
Mike Marshall97f10022015-12-11 16:45:03 -0500783 pr_info("%s: CLIENT_STRING: copy_from_user failed\n",
Mike Marshall5db11c22015-07-17 10:38:12 -0400784 __func__);
785 return -EIO;
786 }
787
Mike Marshall97f10022015-12-11 16:45:03 -0500788 pr_info("%s: client debug array string has been received.\n",
Mike Marshall5db11c22015-07-17 10:38:12 -0400789 __func__);
790
791 if (!help_string_initialized) {
792
793 /* Free the "we don't know yet" default string... */
794 kfree(debug_help_string);
795
796 /* build a proper debug help string */
797 if (orangefs_prepare_debugfs_help_string(0)) {
Mike Marshall97f10022015-12-11 16:45:03 -0500798 gossip_err("%s: no debug help string \n",
Mike Marshall5db11c22015-07-17 10:38:12 -0400799 __func__);
800 return -EIO;
801 }
802
803 /* Replace the boilerplate boot-time debug-help file. */
804 debugfs_remove(help_file_dentry);
805
806 help_file_dentry =
807 debugfs_create_file(
808 ORANGEFS_KMOD_DEBUG_HELP_FILE,
809 0444,
810 debug_dir,
811 debug_help_string,
812 &debug_help_fops);
813
814 if (!help_file_dentry) {
815 gossip_err("%s: debugfs_create_file failed for"
816 " :%s:!\n",
817 __func__,
818 ORANGEFS_KMOD_DEBUG_HELP_FILE);
819 return -EIO;
820 }
821 }
822
823 debug_mask_to_string(&client_debug_mask, 1);
824
825 debugfs_remove(client_debug_dentry);
826
Yi Liu8bb8aef2015-11-24 15:12:14 -0500827 orangefs_client_debug_init();
Mike Marshall5db11c22015-07-17 10:38:12 -0400828
829 help_string_initialized++;
830
831 return ret;
832
Yi Liu8bb8aef2015-11-24 15:12:14 -0500833 case ORANGEFS_DEV_DEBUG:
Mike Marshall5db11c22015-07-17 10:38:12 -0400834 ret = copy_from_user(&mask_info,
835 (void __user *)arg,
836 sizeof(mask_info));
837
838 if (ret != 0)
839 return -EIO;
840
841 if (mask_info.mask_type == KERNEL_MASK) {
842 if ((mask_info.mask_value == 0)
843 && (kernel_mask_set_mod_init)) {
844 /*
845 * the kernel debug mask was set when the
846 * kernel module was loaded; don't override
847 * it if the client-core was started without
Yi Liu8bb8aef2015-11-24 15:12:14 -0500848 * a value for ORANGEFS_KMODMASK.
Mike Marshall5db11c22015-07-17 10:38:12 -0400849 */
850 return 0;
851 }
852 debug_mask_to_string(&mask_info.mask_value,
853 mask_info.mask_type);
854 gossip_debug_mask = mask_info.mask_value;
Mike Marshall97f10022015-12-11 16:45:03 -0500855 pr_info("%s: kernel debug mask has been modified to "
Mike Marshall5db11c22015-07-17 10:38:12 -0400856 ":%s: :%llx:\n",
Mike Marshall97f10022015-12-11 16:45:03 -0500857 __func__,
Mike Marshall5db11c22015-07-17 10:38:12 -0400858 kernel_debug_string,
859 (unsigned long long)gossip_debug_mask);
860 } else if (mask_info.mask_type == CLIENT_MASK) {
861 debug_mask_to_string(&mask_info.mask_value,
862 mask_info.mask_type);
Mike Marshall97f10022015-12-11 16:45:03 -0500863 pr_info("%s: client debug mask has been modified to"
Mike Marshall5db11c22015-07-17 10:38:12 -0400864 ":%s: :%llx:\n",
Mike Marshall97f10022015-12-11 16:45:03 -0500865 __func__,
Mike Marshall5db11c22015-07-17 10:38:12 -0400866 client_debug_string,
867 llu(mask_info.mask_value));
868 } else {
869 gossip_lerr("Invalid mask type....\n");
870 return -EINVAL;
871 }
872
873 return ret;
874
875 default:
876 return -ENOIOCTLCMD;
877 }
878 return -ENOIOCTLCMD;
879}
880
/*
 * Native ioctl entry point for the request device.
 *
 * The command is first vetted by check_ioctl_command(); a negative
 * result is handed straight back to the caller.  Otherwise the command
 * and its argument are passed on to dispatch_ioctl_command().  Both
 * results are narrowed to int before being returned as long.
 */
static long orangefs_devreq_ioctl(struct file *file,
				   unsigned int command, unsigned long arg)
{
	long rc = check_ioctl_command(command);

	/* Reject improperly constructed commands */
	if (rc < 0)
		return (int)rc;

	return (int)dispatch_ioctl_command(command, arg);
}
893
894#ifdef CONFIG_COMPAT /* CONFIG_COMPAT is in .config */
895
Yi Liu8bb8aef2015-11-24 15:12:14 -0500896/* Compat structure for the ORANGEFS_DEV_MAP ioctl */
897struct ORANGEFS_dev_map_desc32 {
Mike Marshall5db11c22015-07-17 10:38:12 -0400898 compat_uptr_t ptr;
899 __s32 total_size;
900 __s32 size;
901 __s32 count;
902};
903
904static unsigned long translate_dev_map26(unsigned long args, long *error)
905{
Yi Liu8bb8aef2015-11-24 15:12:14 -0500906 struct ORANGEFS_dev_map_desc32 __user *p32 = (void __user *)args;
Mike Marshall5db11c22015-07-17 10:38:12 -0400907 /*
908 * Depending on the architecture, allocate some space on the
909 * user-call-stack based on our expected layout.
910 */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500911 struct ORANGEFS_dev_map_desc __user *p =
Mike Marshall5db11c22015-07-17 10:38:12 -0400912 compat_alloc_user_space(sizeof(*p));
Mike Marshall84d02152015-07-28 13:27:51 -0400913 compat_uptr_t addr;
Mike Marshall5db11c22015-07-17 10:38:12 -0400914
915 *error = 0;
916 /* get the ptr from the 32 bit user-space */
917 if (get_user(addr, &p32->ptr))
918 goto err;
919 /* try to put that into a 64-bit layout */
920 if (put_user(compat_ptr(addr), &p->ptr))
921 goto err;
922 /* copy the remaining fields */
923 if (copy_in_user(&p->total_size, &p32->total_size, sizeof(__s32)))
924 goto err;
925 if (copy_in_user(&p->size, &p32->size, sizeof(__s32)))
926 goto err;
927 if (copy_in_user(&p->count, &p32->count, sizeof(__s32)))
928 goto err;
929 return (unsigned long)p;
930err:
931 *error = -EFAULT;
932 return 0;
933}
934
935/*
936 * 32 bit user-space apps' ioctl handlers when kernel modules
937 * is compiled as a 64 bit one
938 */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500939static long orangefs_devreq_compat_ioctl(struct file *filp, unsigned int cmd,
Mike Marshall5db11c22015-07-17 10:38:12 -0400940 unsigned long args)
941{
942 long ret;
943 unsigned long arg = args;
944
945 /* Check for properly constructed commands */
946 ret = check_ioctl_command(cmd);
947 if (ret < 0)
948 return ret;
Yi Liu8bb8aef2015-11-24 15:12:14 -0500949 if (cmd == ORANGEFS_DEV_MAP) {
Mike Marshall5db11c22015-07-17 10:38:12 -0400950 /*
951 * convert the arguments to what we expect internally
952 * in kernel space
953 */
954 arg = translate_dev_map26(args, &ret);
955 if (ret < 0) {
956 gossip_err("Could not translate dev map\n");
957 return ret;
958 }
959 }
960 /* no other ioctl requires translation */
961 return dispatch_ioctl_command(cmd, arg);
962}
963
Mike Marshall2c590d52015-07-24 10:37:15 -0400964#endif /* CONFIG_COMPAT is in .config */
965
/*
 * The following two ioctl32 functions had been folded into the
 * CONFIG_COMPAT ifdef above, but that was an oversimplification that
 * went unnoticed until we tried to compile on PowerPC...
 */
971#if (defined(CONFIG_COMPAT) && !defined(HAVE_REGISTER_IOCTL32_CONVERSION)) || !defined(CONFIG_COMPAT)
/* Stub: there is nothing to register here, so always report success (0). */
static int orangefs_ioctl32_init(void)
{
	return 0;
}
976
/* Stub counterpart of orangefs_ioctl32_init(): nothing to undo. */
static void orangefs_ioctl32_cleanup(void)
{
}
Mike Marshall2c590d52015-07-24 10:37:15 -0400981#endif
Mike Marshall5db11c22015-07-17 10:38:12 -0400982
/*
 * The assigned character device major number: stored by
 * orangefs_dev_init() from register_chrdev() and handed back to
 * unregister_chrdev() in orangefs_dev_cleanup().
 */
static int orangefs_dev_major;
Mike Marshall5db11c22015-07-17 10:38:12 -0400985
986/*
Yi Liu8bb8aef2015-11-24 15:12:14 -0500987 * Initialize orangefs device specific state:
Mike Marshall5db11c22015-07-17 10:38:12 -0400988 * Must be called at module load time only
989 */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500990int orangefs_dev_init(void)
Mike Marshall5db11c22015-07-17 10:38:12 -0400991{
992 int ret;
993
994 /* register the ioctl32 sub-system */
Yi Liu8bb8aef2015-11-24 15:12:14 -0500995 ret = orangefs_ioctl32_init();
Mike Marshall5db11c22015-07-17 10:38:12 -0400996 if (ret < 0)
997 return ret;
998
Yi Liu8bb8aef2015-11-24 15:12:14 -0500999 /* register orangefs-req device */
1000 orangefs_dev_major = register_chrdev(0,
1001 ORANGEFS_REQDEVICE_NAME,
1002 &orangefs_devreq_file_operations);
1003 if (orangefs_dev_major < 0) {
Mike Marshall5db11c22015-07-17 10:38:12 -04001004 gossip_debug(GOSSIP_DEV_DEBUG,
1005 "Failed to register /dev/%s (error %d)\n",
Yi Liu8bb8aef2015-11-24 15:12:14 -05001006 ORANGEFS_REQDEVICE_NAME, orangefs_dev_major);
1007 orangefs_ioctl32_cleanup();
1008 return orangefs_dev_major;
Mike Marshall5db11c22015-07-17 10:38:12 -04001009 }
1010
1011 gossip_debug(GOSSIP_DEV_DEBUG,
1012 "*** /dev/%s character device registered ***\n",
Yi Liu8bb8aef2015-11-24 15:12:14 -05001013 ORANGEFS_REQDEVICE_NAME);
Mike Marshall5db11c22015-07-17 10:38:12 -04001014 gossip_debug(GOSSIP_DEV_DEBUG, "'mknod /dev/%s c %d 0'.\n",
Yi Liu8bb8aef2015-11-24 15:12:14 -05001015 ORANGEFS_REQDEVICE_NAME, orangefs_dev_major);
Mike Marshall5db11c22015-07-17 10:38:12 -04001016 return 0;
1017}
1018
Yi Liu8bb8aef2015-11-24 15:12:14 -05001019void orangefs_dev_cleanup(void)
Mike Marshall5db11c22015-07-17 10:38:12 -04001020{
Yi Liu8bb8aef2015-11-24 15:12:14 -05001021 unregister_chrdev(orangefs_dev_major, ORANGEFS_REQDEVICE_NAME);
Mike Marshall5db11c22015-07-17 10:38:12 -04001022 gossip_debug(GOSSIP_DEV_DEBUG,
1023 "*** /dev/%s character device unregistered ***\n",
Yi Liu8bb8aef2015-11-24 15:12:14 -05001024 ORANGEFS_REQDEVICE_NAME);
Mike Marshall5db11c22015-07-17 10:38:12 -04001025 /* unregister the ioctl32 sub-system */
Yi Liu8bb8aef2015-11-24 15:12:14 -05001026 orangefs_ioctl32_cleanup();
Mike Marshall5db11c22015-07-17 10:38:12 -04001027}
1028
Yi Liu8bb8aef2015-11-24 15:12:14 -05001029static unsigned int orangefs_devreq_poll(struct file *file,
Mike Marshall5db11c22015-07-17 10:38:12 -04001030 struct poll_table_struct *poll_table)
1031{
1032 int poll_revent_mask = 0;
1033
1034 if (open_access_count == 1) {
Yi Liu8bb8aef2015-11-24 15:12:14 -05001035 poll_wait(file, &orangefs_request_list_waitq, poll_table);
Mike Marshall5db11c22015-07-17 10:38:12 -04001036
Yi Liu8bb8aef2015-11-24 15:12:14 -05001037 spin_lock(&orangefs_request_list_lock);
1038 if (!list_empty(&orangefs_request_list))
Mike Marshall5db11c22015-07-17 10:38:12 -04001039 poll_revent_mask |= POLL_IN;
Yi Liu8bb8aef2015-11-24 15:12:14 -05001040 spin_unlock(&orangefs_request_list_lock);
Mike Marshall5db11c22015-07-17 10:38:12 -04001041 }
1042 return poll_revent_mask;
1043}
1044
Yi Liu8bb8aef2015-11-24 15:12:14 -05001045const struct file_operations orangefs_devreq_file_operations = {
Mike Marshall5db11c22015-07-17 10:38:12 -04001046 .owner = THIS_MODULE,
Yi Liu8bb8aef2015-11-24 15:12:14 -05001047 .read = orangefs_devreq_read,
1048 .write_iter = orangefs_devreq_write_iter,
1049 .open = orangefs_devreq_open,
1050 .release = orangefs_devreq_release,
1051 .unlocked_ioctl = orangefs_devreq_ioctl,
Mike Marshall5db11c22015-07-17 10:38:12 -04001052
1053#ifdef CONFIG_COMPAT /* CONFIG_COMPAT is in .config */
Yi Liu8bb8aef2015-11-24 15:12:14 -05001054 .compat_ioctl = orangefs_devreq_compat_ioctl,
Mike Marshall5db11c22015-07-17 10:38:12 -04001055#endif
Yi Liu8bb8aef2015-11-24 15:12:14 -05001056 .poll = orangefs_devreq_poll
Mike Marshall5db11c22015-07-17 10:38:12 -04001057};