Greg Kroah-Hartman | b244131 | 2017-11-01 15:07:57 +0100 | [diff] [blame] | 1 | /* SPDX-License-Identifier: GPL-2.0 */ |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 2 | #ifndef _FS_CEPH_OSD_CLIENT_H |
| 3 | #define _FS_CEPH_OSD_CLIENT_H |
| 4 | |
Ilya Dryomov | a02a946 | 2017-06-19 12:18:05 +0200 | [diff] [blame] | 5 | #include <linux/bitrev.h> |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 6 | #include <linux/completion.h> |
Sage Weil | 415e49a | 2009-12-07 13:37:03 -0800 | [diff] [blame] | 7 | #include <linux/kref.h> |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 8 | #include <linux/mempool.h> |
| 9 | #include <linux/rbtree.h> |
Elena Reshetova | 02113a0 | 2017-03-17 14:10:28 +0200 | [diff] [blame] | 10 | #include <linux/refcount.h> |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 11 | |
Alex Elder | 6c4a191 | 2012-05-16 15:16:38 -0500 | [diff] [blame] | 12 | #include <linux/ceph/types.h> |
| 13 | #include <linux/ceph/osdmap.h> |
| 14 | #include <linux/ceph/messenger.h> |
Ilya Dryomov | b2aa5d0 | 2016-06-07 21:57:15 +0200 | [diff] [blame] | 15 | #include <linux/ceph/msgpool.h> |
Alex Elder | 6c4a191 | 2012-05-16 15:16:38 -0500 | [diff] [blame] | 16 | #include <linux/ceph/auth.h> |
Alex Elder | c885837 | 2012-11-13 21:11:15 -0600 | [diff] [blame] | 17 | #include <linux/ceph/pagelist.h> |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 18 | |
/*
 * Forward declarations: let the declarations below refer to these types
 * by pointer ahead of (or without) their full definitions.
 */
| 19 | struct ceph_msg; |
| 20 | struct ceph_snap_context; |
| 21 | struct ceph_osd_request; |
| 22 | struct ceph_osd_client; |
| 23 | |
| 24 | /* |
| 25 | * completion callback for async writepages |
| 26 | */ |
/*
 * Takes the request as its only argument and returns nothing.  This is
 * the type of ceph_osd_request::r_callback.
 */
Ilya Dryomov | 85e084f | 2016-04-28 16:07:24 +0200 | [diff] [blame] | 27 | typedef void (*ceph_osdc_callback_t)(struct ceph_osd_request *); |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 28 | |
/*
 * Sentinel OSD number.  The value is parenthesized so the negative
 * literal stays a single operand wherever the macro is expanded.
 * NOTE(review): presumably the o_osd value used for
 * ceph_osd_client::homeless_osd -- confirm in osd_client.c.
 */
#define CEPH_HOMELESS_OSD	(-1)
| 30 | |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 31 | /* a given osd we're communicating with */ |
/*
 * Carries a refcount (o_ref), a pointer to a ceph_osd_client (o_osdc),
 * an embedded connection (o_con), rbtree roots for requests, linger
 * requests and backoffs, two list links and a mutex.
 * NOTE(review): which fields `lock` protects is not visible in this
 * header -- confirm in osd_client.c.
 */
| 32 | struct ceph_osd { |
Elena Reshetova | 02113a0 | 2017-03-17 14:10:28 +0200 | [diff] [blame] | 33 | refcount_t o_ref; |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 34 | struct ceph_osd_client *o_osdc; |
| 35 | int o_osd; |
| 36 | int o_incarnation; |
| 37 | struct rb_node o_node; |
| 38 | struct ceph_connection o_con; |
Ilya Dryomov | 5aea3dc | 2016-04-28 16:07:26 +0200 | [diff] [blame] | 39 | struct rb_root o_requests; |
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 40 | struct rb_root o_linger_requests; |
Ilya Dryomov | a02a946 | 2017-06-19 12:18:05 +0200 | [diff] [blame] | 41 | struct rb_root o_backoff_mappings; |
| 42 | struct rb_root o_backoffs_by_id; |
Yehuda Sadeh | f5a2041 | 2010-02-03 11:00:26 -0800 | [diff] [blame] | 43 | struct list_head o_osd_lru; |
Alex Elder | 6c4a191 | 2012-05-16 15:16:38 -0500 | [diff] [blame] | 44 | struct ceph_auth_handshake o_auth; |
Yehuda Sadeh | f5a2041 | 2010-02-03 11:00:26 -0800 | [diff] [blame] | 45 | unsigned long lru_ttl; |
Yehuda Sadeh | 422d2cb | 2010-02-26 15:32:31 -0800 | [diff] [blame] | 46 | struct list_head o_keepalive_item; |
Ilya Dryomov | 5aea3dc | 2016-04-28 16:07:26 +0200 | [diff] [blame] | 47 | struct mutex lock; |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 48 | }; |
| 49 | |
/*
 * Op-count constants.
 * NOTE(review): presumably CEPH_OSD_SLAB_OPS is the r_ops[] capacity of
 * slab-allocated requests and CEPH_OSD_MAX_OPS the per-request ceiling
 * -- confirm in osd_client.c.
 */
Ilya Dryomov | 3f1af42 | 2016-02-09 17:50:15 +0100 | [diff] [blame] | 50 | #define CEPH_OSD_SLAB_OPS 2 |
| 51 | #define CEPH_OSD_MAX_OPS 16 |
Sage Weil | 1b83bef | 2013-02-25 16:11:12 -0800 | [diff] [blame] | 52 | |
/*
 * Kinds of data a struct ceph_osd_data can describe (stored in its
 * `type` field).  CEPH_OSD_DATA_TYPE_BIO exists only when CONFIG_BLOCK
 * is set, so the numeric value of CEPH_OSD_DATA_TYPE_BVECS depends on
 * the kernel configuration -- compare by name, never by number.
 */
Alex Elder | 2ac2b7a | 2013-02-14 12:16:43 -0600 | [diff] [blame] | 53 | enum ceph_osd_data_type { |
Alex Elder | ec9123c | 2013-04-05 01:27:12 -0500 | [diff] [blame] | 54 | CEPH_OSD_DATA_TYPE_NONE = 0, |
Alex Elder | 2ac2b7a | 2013-02-14 12:16:43 -0600 | [diff] [blame] | 55 | CEPH_OSD_DATA_TYPE_PAGES, |
Alex Elder | 9a5e6d0 | 2013-03-08 13:35:36 -0600 | [diff] [blame] | 56 | CEPH_OSD_DATA_TYPE_PAGELIST, |
Alex Elder | 2ac2b7a | 2013-02-14 12:16:43 -0600 | [diff] [blame] | 57 | #ifdef CONFIG_BLOCK |
| 58 | CEPH_OSD_DATA_TYPE_BIO, |
| 59 | #endif /* CONFIG_BLOCK */ |
Ilya Dryomov | b9e281c | 2018-01-20 10:30:11 +0100 | [diff] [blame] | 60 | CEPH_OSD_DATA_TYPE_BVECS, |
Alex Elder | 2ac2b7a | 2013-02-14 12:16:43 -0600 | [diff] [blame] | 61 | }; |
| 62 | |
/*
 * Descriptor for a data buffer: a `type` tag followed by an anonymous
 * union with one member per representation -- a page vector, a
 * pagelist, a bio iterator (CONFIG_BLOCK only) or a bvec iterator.
 * NOTE(review): presumably `type` selects which union member is valid
 * -- confirm against the accessors in osd_client.c.
 */
Alex Elder | 2794a82 | 2013-02-14 12:16:43 -0600 | [diff] [blame] | 63 | struct ceph_osd_data { |
Alex Elder | 2ac2b7a | 2013-02-14 12:16:43 -0600 | [diff] [blame] | 64 | enum ceph_osd_data_type type; |
| 65 | union { |
Alex Elder | 2794a82 | 2013-02-14 12:16:43 -0600 | [diff] [blame] | 66 | struct { |
| 67 | struct page **pages; |
Alex Elder | e0c5948 | 2013-03-07 15:38:25 -0600 | [diff] [blame] | 68 | u64 length; |
Alex Elder | 2794a82 | 2013-02-14 12:16:43 -0600 | [diff] [blame] | 69 | u32 alignment; |
| 70 | bool pages_from_pool; |
| 71 | bool own_pages; |
| 72 | }; |
Alex Elder | 9a5e6d0 | 2013-03-08 13:35:36 -0600 | [diff] [blame] | 73 | struct ceph_pagelist *pagelist; |
Alex Elder | 2794a82 | 2013-02-14 12:16:43 -0600 | [diff] [blame] | 74 | #ifdef CONFIG_BLOCK |
Alex Elder | fdce58c | 2013-03-14 14:09:06 -0500 | [diff] [blame] | 75 | struct { |
Ilya Dryomov | 5359a17 | 2018-01-20 10:30:10 +0100 | [diff] [blame] | 76 | struct ceph_bio_iter bio_pos; |
| 77 | u32 bio_length; |
Alex Elder | fdce58c | 2013-03-14 14:09:06 -0500 | [diff] [blame] | 78 | }; |
Alex Elder | 2794a82 | 2013-02-14 12:16:43 -0600 | [diff] [blame] | 79 | #endif /* CONFIG_BLOCK */ |
Ilya Dryomov | 0010f70 | 2018-05-04 16:57:30 +0200 | [diff] [blame] | 80 | struct { |
| 81 | struct ceph_bvec_iter bvec_pos; |
| 82 | u32 num_bvecs; |
| 83 | }; |
Alex Elder | 2794a82 | 2013-02-14 12:16:43 -0600 | [diff] [blame] | 84 | }; |
| 85 | }; |
| 86 | |
/*
 * One operation of an OSD request; ceph_osd_request::r_ops[] is an
 * array of these.  The common fields (op, flags, data lengths, rval)
 * are followed by an anonymous union holding the per-operation payload
 * (raw data, extent, xattr, class call, watch, notify, ...).
 * NOTE(review): presumably `op` determines which union member is in use
 * -- confirm in osd_client.c.
 */
Alex Elder | 7952873 | 2013-04-03 21:32:51 -0500 | [diff] [blame] | 87 | struct ceph_osd_req_op { |
| 88 | u16 op; /* CEPH_OSD_OP_* */ |
Ilya Dryomov | 7b25bf5 | 2014-02-25 16:22:26 +0200 | [diff] [blame] | 89 | u32 flags; /* CEPH_OSD_OP_FLAG_* */ |
Ilya Dryomov | de2aa10 | 2016-02-08 13:39:46 +0100 | [diff] [blame] | 90 | u32 indata_len; /* request */ |
Yan, Zheng | 7665d85 | 2016-01-07 16:48:57 +0800 | [diff] [blame] | 91 | u32 outdata_len; /* reply */ |
| 92 | s32 rval; |
| 93 | |
Alex Elder | 7952873 | 2013-04-03 21:32:51 -0500 | [diff] [blame] | 94 | union { |
Alex Elder | 4971977 | 2013-02-11 12:33:24 -0600 | [diff] [blame] | 95 | struct ceph_osd_data raw_data_in; |
Alex Elder | 7952873 | 2013-04-03 21:32:51 -0500 | [diff] [blame] | 96 | struct { |
| 97 | u64 offset, length; |
| 98 | u64 truncate_size; |
| 99 | u32 truncate_seq; |
Alex Elder | 5476492 | 2013-04-05 01:27:12 -0500 | [diff] [blame] | 100 | struct ceph_osd_data osd_data; |
Alex Elder | 7952873 | 2013-04-03 21:32:51 -0500 | [diff] [blame] | 101 | } extent; |
| 102 | struct { |
Ilya Dryomov | d7d5a00 | 2014-12-19 14:00:41 +0300 | [diff] [blame] | 103 | u32 name_len; |
| 104 | u32 value_len; |
Yan, Zheng | d74b50b | 2014-11-12 14:00:43 +0800 | [diff] [blame] | 105 | __u8 cmp_op; /* CEPH_OSD_CMPXATTR_OP_* */ |
| 106 | __u8 cmp_mode; /* CEPH_OSD_CMPXATTR_MODE_* */ |
| 107 | struct ceph_osd_data osd_data; |
| 108 | } xattr; |
| 109 | struct { |
Alex Elder | 7952873 | 2013-04-03 21:32:51 -0500 | [diff] [blame] | 110 | const char *class_name; |
| 111 | const char *method_name; |
Alex Elder | 5476492 | 2013-04-05 01:27:12 -0500 | [diff] [blame] | 112 | struct ceph_osd_data request_info; |
Alex Elder | 04017e2 | 2013-04-05 14:46:02 -0500 | [diff] [blame] | 113 | struct ceph_osd_data request_data; |
Alex Elder | 5476492 | 2013-04-05 01:27:12 -0500 | [diff] [blame] | 114 | struct ceph_osd_data response_data; |
Alex Elder | 7952873 | 2013-04-03 21:32:51 -0500 | [diff] [blame] | 115 | __u8 class_len; |
| 116 | __u8 method_len; |
Ilya Dryomov | bb873b539 | 2016-05-26 00:29:52 +0200 | [diff] [blame] | 117 | u32 indata_len; |
Alex Elder | 7952873 | 2013-04-03 21:32:51 -0500 | [diff] [blame] | 118 | } cls; |
| 119 | struct { |
| 120 | u64 cookie; |
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 121 | __u8 op; /* CEPH_OSD_WATCH_OP_* */ |
| 122 | u32 gen; |
Alex Elder | 7952873 | 2013-04-03 21:32:51 -0500 | [diff] [blame] | 123 | } watch; |
Ilya Dryomov | c647b8a | 2014-02-25 16:22:27 +0200 | [diff] [blame] | 124 | struct { |
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 125 | struct ceph_osd_data request_data; |
| 126 | } notify_ack; |
| 127 | struct { |
Ilya Dryomov | 1907920 | 2016-04-28 16:07:27 +0200 | [diff] [blame] | 128 | u64 cookie; |
| 129 | struct ceph_osd_data request_data; |
| 130 | struct ceph_osd_data response_data; |
| 131 | } notify; |
| 132 | struct { |
Douglas Fuller | a4ed38d | 2015-07-17 13:18:07 -0700 | [diff] [blame] | 133 | struct ceph_osd_data response_data; |
| 134 | } list_watchers; |
| 135 | struct { |
Ilya Dryomov | c647b8a | 2014-02-25 16:22:27 +0200 | [diff] [blame] | 136 | u64 expected_object_size; |
| 137 | u64 expected_write_size; |
| 138 | } alloc_hint; |
Alex Elder | 7952873 | 2013-04-03 21:32:51 -0500 | [diff] [blame] | 139 | }; |
| 140 | }; |
| 141 | |
/*
 * Target description for a request: base and target object id/locator
 * pairs, the PG ids last mapped to, the acting/up OSD sets and related
 * map parameters, request flags, and the chosen `osd` number.
 * Embedded in ceph_osd_request (as r_t) and in ceph_osd_linger_request
 * (as t).
 */
Ilya Dryomov | 63244fa | 2016-04-28 16:07:23 +0200 | [diff] [blame] | 142 | struct ceph_osd_request_target { |
| 143 | struct ceph_object_id base_oid; |
| 144 | struct ceph_object_locator base_oloc; |
| 145 | struct ceph_object_id target_oid; |
| 146 | struct ceph_object_locator target_oloc; |
| 147 | |
Ilya Dryomov | dc98ff7 | 2017-06-15 16:30:53 +0200 | [diff] [blame] | 148 | struct ceph_pg pgid; /* last raw pg we mapped to */ |
| 149 | struct ceph_spg spgid; /* last actual spg we mapped to */ |
Ilya Dryomov | 63244fa | 2016-04-28 16:07:23 +0200 | [diff] [blame] | 150 | u32 pg_num; |
| 151 | u32 pg_num_mask; |
| 152 | struct ceph_osds acting; |
| 153 | struct ceph_osds up; |
| 154 | int size; |
| 155 | int min_size; |
| 156 | bool sort_bitwise; |
Ilya Dryomov | ae78dd8 | 2017-07-27 17:59:14 +0200 | [diff] [blame] | 157 | bool recovery_deletes; |
Ilya Dryomov | 63244fa | 2016-04-28 16:07:23 +0200 | [diff] [blame] | 158 | |
| 159 | unsigned int flags; /* CEPH_OSD_FLAG_* */ |
| 160 | bool paused; |
| 161 | |
Ilya Dryomov | 04c7d78 | 2017-06-15 16:30:55 +0200 | [diff] [blame] | 162 | u32 epoch; |
Ilya Dryomov | dc93e0e | 2017-06-05 14:45:00 +0200 | [diff] [blame] | 163 | u32 last_force_resend; |
| 164 | |
Ilya Dryomov | 63244fa | 2016-04-28 16:07:23 +0200 | [diff] [blame] | 165 | int osd; |
| 166 | }; |
| 167 | |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 168 | /* an in-flight request */ |
/*
 * Layout notes:
 *  - r_ops[] is a flexible array member, so it must remain the last
 *    field.  NOTE(review): presumably r_num_ops is the number of valid
 *    entries -- confirm in osd_client.c.
 *  - r_base_oid, r_base_oloc and r_flags are macros that expand to
 *    fields of the embedded r_t.  Although written inside the struct
 *    body, they are ordinary file-scope #defines.
 *  - The request is reference counted through r_kref.
 */
| 169 | struct ceph_osd_request { |
| 170 | u64 r_tid; /* unique for this client */ |
| 171 | struct rb_node r_node; |
Ilya Dryomov | 4609245 | 2016-04-28 16:07:27 +0200 | [diff] [blame] | 172 | struct rb_node r_mc_node; /* map check */ |
Ilya Dryomov | 88bc192 | 2018-05-21 16:00:29 +0200 | [diff] [blame^] | 173 | struct work_struct r_complete_work; |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 174 | struct ceph_osd *r_osd; |
Ilya Dryomov | a66dd38 | 2016-04-28 16:07:23 +0200 | [diff] [blame] | 175 | |
| 176 | struct ceph_osd_request_target r_t; |
| 177 | #define r_base_oid r_t.base_oid |
| 178 | #define r_base_oloc r_t.base_oloc |
| 179 | #define r_flags r_t.flags |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 180 | |
| 181 | struct ceph_msg *r_request, *r_reply; |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 182 | u32 r_sent; /* >0 if r_request is sending/sent */ |
Sage Weil | 1b83bef | 2013-02-25 16:11:12 -0800 | [diff] [blame] | 183 | |
Alex Elder | 7952873 | 2013-04-03 21:32:51 -0500 | [diff] [blame] | 184 | /* request osd ops array */ |
| 185 | unsigned int r_num_ops; |
Alex Elder | 7952873 | 2013-04-03 21:32:51 -0500 | [diff] [blame] | 186 | |
Sage Weil | 1b83bef | 2013-02-25 16:11:12 -0800 | [diff] [blame] | 187 | int r_result; |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 188 | |
| 189 | struct ceph_osd_client *r_osdc; |
Sage Weil | 415e49a | 2009-12-07 13:37:03 -0800 | [diff] [blame] | 190 | struct kref r_kref; |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 191 | bool r_mempool; |
Ilya Dryomov | b18b955 | 2017-02-11 18:46:08 +0100 | [diff] [blame] | 192 | struct completion r_completion; /* private to osd_client.c */ |
Alex Elder | 26be880 | 2013-04-15 11:20:42 -0500 | [diff] [blame] | 193 | ceph_osdc_callback_t r_callback; |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 194 | struct list_head r_unsafe_item; |
| 195 | |
| 196 | struct inode *r_inode; /* for use by callbacks */ |
Yehuda Sadeh | 3d14c5d | 2010-04-06 15:14:15 -0700 | [diff] [blame] | 197 | void *r_priv; /* ditto */ |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 198 | |
Ilya Dryomov | bb873b539 | 2016-05-26 00:29:52 +0200 | [diff] [blame] | 199 | /* set by submitter */ |
| 200 | u64 r_snapid; /* for reads, CEPH_NOSNAP o/w */ |
| 201 | struct ceph_snap_context *r_snapc; /* for writes */ |
| 202 | struct timespec r_mtime; /* ditto */ |
| 203 | u64 r_data_offset; /* ditto */ |
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 204 | bool r_linger; /* don't resend on failure */ |
Jeff Layton | a1f4020 | 2017-04-04 08:39:37 -0400 | [diff] [blame] | 205 | bool r_abort_on_full; /* return ENOSPC when full */ |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 206 | |
Ilya Dryomov | bb873b539 | 2016-05-26 00:29:52 +0200 | [diff] [blame] | 207 | /* internal */ |
| 208 | unsigned long r_stamp; /* jiffies, send or check time */ |
Ilya Dryomov | 7cc5e38 | 2017-02-12 17:11:07 +0100 | [diff] [blame] | 209 | unsigned long r_start_stamp; /* jiffies */ |
Ilya Dryomov | bb873b539 | 2016-05-26 00:29:52 +0200 | [diff] [blame] | 210 | int r_attempts; |
Ilya Dryomov | 4609245 | 2016-04-28 16:07:27 +0200 | [diff] [blame] | 211 | u32 r_map_dne_bound; |
Ilya Dryomov | 3f1af42 | 2016-02-09 17:50:15 +0100 | [diff] [blame] | 212 | |
| 213 | struct ceph_osd_req_op r_ops[]; |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 214 | }; |
| 215 | |
/*
 * Wraps a single object locator.
 * NOTE(review): presumably the redirect target decoded from an OSD
 * reply -- confirm in osd_client.c.
 */
Ilya Dryomov | 205ee118 | 2014-01-27 17:40:20 +0200 | [diff] [blame] | 216 | struct ceph_request_redirect { |
| 217 | struct ceph_object_locator oloc; |
| 218 | }; |
| 219 | |
Ilya Dryomov | 8cb441c | 2017-06-15 16:30:54 +0200 | [diff] [blame] | 220 | /* |
| 221 | * osd request identifier |
| 222 | * |
| 223 | * caller name + incarnation# + tid to uniquely identify this request |
| 224 | */ |
/*
 * Packed, with explicitly little-endian integer fields.
 * NOTE(review): presumably mirrors an encoded (on-wire) layout, so do
 * not reorder or resize fields -- confirm against the protocol.
 */
| 225 | struct ceph_osd_reqid { |
| 226 | struct ceph_entity_name name; |
| 227 | __le64 tid; |
| 228 | __le32 inc; |
| 229 | } __packed; |
| 230 | |
/*
 * Three little-endian 64-bit ids (trace, span, parent span), packed.
 * NOTE(review): presumably an encoded (on-wire) layout for blkin
 * tracing data -- confirm against the protocol before changing.
 */
| 231 | struct ceph_blkin_trace_info { |
| 232 | __le64 trace_id; |
| 233 | __le64 span_id; |
| 234 | __le64 parent_span_id; |
| 235 | } __packed; |
| 236 | |
/*
 * Watch callback types: rados_watchcb2_t is the type of
 * ceph_osd_linger_request::wcb and rados_watcherrcb_t the type of
 * ::errcb; both are also parameters of ceph_osdc_watch().
 * NOTE(review): `arg` is presumably the `data` pointer supplied to
 * ceph_osdc_watch() -- confirm in osd_client.c.
 */
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 237 | typedef void (*rados_watchcb2_t)(void *arg, u64 notify_id, u64 cookie, |
| 238 | u64 notifier_id, void *data, size_t data_len); |
| 239 | typedef void (*rados_watcherrcb_t)(void *arg, u64 cookie, int err); |
Yehuda Sadeh | a40c4f1 | 2011-03-21 15:07:16 -0700 | [diff] [blame] | 240 | |
/*
 * State for a lingering registration; is_watch tells a watch from a
 * notify.  The object is reference counted (kref), has its own mutex,
 * and can be linked into three rbtrees through node, osdc_node and
 * mc_node (see the per-field comments).  It embeds its own request
 * target (t) and keeps pointers to two requests (reg_req, ping_req).
 * NOTE(review): what `lock` protects and who owns preply_pages /
 * preply_len is not visible here -- confirm in osd_client.c.
 */
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 241 | struct ceph_osd_linger_request { |
| 242 | struct ceph_osd_client *osdc; |
| 243 | u64 linger_id; |
| 244 | bool committed; |
Ilya Dryomov | 1907920 | 2016-04-28 16:07:27 +0200 | [diff] [blame] | 245 | bool is_watch; /* watch or notify */ |
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 246 | |
| 247 | struct ceph_osd *osd; |
| 248 | struct ceph_osd_request *reg_req; |
| 249 | struct ceph_osd_request *ping_req; |
| 250 | unsigned long ping_sent; |
Ilya Dryomov | b07d3c4 | 2016-04-28 16:07:27 +0200 | [diff] [blame] | 251 | unsigned long watch_valid_thru; |
| 252 | struct list_head pending_lworks; |
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 253 | |
| 254 | struct ceph_osd_request_target t; |
Ilya Dryomov | 4609245 | 2016-04-28 16:07:27 +0200 | [diff] [blame] | 255 | u32 map_dne_bound; |
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 256 | |
| 257 | struct timespec mtime; |
| 258 | |
| 259 | struct kref kref; |
| 260 | struct mutex lock; |
| 261 | struct rb_node node; /* osd */ |
| 262 | struct rb_node osdc_node; /* osdc */ |
Ilya Dryomov | 4609245 | 2016-04-28 16:07:27 +0200 | [diff] [blame] | 263 | struct rb_node mc_node; /* map check */ |
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 264 | struct list_head scan_item; |
| 265 | |
| 266 | struct completion reg_commit_wait; |
Ilya Dryomov | 1907920 | 2016-04-28 16:07:27 +0200 | [diff] [blame] | 267 | struct completion notify_finish_wait; |
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 268 | int reg_commit_error; |
Ilya Dryomov | 1907920 | 2016-04-28 16:07:27 +0200 | [diff] [blame] | 269 | int notify_finish_error; |
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 270 | int last_error; |
| 271 | |
| 272 | u32 register_gen; |
Ilya Dryomov | 1907920 | 2016-04-28 16:07:27 +0200 | [diff] [blame] | 273 | u64 notify_id; |
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 274 | |
| 275 | rados_watchcb2_t wcb; |
| 276 | rados_watcherrcb_t errcb; |
| 277 | void *data; |
Ilya Dryomov | 1907920 | 2016-04-28 16:07:27 +0200 | [diff] [blame] | 278 | |
| 279 | struct page ***preply_pages; |
| 280 | size_t *preply_len; |
Yehuda Sadeh | a40c4f1 | 2011-03-21 15:07:16 -0700 | [diff] [blame] | 281 | }; |
| 282 | |
/*
 * One watcher record: entity name, cookie and address.
 * ceph_osdc_list_watchers() hands these back through its `watchers`
 * argument.
 */
Douglas Fuller | a4ed38d | 2015-07-17 13:18:07 -0700 | [diff] [blame] | 283 | struct ceph_watch_item { |
| 284 | struct ceph_entity_name name; |
| 285 | u64 cookie; |
| 286 | struct ceph_entity_addr addr; |
| 287 | }; |
| 288 | |
/*
 * Per-spgid container: an rbtree node, the spgid, and an rbtree root
 * named `backoffs`.
 * NOTE(review): presumably linked into ceph_osd::o_backoff_mappings
 * via `node`, with `backoffs` holding ceph_osd_backoff entries via
 * their spg_node -- confirm in osd_client.c.
 */
Ilya Dryomov | a02a946 | 2017-06-19 12:18:05 +0200 | [diff] [blame] | 289 | struct ceph_spg_mapping { |
| 290 | struct rb_node node; |
| 291 | struct ceph_spg spgid; |
| 292 | |
| 293 | struct rb_root backoffs; |
| 294 | }; |
| 295 | |
/*
 * Object id broken into components: key, oid and nspace are
 * pointer + length pairs; snapid, hash, is_max and pool are scalars.
 * hash_reverse_bits is a cache of bitrev32(hash), filled in by
 * ceph_hoid_build_hash_cache().
 * NOTE(review): ownership of the key/oid/nspace buffers is not visible
 * in this header -- confirm where they are allocated and freed.
 */
| 296 | struct ceph_hobject_id { |
| 297 | void *key; |
| 298 | size_t key_len; |
| 299 | void *oid; |
| 300 | size_t oid_len; |
| 301 | u64 snapid; |
| 302 | u32 hash; |
| 303 | u8 is_max; |
| 304 | void *nspace; |
| 305 | size_t nspace_len; |
| 306 | s64 pool; |
| 307 | |
| 308 | /* cache */ |
| 309 | u32 hash_reverse_bits; |
| 310 | }; |
| 311 | |
| 312 | static inline void ceph_hoid_build_hash_cache(struct ceph_hobject_id *hoid) |
| 313 | { |
| 314 | hoid->hash_reverse_bits = bitrev32(hoid->hash); |
| 315 | } |
| 316 | |
| 317 | /* |
| 318 | * PG-wide backoff: [begin, end) |
| 319 | * per-object backoff: begin == end |
| 320 | */ |
/*
 * Carries two rbtree nodes, so one backoff can sit in two trees at
 * once.
 * NOTE(review): presumably spg_node links it under a ceph_spg_mapping
 * and id_node under ceph_osd::o_backoffs_by_id; ownership of the
 * begin/end objects is not visible here -- confirm in osd_client.c.
 */
| 321 | struct ceph_osd_backoff { |
| 322 | struct rb_node spg_node; |
| 323 | struct rb_node id_node; |
| 324 | |
| 325 | struct ceph_spg spgid; |
| 326 | u64 id; |
| 327 | struct ceph_hobject_id *begin; |
| 328 | struct ceph_hobject_id *end; |
| 329 | }; |
| 330 | |
/*
 * 64-bit constant with the top 16 bits set.
 * NOTE(review): presumably the starting value for
 * ceph_osd_client::last_linger_id, keeping linger ids apart from
 * regular request tids -- confirm in osd_client.c.
 */
Ilya Dryomov | 264048a | 2016-11-08 15:15:24 +0100 | [diff] [blame] | 331 | #define CEPH_LINGER_ID_START 0xffff000000000000ULL |
| 332 | |
/*
 * Top-level OSD client state: the current osdmap, an rbtree of OSDs
 * plus an LRU list of idle ones, an embedded "homeless" ceph_osd, tid
 * and linger-id counters, rbtrees for linger requests and map checks,
 * request counters, two delayed works, a request mempool, two message
 * pools and two workqueues.  debugfs_file exists only when
 * CONFIG_DEBUG_FS is set.
 * NOTE(review): the locking rules for `lock` (an rw_semaphore) and
 * osd_lru_lock are not visible in this header -- confirm in
 * osd_client.c.
 */
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 333 | struct ceph_osd_client { |
| 334 | struct ceph_client *client; |
| 335 | |
| 336 | struct ceph_osdmap *osdmap; /* current map */ |
Ilya Dryomov | 5aea3dc | 2016-04-28 16:07:26 +0200 | [diff] [blame] | 337 | struct rw_semaphore lock; |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 338 | |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 339 | struct rb_root osds; /* osds */ |
Yehuda Sadeh | f5a2041 | 2010-02-03 11:00:26 -0800 | [diff] [blame] | 340 | struct list_head osd_lru; /* idle osds */ |
Ilya Dryomov | 9dd2845 | 2016-04-28 16:07:26 +0200 | [diff] [blame] | 341 | spinlock_t osd_lru_lock; |
Jeff Layton | 58eb793 | 2017-04-18 09:21:16 -0400 | [diff] [blame] | 342 | u32 epoch_barrier; |
Ilya Dryomov | 5aea3dc | 2016-04-28 16:07:26 +0200 | [diff] [blame] | 343 | struct ceph_osd homeless_osd; |
| 344 | atomic64_t last_tid; /* tid of last request */ |
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 345 | u64 last_linger_id; |
| 346 | struct rb_root linger_requests; /* lingering requests */ |
Ilya Dryomov | 4609245 | 2016-04-28 16:07:27 +0200 | [diff] [blame] | 347 | struct rb_root map_checks; |
| 348 | struct rb_root linger_map_checks; |
Ilya Dryomov | 5aea3dc | 2016-04-28 16:07:26 +0200 | [diff] [blame] | 349 | atomic_t num_requests; |
| 350 | atomic_t num_homeless; |
Ilya Dryomov | 66850df | 2018-05-15 15:47:58 +0200 | [diff] [blame] | 351 | int abort_err; |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 352 | struct delayed_work timeout_work; |
Yehuda Sadeh | f5a2041 | 2010-02-03 11:00:26 -0800 | [diff] [blame] | 353 | struct delayed_work osds_timeout_work; |
Sage Weil | 039934b | 2009-11-12 15:05:52 -0800 | [diff] [blame] | 354 | #ifdef CONFIG_DEBUG_FS |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 355 | struct dentry *debugfs_file; |
Sage Weil | 039934b | 2009-11-12 15:05:52 -0800 | [diff] [blame] | 356 | #endif |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 357 | |
| 358 | mempool_t *req_mempool; |
| 359 | |
Yehuda Sadeh | 0d59ab8 | 2010-01-13 17:03:23 -0800 | [diff] [blame] | 360 | struct ceph_msgpool msgpool_op; |
Sage Weil | c16e786 | 2010-03-01 13:02:00 -0800 | [diff] [blame] | 361 | struct ceph_msgpool msgpool_op_reply; |
Yehuda Sadeh | a40c4f1 | 2011-03-21 15:07:16 -0700 | [diff] [blame] | 362 | |
Yehuda Sadeh | a40c4f1 | 2011-03-21 15:07:16 -0700 | [diff] [blame] | 363 | struct workqueue_struct *notify_wq; |
Ilya Dryomov | 88bc192 | 2018-05-21 16:00:29 +0200 | [diff] [blame^] | 364 | struct workqueue_struct *completion_wq; |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 365 | }; |
| 366 | |
Ilya Dryomov | b7ec35b | 2016-04-28 16:07:25 +0200 | [diff] [blame] | 367 | static inline bool ceph_osdmap_flag(struct ceph_osd_client *osdc, int flag) |
| 368 | { |
| 369 | return osdc->osdmap->flags & flag; |
| 370 | } |
| 371 | |
/*
 * Setup and teardown entry points; the implementations are not in this
 * header.  ceph_osdc_setup()/ceph_osdc_cleanup() take no arguments,
 * while ceph_osdc_init()/ceph_osdc_stop() operate on one
 * ceph_osd_client.
 * NOTE(review): presumably the int returns are 0 or a negative errno
 * -- confirm in osd_client.c.
 */
Alex Elder | 5522ae0 | 2013-05-01 12:43:04 -0500 | [diff] [blame] | 372 | extern int ceph_osdc_setup(void); |
| 373 | extern void ceph_osdc_cleanup(void); |
| 374 | |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 375 | extern int ceph_osdc_init(struct ceph_osd_client *osdc, |
| 376 | struct ceph_client *client); |
| 377 | extern void ceph_osdc_stop(struct ceph_osd_client *osdc); |
| 378 | |
/*
 * Message handlers (each takes the client and a ceph_msg) and two
 * client-wide controls: updating the epoch barrier and aborting
 * requests with an error code.  Implementations are not in this
 * header.
 * NOTE(review): presumably these relate to
 * ceph_osd_client::epoch_barrier and ::abort_err respectively --
 * confirm in osd_client.c.
 */
| 379 | extern void ceph_osdc_handle_reply(struct ceph_osd_client *osdc, |
| 380 | struct ceph_msg *msg); |
| 381 | extern void ceph_osdc_handle_map(struct ceph_osd_client *osdc, |
| 382 | struct ceph_msg *msg); |
Jeff Layton | 58eb793 | 2017-04-18 09:21:16 -0400 | [diff] [blame] | 383 | void ceph_osdc_update_epoch_barrier(struct ceph_osd_client *osdc, u32 eb); |
Ilya Dryomov | 66850df | 2018-05-15 15:47:58 +0200 | [diff] [blame] | 384 | void ceph_osdc_abort_requests(struct ceph_osd_client *osdc, int err); |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 385 | |
/*
 * Generic op setup helpers.  Both take the request and an op index
 * (`which`).
 * NOTE(review): `which` presumably indexes ceph_osd_request::r_ops[],
 * and the page parameters presumably map onto the page-vector member
 * of struct ceph_osd_data (same field names) -- confirm in
 * osd_client.c.
 */
Alex Elder | 4971977 | 2013-02-11 12:33:24 -0600 | [diff] [blame] | 386 | extern void osd_req_op_init(struct ceph_osd_request *osd_req, |
Yan, Zheng | 144cba1 | 2015-04-27 11:09:54 +0800 | [diff] [blame] | 387 | unsigned int which, u16 opcode, u32 flags); |
Alex Elder | 4971977 | 2013-02-11 12:33:24 -0600 | [diff] [blame] | 388 | |
| 389 | extern void osd_req_op_raw_data_in_pages(struct ceph_osd_request *, |
| 390 | unsigned int which, |
| 391 | struct page **pages, u64 length, |
| 392 | u32 alignment, bool pages_from_pool, |
| 393 | bool own_pages); |
| 394 | |
/*
 * Extent op helpers: initialise an extent op, update its length, and
 * duplicate the previous op with an offset increment.
 * NOTE(review): the parameters presumably map onto the `extent` member
 * of struct ceph_osd_req_op (offset, length, truncate_size,
 * truncate_seq) -- confirm in osd_client.c.
 */
Alex Elder | c99d2d4 | 2013-04-05 01:27:11 -0500 | [diff] [blame] | 395 | extern void osd_req_op_extent_init(struct ceph_osd_request *osd_req, |
| 396 | unsigned int which, u16 opcode, |
Alex Elder | 33803f3 | 2013-03-13 20:50:00 -0500 | [diff] [blame] | 397 | u64 offset, u64 length, |
| 398 | u64 truncate_size, u32 truncate_seq); |
Alex Elder | c99d2d4 | 2013-04-05 01:27:11 -0500 | [diff] [blame] | 399 | extern void osd_req_op_extent_update(struct ceph_osd_request *osd_req, |
| 400 | unsigned int which, u64 length); |
Yan, Zheng | 2c63f49 | 2016-01-07 17:32:54 +0800 | [diff] [blame] | 401 | extern void osd_req_op_extent_dup_last(struct ceph_osd_request *osd_req, |
| 402 | unsigned int which, u64 offset_inc); |
Alex Elder | a4ce40a | 2013-04-05 01:27:12 -0500 | [diff] [blame] | 403 | |
/*
 * Accessor and setters for the data attached to an extent op, one
 * setter per data representation (pages, pagelist, bio, bvecs, bvec
 * iterator).  The bio variant is declared only when CONFIG_BLOCK is
 * set.
 * NOTE(review): presumably these fill ceph_osd_req_op::extent.osd_data
 * for op `which`; ownership of the passed buffers is not visible here
 * -- confirm in osd_client.c.
 */
| 404 | extern struct ceph_osd_data *osd_req_op_extent_osd_data( |
| 405 | struct ceph_osd_request *osd_req, |
Alex Elder | 406e2c9 | 2013-04-15 14:50:36 -0500 | [diff] [blame] | 406 | unsigned int which); |
Alex Elder | a4ce40a | 2013-04-05 01:27:12 -0500 | [diff] [blame] | 407 | |
| 408 | extern void osd_req_op_extent_osd_data_pages(struct ceph_osd_request *, |
Alex Elder | 406e2c9 | 2013-04-15 14:50:36 -0500 | [diff] [blame] | 409 | unsigned int which, |
Alex Elder | a4ce40a | 2013-04-05 01:27:12 -0500 | [diff] [blame] | 410 | struct page **pages, u64 length, |
| 411 | u32 alignment, bool pages_from_pool, |
| 412 | bool own_pages); |
| 413 | extern void osd_req_op_extent_osd_data_pagelist(struct ceph_osd_request *, |
Alex Elder | 406e2c9 | 2013-04-15 14:50:36 -0500 | [diff] [blame] | 414 | unsigned int which, |
Alex Elder | a4ce40a | 2013-04-05 01:27:12 -0500 | [diff] [blame] | 415 | struct ceph_pagelist *pagelist); |
| 416 | #ifdef CONFIG_BLOCK |
Ilya Dryomov | 5359a17 | 2018-01-20 10:30:10 +0100 | [diff] [blame] | 417 | void osd_req_op_extent_osd_data_bio(struct ceph_osd_request *osd_req, |
| 418 | unsigned int which, |
| 419 | struct ceph_bio_iter *bio_pos, |
| 420 | u32 bio_length); |
Alex Elder | a4ce40a | 2013-04-05 01:27:12 -0500 | [diff] [blame] | 421 | #endif /* CONFIG_BLOCK */ |
Ilya Dryomov | 0010f70 | 2018-05-04 16:57:30 +0200 | [diff] [blame] | 422 | void osd_req_op_extent_osd_data_bvecs(struct ceph_osd_request *osd_req, |
| 423 | unsigned int which, |
| 424 | struct bio_vec *bvecs, u32 num_bvecs, |
| 425 | u32 bytes); |
Ilya Dryomov | b9e281c | 2018-01-20 10:30:11 +0100 | [diff] [blame] | 426 | void osd_req_op_extent_osd_data_bvec_pos(struct ceph_osd_request *osd_req, |
| 427 | unsigned int which, |
| 428 | struct ceph_bvec_iter *bvec_pos); |
Alex Elder | a4ce40a | 2013-04-05 01:27:12 -0500 | [diff] [blame] | 429 | |
/*
 * Helpers for class-call (cls), xattr and alloc-hint ops.
 * osd_req_op_cls_init() and osd_req_op_xattr_init() return int; the
 * others return nothing.
 * NOTE(review): presumably the int returns are 0 or a negative errno
 * and the data setters fill the request_data / response_data members
 * of ceph_osd_req_op::cls -- confirm in osd_client.c.
 */
Alex Elder | 04017e2 | 2013-04-05 14:46:02 -0500 | [diff] [blame] | 430 | extern void osd_req_op_cls_request_data_pagelist(struct ceph_osd_request *, |
| 431 | unsigned int which, |
| 432 | struct ceph_pagelist *pagelist); |
Alex Elder | 6c57b55 | 2013-04-19 15:34:49 -0500 | [diff] [blame] | 433 | extern void osd_req_op_cls_request_data_pages(struct ceph_osd_request *, |
| 434 | unsigned int which, |
| 435 | struct page **pages, u64 length, |
| 436 | u32 alignment, bool pages_from_pool, |
| 437 | bool own_pages); |
Ilya Dryomov | b9e281c | 2018-01-20 10:30:11 +0100 | [diff] [blame] | 438 | void osd_req_op_cls_request_data_bvecs(struct ceph_osd_request *osd_req, |
| 439 | unsigned int which, |
Ilya Dryomov | 0010f70 | 2018-05-04 16:57:30 +0200 | [diff] [blame] | 440 | struct bio_vec *bvecs, u32 num_bvecs, |
| 441 | u32 bytes); |
Alex Elder | a4ce40a | 2013-04-05 01:27:12 -0500 | [diff] [blame] | 442 | extern void osd_req_op_cls_response_data_pages(struct ceph_osd_request *, |
Alex Elder | c99d2d4 | 2013-04-05 01:27:11 -0500 | [diff] [blame] | 443 | unsigned int which, |
Alex Elder | a4ce40a | 2013-04-05 01:27:12 -0500 | [diff] [blame] | 444 | struct page **pages, u64 length, |
| 445 | u32 alignment, bool pages_from_pool, |
| 446 | bool own_pages); |
Chengguang Xu | fe943d5 | 2018-04-12 12:04:55 +0800 | [diff] [blame] | 447 | extern int osd_req_op_cls_init(struct ceph_osd_request *osd_req, |
Alex Elder | c99d2d4 | 2013-04-05 01:27:11 -0500 | [diff] [blame] | 448 | unsigned int which, u16 opcode, |
Alex Elder | 04017e2 | 2013-04-05 14:46:02 -0500 | [diff] [blame] | 449 | const char *class, const char *method); |
Yan, Zheng | d74b50b | 2014-11-12 14:00:43 +0800 | [diff] [blame] | 450 | extern int osd_req_op_xattr_init(struct ceph_osd_request *osd_req, unsigned int which, |
| 451 | u16 opcode, const char *name, const void *value, |
| 452 | size_t size, u8 cmp_op, u8 cmp_mode); |
Ilya Dryomov | c647b8a | 2014-02-25 16:22:27 +0200 | [diff] [blame] | 453 | extern void osd_req_op_alloc_hint_init(struct ceph_osd_request *osd_req, |
| 454 | unsigned int which, |
| 455 | u64 expected_object_size, |
| 456 | u64 expected_write_size); |
Alex Elder | 33803f3 | 2013-03-13 20:50:00 -0500 | [diff] [blame] | 457 | |
/*
 * Request construction.  ceph_osdc_alloc_request() and
 * ceph_osdc_new_request() return a request pointer;
 * ceph_osdc_alloc_messages() returns int.  Note that
 * ceph_osdc_new_request() takes `len` by pointer.
 * NOTE(review): failure conventions (NULL vs ERR_PTR, negative errno)
 * and whether *len can be modified are not visible here -- confirm in
 * osd_client.c.
 */
Yehuda Sadeh | 3499e8a | 2010-04-06 14:51:47 -0700 | [diff] [blame] | 458 | extern struct ceph_osd_request *ceph_osdc_alloc_request(struct ceph_osd_client *osdc, |
Yehuda Sadeh | 3499e8a | 2010-04-06 14:51:47 -0700 | [diff] [blame] | 459 | struct ceph_snap_context *snapc, |
Alex Elder | acead00 | 2013-03-14 14:09:05 -0500 | [diff] [blame] | 460 | unsigned int num_ops, |
Yehuda Sadeh | 3499e8a | 2010-04-06 14:51:47 -0700 | [diff] [blame] | 461 | bool use_mempool, |
Alex Elder | 54a5400 | 2012-11-13 21:11:15 -0600 | [diff] [blame] | 462 | gfp_t gfp_flags); |
Ilya Dryomov | 13d1ad1 | 2016-04-27 14:15:51 +0200 | [diff] [blame] | 463 | int ceph_osdc_alloc_messages(struct ceph_osd_request *req, gfp_t gfp); |
Yehuda Sadeh | 3499e8a | 2010-04-06 14:51:47 -0700 | [diff] [blame] | 464 | |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 465 | extern struct ceph_osd_request *ceph_osdc_new_request(struct ceph_osd_client *, |
| 466 | struct ceph_file_layout *layout, |
| 467 | struct ceph_vino vino, |
Alex Elder | acead00 | 2013-03-14 14:09:05 -0500 | [diff] [blame] | 468 | u64 offset, u64 *len, |
Yan, Zheng | 715e4cd | 2014-11-13 14:40:37 +0800 | [diff] [blame] | 469 | unsigned int which, int num_ops, |
| 470 | int opcode, int flags, |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 471 | struct ceph_snap_context *snapc, |
Alex Elder | acead00 | 2013-03-14 14:09:05 -0500 | [diff] [blame] | 472 | u32 truncate_seq, u64 truncate_size, |
Alex Elder | 153e516 | 2013-03-01 18:00:15 -0600 | [diff] [blame] | 473 | bool use_mempool); |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 474 | |
/*
 * Request lifetime and submission: get/put a request, start, cancel
 * and wait for one, plus client-wide sync, notify flush and map
 * request.
 * NOTE(review): presumably get/put adjust ceph_osd_request::r_kref and
 * the int returns are 0 or a negative errno; blocking behaviour is not
 * visible here -- confirm in osd_client.c.
 */
Ilya Dryomov | 9e94af2 | 2014-06-20 14:14:42 +0400 | [diff] [blame] | 475 | extern void ceph_osdc_get_request(struct ceph_osd_request *req); |
| 476 | extern void ceph_osdc_put_request(struct ceph_osd_request *req); |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 477 | |
| 478 | extern int ceph_osdc_start_request(struct ceph_osd_client *osdc, |
| 479 | struct ceph_osd_request *req, |
| 480 | bool nofail); |
Ilya Dryomov | c9f9b93 | 2014-06-19 11:38:13 +0400 | [diff] [blame] | 481 | extern void ceph_osdc_cancel_request(struct ceph_osd_request *req); |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 482 | extern int ceph_osdc_wait_request(struct ceph_osd_client *osdc, |
| 483 | struct ceph_osd_request *req); |
| 484 | extern void ceph_osdc_sync(struct ceph_osd_client *osdc); |
| 485 | |
Josh Durgin | dd935f4 | 2013-08-28 21:43:09 -0700 | [diff] [blame] | 486 | extern void ceph_osdc_flush_notifies(struct ceph_osd_client *osdc); |
Ilya Dryomov | 7cca78c | 2016-04-28 16:07:28 +0200 | [diff] [blame] | 487 | void ceph_osdc_maybe_request_map(struct ceph_osd_client *osdc); |
Josh Durgin | dd935f4 | 2013-08-28 21:43:09 -0700 | [diff] [blame] | 488 | |
/*
 * Higher-level helpers: a class method call on an object
 * (ceph_osdc_call) and page-vector reads and writes
 * (ceph_osdc_readpages / ceph_osdc_writepages).  ceph_osdc_call() takes
 * resp_len and ceph_osdc_readpages() takes plen by pointer.
 * NOTE(review): presumably these are synchronous, use the pointer
 * arguments as in/out lengths, and return a negative errno on failure
 * -- confirm in osd_client.c.
 */
Douglas Fuller | 428a715 | 2015-06-17 14:49:45 -0400 | [diff] [blame] | 489 | int ceph_osdc_call(struct ceph_osd_client *osdc, |
| 490 | struct ceph_object_id *oid, |
| 491 | struct ceph_object_locator *oloc, |
| 492 | const char *class, const char *method, |
| 493 | unsigned int flags, |
| 494 | struct page *req_page, size_t req_len, |
| 495 | struct page *resp_page, size_t *resp_len); |
| 496 | |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 497 | extern int ceph_osdc_readpages(struct ceph_osd_client *osdc, |
| 498 | struct ceph_vino vino, |
| 499 | struct ceph_file_layout *layout, |
| 500 | u64 off, u64 *plen, |
| 501 | u32 truncate_seq, u64 truncate_size, |
Sage Weil | b7495fc | 2010-11-09 12:43:12 -0800 | [diff] [blame] | 502 | struct page **pages, int nr_pages, |
| 503 | int page_align); |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 504 | |
| 505 | extern int ceph_osdc_writepages(struct ceph_osd_client *osdc, |
| 506 | struct ceph_vino vino, |
| 507 | struct ceph_file_layout *layout, |
| 508 | struct ceph_snap_context *sc, |
| 509 | u64 off, u64 len, |
| 510 | u32 truncate_seq, u64 truncate_size, |
| 511 | struct timespec *mtime, |
Alex Elder | 2480882 | 2013-02-15 11:42:29 -0600 | [diff] [blame] | 512 | struct page **pages, int nr_pages); |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 513 | |
Ilya Dryomov | 922dab6 | 2016-05-26 01:15:02 +0200 | [diff] [blame] | 514 | /* watch/notify */ |
/*
 * ceph_osdc_watch() returns a ceph_osd_linger_request pointer that is
 * later passed to ceph_osdc_unwatch() and ceph_osdc_watch_check().  The
 * remaining functions return int.  ceph_osdc_notify() and
 * ceph_osdc_list_watchers() hand results back through pointer
 * arguments (preply_pages/preply_len, watchers/num_watchers).
 * NOTE(review): failure convention of ceph_osdc_watch() (NULL vs
 * ERR_PTR) and who frees the returned pages / watcher items are not
 * visible here -- confirm in osd_client.c.
 */
| 515 | struct ceph_osd_linger_request * |
| 516 | ceph_osdc_watch(struct ceph_osd_client *osdc, |
| 517 | struct ceph_object_id *oid, |
| 518 | struct ceph_object_locator *oloc, |
| 519 | rados_watchcb2_t wcb, |
| 520 | rados_watcherrcb_t errcb, |
| 521 | void *data); |
| 522 | int ceph_osdc_unwatch(struct ceph_osd_client *osdc, |
| 523 | struct ceph_osd_linger_request *lreq); |
| 524 | |
| 525 | int ceph_osdc_notify_ack(struct ceph_osd_client *osdc, |
| 526 | struct ceph_object_id *oid, |
| 527 | struct ceph_object_locator *oloc, |
| 528 | u64 notify_id, |
| 529 | u64 cookie, |
| 530 | void *payload, |
| 531 | size_t payload_len); |
Ilya Dryomov | 1907920 | 2016-04-28 16:07:27 +0200 | [diff] [blame] | 532 | int ceph_osdc_notify(struct ceph_osd_client *osdc, |
| 533 | struct ceph_object_id *oid, |
| 534 | struct ceph_object_locator *oloc, |
| 535 | void *payload, |
| 536 | size_t payload_len, |
| 537 | u32 timeout, |
| 538 | struct page ***preply_pages, |
| 539 | size_t *preply_len); |
Ilya Dryomov | b07d3c4 | 2016-04-28 16:07:27 +0200 | [diff] [blame] | 540 | int ceph_osdc_watch_check(struct ceph_osd_client *osdc, |
| 541 | struct ceph_osd_linger_request *lreq); |
Douglas Fuller | a4ed38d | 2015-07-17 13:18:07 -0700 | [diff] [blame] | 542 | int ceph_osdc_list_watchers(struct ceph_osd_client *osdc, |
| 543 | struct ceph_object_id *oid, |
| 544 | struct ceph_object_locator *oloc, |
| 545 | struct ceph_watch_item **watchers, |
| 546 | u32 *num_watchers); |
Sage Weil | f24e998 | 2009-10-06 11:31:10 -0700 | [diff] [blame] | 547 | #endif |
| 548 | |