blob: 7ffd719d89defcfef77565e552d066cab68fab8c [file] [log] [blame]
Thomas Gleixner09c434b2019-05-19 13:08:20 +01001// SPDX-License-Identifier: GPL-2.0-only
Rusty Russelle467cde2007-10-22 11:03:38 +10002//#define DEBUG
3#include <linux/spinlock.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +09004#include <linux/slab.h>
Rusty Russelle467cde2007-10-22 11:03:38 +10005#include <linux/blkdev.h>
6#include <linux/hdreg.h>
Paul Gortmaker0c8d44f2011-07-01 15:56:05 -04007#include <linux/module.h>
Michael S. Tsirkin4678d6f92012-01-12 15:44:44 +10308#include <linux/mutex.h>
Christoph Hellwigad714732017-02-05 18:15:25 +01009#include <linux/interrupt.h>
Rusty Russelle467cde2007-10-22 11:03:38 +100010#include <linux/virtio.h>
11#include <linux/virtio_blk.h>
Jens Axboe3d1266c2007-10-24 13:21:21 +020012#include <linux/scatterlist.h>
Christoph Hellwig7a7c9242011-02-01 21:43:48 +010013#include <linux/string_helpers.h>
Liu Yuan6917f832011-04-24 02:49:26 +080014#include <scsi/scsi_cmnd.h>
Michael S. Tsirkin5087a502011-10-30 21:29:59 +020015#include <linux/idr.h>
Jens Axboe1cf7e9c2013-11-01 10:52:52 -060016#include <linux/blk-mq.h>
Christoph Hellwigad714732017-02-05 18:15:25 +010017#include <linux/blk-mq-virtio.h>
Jens Axboe1cf7e9c2013-11-01 10:52:52 -060018#include <linux/numa.h>
Jens Axboe3d1266c2007-10-24 13:21:21 +020019
Christian Borntraeger4f3bf192008-01-31 15:53:53 +010020#define PART_BITS 4
Ming Lei6a27b652014-06-26 17:41:48 +080021#define VQ_NAME_LEN 16
Changpeng Liu1f238162018-11-01 15:40:35 -070022#define MAX_DISCARD_SEGMENTS 256u
Rusty Russelle467cde2007-10-22 11:03:38 +100023
Michael S. Tsirkin5087a502011-10-30 21:29:59 +020024static int major;
25static DEFINE_IDA(vd_index_ida);
26
Jonghwan Choi2a647bf2013-05-20 10:25:39 +093027static struct workqueue_struct *virtblk_wq;
Christian Borntraeger4f3bf192008-01-31 15:53:53 +010028
Ming Lei6a27b652014-06-26 17:41:48 +080029struct virtio_blk_vq {
30 struct virtqueue *vq;
31 spinlock_t lock;
32 char name[VQ_NAME_LEN];
33} ____cacheline_aligned_in_smp;
34
Michael S. Tsirkinbb6ec572015-01-15 13:33:31 +020035struct virtio_blk {
Rusty Russelle467cde2007-10-22 11:03:38 +100036 struct virtio_device *vdev;
Rusty Russelle467cde2007-10-22 11:03:38 +100037
38 /* The disk structure for the kernel. */
39 struct gendisk *disk;
40
Christoph Hellwig24d2f902014-04-15 14:14:00 -060041 /* Block layer tags. */
42 struct blk_mq_tag_set tag_set;
43
Christoph Hellwig7a7c9242011-02-01 21:43:48 +010044 /* Process context for config space updates */
45 struct work_struct config_work;
46
Rusty Russell0864b792008-12-30 09:26:05 -060047 /* What host tells us, plus 2 for header & tailer. */
48 unsigned int sg_elems;
49
Michael S. Tsirkin5087a502011-10-30 21:29:59 +020050 /* Ida index - used to track minor number allocations. */
51 int index;
Ming Lei6a27b652014-06-26 17:41:48 +080052
53 /* num of vqs */
54 int num_vqs;
55 struct virtio_blk_vq *vqs;
Rusty Russelle467cde2007-10-22 11:03:38 +100056};
57
Michael S. Tsirkinbb6ec572015-01-15 13:33:31 +020058struct virtblk_req {
Christoph Hellwig97b50a62017-01-28 09:32:53 +010059#ifdef CONFIG_VIRTIO_BLK_SCSI
60 struct scsi_request sreq; /* for SCSI passthrough, must be first */
Christoph Hellwiga14d7492017-01-09 08:56:23 -070061 u8 sense[SCSI_SENSE_BUFFERSIZE];
Christoph Hellwig97b50a62017-01-28 09:32:53 +010062 struct virtio_scsi_inhdr in_hdr;
63#endif
64 struct virtio_blk_outhdr out_hdr;
65 u8 status;
Asias Hea98755c2012-08-08 16:07:04 +080066 struct scatterlist sg[];
Rusty Russelle467cde2007-10-22 11:03:38 +100067};
68
Christoph Hellwig2a842ac2017-06-03 09:38:04 +020069static inline blk_status_t virtblk_result(struct virtblk_req *vbr)
Asias Hea98755c2012-08-08 16:07:04 +080070{
71 switch (vbr->status) {
72 case VIRTIO_BLK_S_OK:
Christoph Hellwig2a842ac2017-06-03 09:38:04 +020073 return BLK_STS_OK;
Asias Hea98755c2012-08-08 16:07:04 +080074 case VIRTIO_BLK_S_UNSUPP:
Christoph Hellwig2a842ac2017-06-03 09:38:04 +020075 return BLK_STS_NOTSUPP;
Asias Hea98755c2012-08-08 16:07:04 +080076 default:
Christoph Hellwig2a842ac2017-06-03 09:38:04 +020077 return BLK_STS_IOERR;
Asias Hea98755c2012-08-08 16:07:04 +080078 }
79}
80
/*
 * If this is a packet command we need a couple of additional headers.  Behind
 * the normal outhdr we put a segment with the scsi command block, and before
 * the normal inhdr we put the sense data and the inhdr with additional status
 * information.
 */
87#ifdef CONFIG_VIRTIO_BLK_SCSI
88static int virtblk_add_req_scsi(struct virtqueue *vq, struct virtblk_req *vbr,
89 struct scatterlist *data_sg, bool have_data)
Asias Hec85a1f92012-08-08 16:07:05 +080090{
Paolo Bonzini20af3cf2013-03-20 15:44:27 +103091 struct scatterlist hdr, status, cmd, sense, inhdr, *sgs[6];
Paolo Bonzini8f39db92013-03-20 15:44:27 +103092 unsigned int num_out = 0, num_in = 0;
93
94 sg_init_one(&hdr, &vbr->out_hdr, sizeof(vbr->out_hdr));
95 sgs[num_out++] = &hdr;
Christoph Hellwig97b50a62017-01-28 09:32:53 +010096 sg_init_one(&cmd, vbr->sreq.cmd, vbr->sreq.cmd_len);
97 sgs[num_out++] = &cmd;
Paolo Bonzini20af3cf2013-03-20 15:44:27 +103098
Rusty Russell0a11cc32013-03-20 15:44:27 +103099 if (have_data) {
Michael S. Tsirkin19c1c5a2014-10-07 16:39:49 +0200100 if (vbr->out_hdr.type & cpu_to_virtio32(vq->vdev, VIRTIO_BLK_T_OUT))
Paolo Bonzini20af3cf2013-03-20 15:44:27 +1030101 sgs[num_out++] = data_sg;
Paolo Bonzini8f39db92013-03-20 15:44:27 +1030102 else
Paolo Bonzini20af3cf2013-03-20 15:44:27 +1030103 sgs[num_out + num_in++] = data_sg;
104 }
105
Christoph Hellwig97b50a62017-01-28 09:32:53 +0100106 sg_init_one(&sense, vbr->sense, SCSI_SENSE_BUFFERSIZE);
107 sgs[num_out + num_in++] = &sense;
108 sg_init_one(&inhdr, &vbr->in_hdr, sizeof(vbr->in_hdr));
109 sgs[num_out + num_in++] = &inhdr;
110 sg_init_one(&status, &vbr->status, sizeof(vbr->status));
111 sgs[num_out + num_in++] = &status;
112
113 return virtqueue_add_sgs(vq, sgs, num_out, num_in, vbr, GFP_ATOMIC);
114}
115
Christoph Hellwiga1a6e62b2017-04-20 16:02:59 +0200116static inline void virtblk_scsi_request_done(struct request *req)
Christoph Hellwig97b50a62017-01-28 09:32:53 +0100117{
118 struct virtblk_req *vbr = blk_mq_rq_to_pdu(req);
119 struct virtio_blk *vblk = req->q->queuedata;
120 struct scsi_request *sreq = &vbr->sreq;
121
122 sreq->resid_len = virtio32_to_cpu(vblk->vdev, vbr->in_hdr.residual);
123 sreq->sense_len = virtio32_to_cpu(vblk->vdev, vbr->in_hdr.sense_len);
Christoph Hellwig17d53632017-04-20 16:03:01 +0200124 sreq->result = virtio32_to_cpu(vblk->vdev, vbr->in_hdr.errors);
Christoph Hellwig97b50a62017-01-28 09:32:53 +0100125}
126
127static int virtblk_ioctl(struct block_device *bdev, fmode_t mode,
128 unsigned int cmd, unsigned long data)
129{
130 struct gendisk *disk = bdev->bd_disk;
131 struct virtio_blk *vblk = disk->private_data;
132
133 /*
134 * Only allow the generic SCSI ioctls if the host can support it.
135 */
136 if (!virtio_has_feature(vblk->vdev, VIRTIO_BLK_F_SCSI))
137 return -ENOTTY;
138
139 return scsi_cmd_blk_ioctl(bdev, mode, cmd,
140 (void __user *)data);
141}
142#else
143static inline int virtblk_add_req_scsi(struct virtqueue *vq,
144 struct virtblk_req *vbr, struct scatterlist *data_sg,
145 bool have_data)
146{
147 return -EIO;
148}
/* Stub used when CONFIG_VIRTIO_BLK_SCSI is off: nothing to copy back. */
static inline void virtblk_scsi_request_done(struct request *req)
{
}
152#define virtblk_ioctl NULL
153#endif /* CONFIG_VIRTIO_BLK_SCSI */
154
155static int virtblk_add_req(struct virtqueue *vq, struct virtblk_req *vbr,
156 struct scatterlist *data_sg, bool have_data)
157{
158 struct scatterlist hdr, status, *sgs[3];
159 unsigned int num_out = 0, num_in = 0;
160
161 sg_init_one(&hdr, &vbr->out_hdr, sizeof(vbr->out_hdr));
162 sgs[num_out++] = &hdr;
163
164 if (have_data) {
165 if (vbr->out_hdr.type & cpu_to_virtio32(vq->vdev, VIRTIO_BLK_T_OUT))
166 sgs[num_out++] = data_sg;
167 else
168 sgs[num_out + num_in++] = data_sg;
Paolo Bonzini8f39db92013-03-20 15:44:27 +1030169 }
170
171 sg_init_one(&status, &vbr->status, sizeof(vbr->status));
172 sgs[num_out + num_in++] = &status;
173
174 return virtqueue_add_sgs(vq, sgs, num_out, num_in, vbr, GFP_ATOMIC);
Paolo Bonzini5ee21a52013-03-20 15:44:27 +1030175}
Asias Hec85a1f92012-08-08 16:07:05 +0800176
Changpeng Liu1f238162018-11-01 15:40:35 -0700177static int virtblk_setup_discard_write_zeroes(struct request *req, bool unmap)
178{
179 unsigned short segments = blk_rq_nr_discard_segments(req);
180 unsigned short n = 0;
181 struct virtio_blk_discard_write_zeroes *range;
182 struct bio *bio;
183 u32 flags = 0;
184
185 if (unmap)
186 flags |= VIRTIO_BLK_WRITE_ZEROES_FLAG_UNMAP;
187
188 range = kmalloc_array(segments, sizeof(*range), GFP_ATOMIC);
189 if (!range)
190 return -ENOMEM;
191
192 __rq_for_each_bio(bio, req) {
193 u64 sector = bio->bi_iter.bi_sector;
194 u32 num_sectors = bio->bi_iter.bi_size >> SECTOR_SHIFT;
195
196 range[n].flags = cpu_to_le32(flags);
197 range[n].num_sectors = cpu_to_le32(num_sectors);
198 range[n].sector = cpu_to_le64(sector);
199 n++;
200 }
201
202 req->special_vec.bv_page = virt_to_page(range);
203 req->special_vec.bv_offset = offset_in_page(range);
204 req->special_vec.bv_len = sizeof(*range) * segments;
205 req->rq_flags |= RQF_SPECIAL_PAYLOAD;
206
207 return 0;
208}
209
Christoph Hellwig5124c282014-02-10 03:24:39 -0800210static inline void virtblk_request_done(struct request *req)
Asias Hec85a1f92012-08-08 16:07:05 +0800211{
Christoph Hellwig9d74e252014-04-14 10:30:07 +0200212 struct virtblk_req *vbr = blk_mq_rq_to_pdu(req);
Asias Hea98755c2012-08-08 16:07:04 +0800213
Changpeng Liu1f238162018-11-01 15:40:35 -0700214 if (req->rq_flags & RQF_SPECIAL_PAYLOAD) {
215 kfree(page_address(req->special_vec.bv_page) +
216 req->special_vec.bv_offset);
217 }
218
Christoph Hellwigaebf5262017-01-31 16:57:31 +0100219 switch (req_op(req)) {
220 case REQ_OP_SCSI_IN:
221 case REQ_OP_SCSI_OUT:
Christoph Hellwiga1a6e62b2017-04-20 16:02:59 +0200222 virtblk_scsi_request_done(req);
Christoph Hellwig97b50a62017-01-28 09:32:53 +0100223 break;
Asias Hea98755c2012-08-08 16:07:04 +0800224 }
225
Christoph Hellwigd19633d2017-04-20 16:03:00 +0200226 blk_mq_end_request(req, virtblk_result(vbr));
Asias Hea98755c2012-08-08 16:07:04 +0800227}
228
229static void virtblk_done(struct virtqueue *vq)
Rusty Russelle467cde2007-10-22 11:03:38 +1000230{
231 struct virtio_blk *vblk = vq->vdev->priv;
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600232 bool req_done = false;
Ming Lei6a27b652014-06-26 17:41:48 +0800233 int qid = vq->index;
Rusty Russelle467cde2007-10-22 11:03:38 +1000234 struct virtblk_req *vbr;
Rusty Russelle467cde2007-10-22 11:03:38 +1000235 unsigned long flags;
Asias Hea98755c2012-08-08 16:07:04 +0800236 unsigned int len;
Rusty Russelle467cde2007-10-22 11:03:38 +1000237
Ming Lei6a27b652014-06-26 17:41:48 +0800238 spin_lock_irqsave(&vblk->vqs[qid].lock, flags);
Asias Hebb811102012-09-25 10:36:17 +0800239 do {
240 virtqueue_disable_cb(vq);
Ming Lei6a27b652014-06-26 17:41:48 +0800241 while ((vbr = virtqueue_get_buf(vblk->vqs[qid].vq, &len)) != NULL) {
Christoph Hellwig85dada02017-01-28 09:32:52 +0100242 struct request *req = blk_mq_rq_from_pdu(vbr);
243
Christoph Hellwig08e00292017-04-20 16:03:09 +0200244 blk_mq_complete_request(req);
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600245 req_done = true;
Rusty Russelle467cde2007-10-22 11:03:38 +1000246 }
Heinz Graalfs7f03b172013-10-29 09:40:30 +1030247 if (unlikely(virtqueue_is_broken(vq)))
248 break;
Asias Hebb811102012-09-25 10:36:17 +0800249 } while (!virtqueue_enable_cb(vq));
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600250
Rusty Russelle467cde2007-10-22 11:03:38 +1000251 /* In case queue is stopped waiting for more buffers. */
Asias Hea98755c2012-08-08 16:07:04 +0800252 if (req_done)
Christoph Hellwig1b4a3252014-04-16 09:44:54 +0200253 blk_mq_start_stopped_hw_queues(vblk->disk->queue, true);
Ming Lei6a27b652014-06-26 17:41:48 +0800254 spin_unlock_irqrestore(&vblk->vqs[qid].lock, flags);
Asias Hea98755c2012-08-08 16:07:04 +0800255}
256
Jens Axboe944e7c82018-11-26 11:00:12 -0700257static void virtio_commit_rqs(struct blk_mq_hw_ctx *hctx)
258{
259 struct virtio_blk *vblk = hctx->queue->queuedata;
260 struct virtio_blk_vq *vq = &vblk->vqs[hctx->queue_num];
261 bool kick;
262
263 spin_lock_irq(&vq->lock);
264 kick = virtqueue_kick_prepare(vq->vq);
265 spin_unlock_irq(&vq->lock);
266
267 if (kick)
268 virtqueue_notify(vq->vq);
269}
270
Christoph Hellwigfc17b652017-06-03 09:38:05 +0200271static blk_status_t virtio_queue_rq(struct blk_mq_hw_ctx *hctx,
Jens Axboe74c45052014-10-29 11:14:52 -0600272 const struct blk_mq_queue_data *bd)
Rusty Russelle467cde2007-10-22 11:03:38 +1000273{
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600274 struct virtio_blk *vblk = hctx->queue->queuedata;
Jens Axboe74c45052014-10-29 11:14:52 -0600275 struct request *req = bd->rq;
Christoph Hellwig9d74e252014-04-14 10:30:07 +0200276 struct virtblk_req *vbr = blk_mq_rq_to_pdu(req);
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600277 unsigned long flags;
Paolo Bonzini20af3cf2013-03-20 15:44:27 +1030278 unsigned int num;
Ming Lei6a27b652014-06-26 17:41:48 +0800279 int qid = hctx->queue_num;
Rusty Russell5261b852014-03-13 11:23:39 +1030280 int err;
Ming Leie8edca62014-05-30 10:49:29 +0800281 bool notify = false;
Changpeng Liu1f238162018-11-01 15:40:35 -0700282 bool unmap = false;
Christoph Hellwigaebf5262017-01-31 16:57:31 +0100283 u32 type;
Rusty Russelle467cde2007-10-22 11:03:38 +1000284
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600285 BUG_ON(req->nr_phys_segments + 2 > vblk->sg_elems);
Rusty Russelle467cde2007-10-22 11:03:38 +1000286
Christoph Hellwigaebf5262017-01-31 16:57:31 +0100287 switch (req_op(req)) {
288 case REQ_OP_READ:
289 case REQ_OP_WRITE:
290 type = 0;
291 break;
292 case REQ_OP_FLUSH:
293 type = VIRTIO_BLK_T_FLUSH;
294 break;
Changpeng Liu1f238162018-11-01 15:40:35 -0700295 case REQ_OP_DISCARD:
296 type = VIRTIO_BLK_T_DISCARD;
297 break;
298 case REQ_OP_WRITE_ZEROES:
299 type = VIRTIO_BLK_T_WRITE_ZEROES;
300 unmap = !(req->cmd_flags & REQ_NOUNMAP);
301 break;
Christoph Hellwigaebf5262017-01-31 16:57:31 +0100302 case REQ_OP_SCSI_IN:
303 case REQ_OP_SCSI_OUT:
304 type = VIRTIO_BLK_T_SCSI_CMD;
305 break;
306 case REQ_OP_DRV_IN:
307 type = VIRTIO_BLK_T_GET_ID;
308 break;
309 default:
310 WARN_ON_ONCE(1);
Christoph Hellwigfc17b652017-06-03 09:38:05 +0200311 return BLK_STS_IOERR;
Rusty Russelle467cde2007-10-22 11:03:38 +1000312 }
313
Christoph Hellwigaebf5262017-01-31 16:57:31 +0100314 vbr->out_hdr.type = cpu_to_virtio32(vblk->vdev, type);
315 vbr->out_hdr.sector = type ?
316 0 : cpu_to_virtio64(vblk->vdev, blk_rq_pos(req));
317 vbr->out_hdr.ioprio = cpu_to_virtio32(vblk->vdev, req_get_ioprio(req));
318
Christoph Hellwige2490072014-09-13 16:40:09 -0700319 blk_mq_start_request(req);
320
Changpeng Liu1f238162018-11-01 15:40:35 -0700321 if (type == VIRTIO_BLK_T_DISCARD || type == VIRTIO_BLK_T_WRITE_ZEROES) {
322 err = virtblk_setup_discard_write_zeroes(req, unmap);
323 if (err)
324 return BLK_STS_RESOURCE;
325 }
326
Christoph Hellwig85dada02017-01-28 09:32:52 +0100327 num = blk_rq_map_sg(hctx->queue, req, vbr->sg);
Hannes Reinecke1cde26f2009-05-18 14:41:30 +0200328 if (num) {
Christoph Hellwig85dada02017-01-28 09:32:52 +0100329 if (rq_data_dir(req) == WRITE)
Michael S. Tsirkin19c1c5a2014-10-07 16:39:49 +0200330 vbr->out_hdr.type |= cpu_to_virtio32(vblk->vdev, VIRTIO_BLK_T_OUT);
Paolo Bonzini20af3cf2013-03-20 15:44:27 +1030331 else
Michael S. Tsirkin19c1c5a2014-10-07 16:39:49 +0200332 vbr->out_hdr.type |= cpu_to_virtio32(vblk->vdev, VIRTIO_BLK_T_IN);
Rusty Russelle467cde2007-10-22 11:03:38 +1000333 }
334
Ming Lei6a27b652014-06-26 17:41:48 +0800335 spin_lock_irqsave(&vblk->vqs[qid].lock, flags);
Bart Van Assche6e9fe8d2017-08-17 16:23:08 -0700336 if (blk_rq_is_scsi(req))
Christoph Hellwig97b50a62017-01-28 09:32:53 +0100337 err = virtblk_add_req_scsi(vblk->vqs[qid].vq, vbr, vbr->sg, num);
338 else
339 err = virtblk_add_req(vblk->vqs[qid].vq, vbr, vbr->sg, num);
Rusty Russell5261b852014-03-13 11:23:39 +1030340 if (err) {
Ming Lei6a27b652014-06-26 17:41:48 +0800341 virtqueue_kick(vblk->vqs[qid].vq);
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600342 blk_mq_stop_hw_queue(hctx);
Ming Lei6a27b652014-06-26 17:41:48 +0800343 spin_unlock_irqrestore(&vblk->vqs[qid].lock, flags);
Rusty Russell5261b852014-03-13 11:23:39 +1030344 /* Out of mem doesn't actually happen, since we fall back
345 * to direct descriptors */
346 if (err == -ENOMEM || err == -ENOSPC)
Ming Lei86ff7c22018-01-30 22:04:57 -0500347 return BLK_STS_DEV_RESOURCE;
Christoph Hellwigfc17b652017-06-03 09:38:05 +0200348 return BLK_STS_IOERR;
Asias Hea98755c2012-08-08 16:07:04 +0800349 }
350
Jens Axboe74c45052014-10-29 11:14:52 -0600351 if (bd->last && virtqueue_kick_prepare(vblk->vqs[qid].vq))
Ming Leie8edca62014-05-30 10:49:29 +0800352 notify = true;
Ming Lei6a27b652014-06-26 17:41:48 +0800353 spin_unlock_irqrestore(&vblk->vqs[qid].lock, flags);
Ming Leie8edca62014-05-30 10:49:29 +0800354
355 if (notify)
Ming Lei6a27b652014-06-26 17:41:48 +0800356 virtqueue_notify(vblk->vqs[qid].vq);
Christoph Hellwigfc17b652017-06-03 09:38:05 +0200357 return BLK_STS_OK;
Asias Hea98755c2012-08-08 16:07:04 +0800358}
359
john cooper4cb2ea22010-03-25 01:33:33 -0400360/* return id (s/n) string for *disk to *id_str
361 */
362static int virtblk_get_id(struct gendisk *disk, char *id_str)
363{
364 struct virtio_blk *vblk = disk->private_data;
Christoph Hellwigf9596692016-07-19 11:31:49 +0200365 struct request_queue *q = vblk->disk->queue;
john cooper4cb2ea22010-03-25 01:33:33 -0400366 struct request *req;
Mike Snitzere4c47762010-10-09 12:12:13 +1030367 int err;
john cooper4cb2ea22010-03-25 01:33:33 -0400368
Christoph Hellwigff005a02018-05-09 09:54:05 +0200369 req = blk_get_request(q, REQ_OP_DRV_IN, 0);
Christoph Hellwigf9596692016-07-19 11:31:49 +0200370 if (IS_ERR(req))
john cooper4cb2ea22010-03-25 01:33:33 -0400371 return PTR_ERR(req);
Mike Snitzere4c47762010-10-09 12:12:13 +1030372
Christoph Hellwigf9596692016-07-19 11:31:49 +0200373 err = blk_rq_map_kern(q, req, id_str, VIRTIO_BLK_ID_BYTES, GFP_KERNEL);
374 if (err)
375 goto out;
376
Christoph Hellwigb7819b92017-04-20 16:02:55 +0200377 blk_execute_rq(vblk->disk->queue, vblk->disk, req, false);
Christoph Hellwig2a842ac2017-06-03 09:38:04 +0200378 err = blk_status_to_errno(virtblk_result(blk_mq_rq_to_pdu(req)));
Christoph Hellwigf9596692016-07-19 11:31:49 +0200379out:
380 blk_put_request(req);
Mike Snitzere4c47762010-10-09 12:12:13 +1030381 return err;
john cooper4cb2ea22010-03-25 01:33:33 -0400382}
383
Christian Borntraeger135da0b2008-01-23 17:56:50 +0100384/* We provide getgeo only to please some old bootloader/partitioning tools */
385static int virtblk_getgeo(struct block_device *bd, struct hd_geometry *geo)
386{
Ryan Harper48e40432008-04-16 13:56:37 -0500387 struct virtio_blk *vblk = bd->bd_disk->private_data;
Ryan Harper48e40432008-04-16 13:56:37 -0500388
389 /* see if the host passed in geometry config */
Rusty Russell855e0c52013-10-14 18:11:51 +1030390 if (virtio_has_feature(vblk->vdev, VIRTIO_BLK_F_GEOMETRY)) {
391 virtio_cread(vblk->vdev, struct virtio_blk_config,
392 geometry.cylinders, &geo->cylinders);
393 virtio_cread(vblk->vdev, struct virtio_blk_config,
394 geometry.heads, &geo->heads);
395 virtio_cread(vblk->vdev, struct virtio_blk_config,
396 geometry.sectors, &geo->sectors);
Ryan Harper48e40432008-04-16 13:56:37 -0500397 } else {
398 /* some standard values, similar to sd */
399 geo->heads = 1 << 6;
400 geo->sectors = 1 << 5;
401 geo->cylinders = get_capacity(bd->bd_disk) >> 11;
402 }
Christian Borntraeger135da0b2008-01-23 17:56:50 +0100403 return 0;
404}
405
Alexey Dobriyan83d5cde2009-09-21 17:01:13 -0700406static const struct block_device_operations virtblk_fops = {
Arnd Bergmann8a6cfeb2010-07-08 10:18:46 +0200407 .ioctl = virtblk_ioctl,
Christian Borntraeger135da0b2008-01-23 17:56:50 +0100408 .owner = THIS_MODULE,
409 .getgeo = virtblk_getgeo,
Rusty Russelle467cde2007-10-22 11:03:38 +1000410};
411
Christian Borntraegerd50ed902008-02-01 09:05:00 +0100412static int index_to_minor(int index)
413{
414 return index << PART_BITS;
415}
416
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200417static int minor_to_index(int minor)
418{
419 return minor >> PART_BITS;
420}
421
Hannes Reineckee982c4d2018-09-28 08:17:23 +0200422static ssize_t serial_show(struct device *dev,
423 struct device_attribute *attr, char *buf)
Ryan Harpera5eb9e42010-06-23 22:19:57 -0500424{
425 struct gendisk *disk = dev_to_disk(dev);
426 int err;
427
428 /* sysfs gives us a PAGE_SIZE buffer */
429 BUILD_BUG_ON(PAGE_SIZE < VIRTIO_BLK_ID_BYTES);
430
431 buf[VIRTIO_BLK_ID_BYTES] = '\0';
432 err = virtblk_get_id(disk, buf);
433 if (!err)
434 return strlen(buf);
435
436 if (err == -EIO) /* Unsupported? Make it empty. */
437 return 0;
438
439 return err;
440}
Michael S. Tsirkin393c5252014-10-23 16:08:44 +0300441
Hannes Reineckee982c4d2018-09-28 08:17:23 +0200442static DEVICE_ATTR_RO(serial);
Ryan Harpera5eb9e42010-06-23 22:19:57 -0500443
Stefan Hajnoczidaf2a502018-01-03 16:03:39 +0000444/* The queue's logical block size must be set before calling this */
445static void virtblk_update_capacity(struct virtio_blk *vblk, bool resize)
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100446{
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100447 struct virtio_device *vdev = vblk->vdev;
448 struct request_queue *q = vblk->disk->queue;
449 char cap_str_2[10], cap_str_10[10];
Stefan Hajnoczi1046d302017-07-26 15:32:23 +0100450 unsigned long long nblocks;
James Bottomleyb9f28d82015-03-05 18:47:01 -0800451 u64 capacity;
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100452
453 /* Host must always specify the capacity. */
Rusty Russell855e0c52013-10-14 18:11:51 +1030454 virtio_cread(vdev, struct virtio_blk_config, capacity, &capacity);
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100455
456 /* If capacity is too big, truncate with warning. */
457 if ((sector_t)capacity != capacity) {
458 dev_warn(&vdev->dev, "Capacity %llu too large: truncating\n",
459 (unsigned long long)capacity);
460 capacity = (sector_t)-1;
461 }
462
Stefan Hajnoczi1046d302017-07-26 15:32:23 +0100463 nblocks = DIV_ROUND_UP_ULL(capacity, queue_logical_block_size(q) >> 9);
464
465 string_get_size(nblocks, queue_logical_block_size(q),
James Bottomleyb9f28d82015-03-05 18:47:01 -0800466 STRING_UNITS_2, cap_str_2, sizeof(cap_str_2));
Stefan Hajnoczi1046d302017-07-26 15:32:23 +0100467 string_get_size(nblocks, queue_logical_block_size(q),
James Bottomleyb9f28d82015-03-05 18:47:01 -0800468 STRING_UNITS_10, cap_str_10, sizeof(cap_str_10));
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100469
470 dev_notice(&vdev->dev,
Stefan Hajnoczidaf2a502018-01-03 16:03:39 +0000471 "[%s] %s%llu %d-byte logical blocks (%s/%s)\n",
472 vblk->disk->disk_name,
473 resize ? "new size: " : "",
Stefan Hajnoczi1046d302017-07-26 15:32:23 +0100474 nblocks,
475 queue_logical_block_size(q),
476 cap_str_10,
477 cap_str_2);
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100478
479 set_capacity(vblk->disk, capacity);
Stefan Hajnoczidaf2a502018-01-03 16:03:39 +0000480}
481
482static void virtblk_config_changed_work(struct work_struct *work)
483{
484 struct virtio_blk *vblk =
485 container_of(work, struct virtio_blk, config_work);
486 char *envp[] = { "RESIZE=1", NULL };
487
488 virtblk_update_capacity(vblk, true);
Vivek Goyale9986f32012-03-29 10:09:44 +0200489 revalidate_disk(vblk->disk);
Milos Vyletel9d9598b2013-03-12 15:34:40 +1030490 kobject_uevent_env(&disk_to_dev(vblk->disk)->kobj, KOBJ_CHANGE, envp);
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100491}
492
493static void virtblk_config_changed(struct virtio_device *vdev)
494{
495 struct virtio_blk *vblk = vdev->priv;
496
497 queue_work(virtblk_wq, &vblk->config_work);
498}
499
Amit Shah6abd6e52011-12-22 16:58:29 +0530500static int init_vq(struct virtio_blk *vblk)
501{
Markus Elfring2ff98442016-09-13 13:43:50 +0200502 int err;
Ming Lei6a27b652014-06-26 17:41:48 +0800503 int i;
504 vq_callback_t **callbacks;
505 const char **names;
506 struct virtqueue **vqs;
507 unsigned short num_vqs;
508 struct virtio_device *vdev = vblk->vdev;
Christoph Hellwigad714732017-02-05 18:15:25 +0100509 struct irq_affinity desc = { 0, };
Amit Shah6abd6e52011-12-22 16:58:29 +0530510
Ming Lei6a27b652014-06-26 17:41:48 +0800511 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_MQ,
512 struct virtio_blk_config, num_queues,
513 &num_vqs);
514 if (err)
515 num_vqs = 1;
Amit Shah6abd6e52011-12-22 16:58:29 +0530516
Dongli Zhangbf348f92019-03-27 18:36:34 +0800517 num_vqs = min_t(unsigned int, nr_cpu_ids, num_vqs);
518
Markus Elfring668866b2016-09-13 11:32:22 +0200519 vblk->vqs = kmalloc_array(num_vqs, sizeof(*vblk->vqs), GFP_KERNEL);
Minfei Huang347a5292016-08-09 16:39:20 +0800520 if (!vblk->vqs)
521 return -ENOMEM;
522
Markus Elfring668866b2016-09-13 11:32:22 +0200523 names = kmalloc_array(num_vqs, sizeof(*names), GFP_KERNEL);
524 callbacks = kmalloc_array(num_vqs, sizeof(*callbacks), GFP_KERNEL);
525 vqs = kmalloc_array(num_vqs, sizeof(*vqs), GFP_KERNEL);
Minfei Huang347a5292016-08-09 16:39:20 +0800526 if (!names || !callbacks || !vqs) {
Ming Lei6a27b652014-06-26 17:41:48 +0800527 err = -ENOMEM;
528 goto out;
529 }
530
Ming Lei6a27b652014-06-26 17:41:48 +0800531 for (i = 0; i < num_vqs; i++) {
532 callbacks[i] = virtblk_done;
533 snprintf(vblk->vqs[i].name, VQ_NAME_LEN, "req.%d", i);
534 names[i] = vblk->vqs[i].name;
535 }
536
537 /* Discover virtqueues and write information to configuration. */
Michael S. Tsirkin9b2bbdb2017-03-06 18:19:39 +0200538 err = virtio_find_vqs(vdev, num_vqs, vqs, callbacks, names, &desc);
Ming Lei6a27b652014-06-26 17:41:48 +0800539 if (err)
Minfei Huang347a5292016-08-09 16:39:20 +0800540 goto out;
Ming Lei6a27b652014-06-26 17:41:48 +0800541
542 for (i = 0; i < num_vqs; i++) {
543 spin_lock_init(&vblk->vqs[i].lock);
544 vblk->vqs[i].vq = vqs[i];
545 }
546 vblk->num_vqs = num_vqs;
547
Minfei Huang347a5292016-08-09 16:39:20 +0800548out:
Ming Lei6a27b652014-06-26 17:41:48 +0800549 kfree(vqs);
Ming Lei6a27b652014-06-26 17:41:48 +0800550 kfree(callbacks);
Ming Lei6a27b652014-06-26 17:41:48 +0800551 kfree(names);
Ming Lei6a27b652014-06-26 17:41:48 +0800552 if (err)
553 kfree(vblk->vqs);
Amit Shah6abd6e52011-12-22 16:58:29 +0530554 return err;
555}
556
/*
 * Legacy naming scheme used for virtio devices.  We are stuck with it for
 * virtio blk but don't ever use it for any new driver.
 *
 * Writes @prefix followed by a letter suffix for @index into @buf:
 * 0 -> "a", 25 -> "z", 26 -> "aa", 27 -> "ab", and so on.  The suffix is
 * generated right-to-left at the end of @buf and then moved up behind the
 * prefix.
 *
 * Returns 0 on success or -EINVAL if @buflen is too small.
 */
static int virtblk_name_format(char *prefix, int index, char *buf, int buflen)
{
	const int radix = 'z' - 'a' + 1;
	const size_t prefix_len = strlen(prefix);
	char *const suffix_start = buf + prefix_len;
	char *const limit = buf + buflen;
	char *cur = limit - 1;

	*cur = '\0';
	for (;;) {
		/* No room left between the prefix and the digits so far. */
		if (cur == suffix_start)
			return -EINVAL;

		cur--;
		*cur = 'a' + (index % radix);
		index = index / radix - 1;
		if (index < 0)
			break;
	}

	/* Slide the suffix (including its NUL) up against the prefix. */
	memmove(suffix_start, cur, limit - cur);
	memcpy(buf, prefix, prefix_len);

	return 0;
}
584
Paolo Bonzinicd5d5032012-07-03 15:19:37 +0200585static int virtblk_get_cache_mode(struct virtio_device *vdev)
586{
587 u8 writeback;
588 int err;
589
Rusty Russell855e0c52013-10-14 18:11:51 +1030590 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_CONFIG_WCE,
591 struct virtio_blk_config, wce,
592 &writeback);
Michael S. Tsirkin592002f2016-02-24 17:07:27 +0200593
594 /*
595 * If WCE is not configurable and flush is not available,
596 * assume no writeback cache is in use.
597 */
Paolo Bonzinicd5d5032012-07-03 15:19:37 +0200598 if (err)
Michael S. Tsirkin592002f2016-02-24 17:07:27 +0200599 writeback = virtio_has_feature(vdev, VIRTIO_BLK_F_FLUSH);
Paolo Bonzinicd5d5032012-07-03 15:19:37 +0200600
601 return writeback;
602}
603
604static void virtblk_update_cache_mode(struct virtio_device *vdev)
605{
606 u8 writeback = virtblk_get_cache_mode(vdev);
607 struct virtio_blk *vblk = vdev->priv;
608
Jens Axboead9126a2016-03-30 10:12:58 -0600609 blk_queue_write_cache(vblk->disk->queue, writeback, false);
Paolo Bonzinicd5d5032012-07-03 15:19:37 +0200610 revalidate_disk(vblk->disk);
611}
612
/*
 * Names accepted and shown by the cache_type sysfs attribute, indexed by
 * the value returned from virtblk_get_cache_mode().
 */
static const char *const virtblk_cache_types[] = {
	"write through",
	"write back",
};
616
617static ssize_t
Hannes Reineckee982c4d2018-09-28 08:17:23 +0200618cache_type_store(struct device *dev, struct device_attribute *attr,
619 const char *buf, size_t count)
Paolo Bonzinicd5d5032012-07-03 15:19:37 +0200620{
621 struct gendisk *disk = dev_to_disk(dev);
622 struct virtio_blk *vblk = disk->private_data;
623 struct virtio_device *vdev = vblk->vdev;
624 int i;
Paolo Bonzinicd5d5032012-07-03 15:19:37 +0200625
626 BUG_ON(!virtio_has_feature(vblk->vdev, VIRTIO_BLK_F_CONFIG_WCE));
Andy Shevchenkof53d5aa2017-06-09 15:07:42 +0300627 i = sysfs_match_string(virtblk_cache_types, buf);
Paolo Bonzinicd5d5032012-07-03 15:19:37 +0200628 if (i < 0)
Andy Shevchenkof53d5aa2017-06-09 15:07:42 +0300629 return i;
Paolo Bonzinicd5d5032012-07-03 15:19:37 +0200630
Rusty Russell855e0c52013-10-14 18:11:51 +1030631 virtio_cwrite8(vdev, offsetof(struct virtio_blk_config, wce), i);
Paolo Bonzinicd5d5032012-07-03 15:19:37 +0200632 virtblk_update_cache_mode(vdev);
633 return count;
634}
635
636static ssize_t
Hannes Reineckee982c4d2018-09-28 08:17:23 +0200637cache_type_show(struct device *dev, struct device_attribute *attr, char *buf)
Paolo Bonzinicd5d5032012-07-03 15:19:37 +0200638{
639 struct gendisk *disk = dev_to_disk(dev);
640 struct virtio_blk *vblk = disk->private_data;
641 u8 writeback = virtblk_get_cache_mode(vblk->vdev);
642
643 BUG_ON(writeback >= ARRAY_SIZE(virtblk_cache_types));
644 return snprintf(buf, 40, "%s\n", virtblk_cache_types[writeback]);
645}
646
Hannes Reineckee982c4d2018-09-28 08:17:23 +0200647static DEVICE_ATTR_RW(cache_type);
648
649static struct attribute *virtblk_attrs[] = {
650 &dev_attr_serial.attr,
651 &dev_attr_cache_type.attr,
652 NULL,
653};
654
655static umode_t virtblk_attrs_are_visible(struct kobject *kobj,
656 struct attribute *a, int n)
657{
658 struct device *dev = container_of(kobj, struct device, kobj);
659 struct gendisk *disk = dev_to_disk(dev);
660 struct virtio_blk *vblk = disk->private_data;
661 struct virtio_device *vdev = vblk->vdev;
662
663 if (a == &dev_attr_cache_type.attr &&
664 !virtio_has_feature(vdev, VIRTIO_BLK_F_CONFIG_WCE))
665 return S_IRUGO;
666
667 return a->mode;
668}
669
670static const struct attribute_group virtblk_attr_group = {
671 .attrs = virtblk_attrs,
672 .is_visible = virtblk_attrs_are_visible,
673};
674
675static const struct attribute_group *virtblk_attr_groups[] = {
676 &virtblk_attr_group,
677 NULL,
678};
Paolo Bonzinicd5d5032012-07-03 15:19:37 +0200679
Christoph Hellwigd6296d392017-05-01 10:19:08 -0600680static int virtblk_init_request(struct blk_mq_tag_set *set, struct request *rq,
681 unsigned int hctx_idx, unsigned int numa_node)
Christoph Hellwige9b267d2014-04-15 13:59:10 -0600682{
Christoph Hellwigd6296d392017-05-01 10:19:08 -0600683 struct virtio_blk *vblk = set->driver_data;
Christoph Hellwige9b267d2014-04-15 13:59:10 -0600684 struct virtblk_req *vbr = blk_mq_rq_to_pdu(rq);
685
Christoph Hellwig97b50a62017-01-28 09:32:53 +0100686#ifdef CONFIG_VIRTIO_BLK_SCSI
Christoph Hellwig82ed4db2017-01-27 09:46:29 +0100687 vbr->sreq.sense = vbr->sense;
Christoph Hellwig97b50a62017-01-28 09:32:53 +0100688#endif
Christoph Hellwige9b267d2014-04-15 13:59:10 -0600689 sg_init_table(vbr->sg, vblk->sg_elems);
690 return 0;
691}
692
Christoph Hellwigad714732017-02-05 18:15:25 +0100693static int virtblk_map_queues(struct blk_mq_tag_set *set)
694{
695 struct virtio_blk *vblk = set->driver_data;
696
Dongli Zhang9bc00752019-03-12 09:31:56 +0800697 return blk_mq_virtio_map_queues(&set->map[HCTX_TYPE_DEFAULT],
698 vblk->vdev, 0);
Christoph Hellwigad714732017-02-05 18:15:25 +0100699}
700
#ifdef CONFIG_VIRTIO_BLK_SCSI
/*
 * blk-mq .initialize_rq_fn hook (SCSI passthrough builds only): initialize
 * the SCSI request embedded in the driver-private area of @req.
 */
static void virtblk_initialize_rq(struct request *req)
{
	struct virtblk_req *pdu = blk_mq_rq_to_pdu(req);

	scsi_req_init(&pdu->sreq);
}
#endif
709
Eric Biggersf363b082017-03-30 13:39:16 -0700710static const struct blk_mq_ops virtio_mq_ops = {
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600711 .queue_rq = virtio_queue_rq,
Jens Axboe944e7c82018-11-26 11:00:12 -0700712 .commit_rqs = virtio_commit_rqs,
Christoph Hellwig5124c282014-02-10 03:24:39 -0800713 .complete = virtblk_request_done,
Christoph Hellwig24d2f902014-04-15 14:14:00 -0600714 .init_request = virtblk_init_request,
Bart Van Asscheefea2ab2017-10-27 08:23:21 -0600715#ifdef CONFIG_VIRTIO_BLK_SCSI
716 .initialize_rq_fn = virtblk_initialize_rq,
717#endif
Christoph Hellwigad714732017-02-05 18:15:25 +0100718 .map_queues = virtblk_map_queues,
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600719};
720
Christoph Hellwig24d2f902014-04-15 14:14:00 -0600721static unsigned int virtblk_queue_depth;
722module_param_named(queue_depth, virtblk_queue_depth, uint, 0444);
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600723
Greg Kroah-Hartman8d85fce2012-12-21 15:13:49 -0800724static int virtblk_probe(struct virtio_device *vdev)
Rusty Russelle467cde2007-10-22 11:03:38 +1000725{
726 struct virtio_blk *vblk;
Christoph Hellwig69740c82010-02-24 14:22:25 -0600727 struct request_queue *q;
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200728 int err, index;
Asias Hea98755c2012-08-08 16:07:04 +0800729
Joerg Roedelfd1068e2019-02-07 12:59:17 +0100730 u32 v, blk_size, max_size, sg_elems, opt_io_size;
Christoph Hellwig69740c82010-02-24 14:22:25 -0600731 u16 min_io_size;
732 u8 physical_block_exp, alignment_offset;
Rusty Russelle467cde2007-10-22 11:03:38 +1000733
Michael S. Tsirkina4379fd2015-01-12 16:23:37 +0200734 if (!vdev->config->get) {
735 dev_err(&vdev->dev, "%s failure: config access disabled\n",
736 __func__);
737 return -EINVAL;
738 }
739
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200740 err = ida_simple_get(&vd_index_ida, 0, minor_to_index(1 << MINORBITS),
741 GFP_KERNEL);
742 if (err < 0)
743 goto out;
744 index = err;
Christian Borntraeger4f3bf192008-01-31 15:53:53 +0100745
Rusty Russell0864b792008-12-30 09:26:05 -0600746 /* We need to know how many segments before we allocate. */
Rusty Russell855e0c52013-10-14 18:11:51 +1030747 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_SEG_MAX,
748 struct virtio_blk_config, seg_max,
749 &sg_elems);
Christoph Hellwiga5b365a2010-05-25 14:17:54 +0200750
751 /* We need at least one SG element, whatever they say. */
752 if (err || !sg_elems)
Rusty Russell0864b792008-12-30 09:26:05 -0600753 sg_elems = 1;
754
755 /* We need an extra sg elements at head and tail. */
756 sg_elems += 2;
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600757 vdev->priv = vblk = kmalloc(sizeof(*vblk), GFP_KERNEL);
Rusty Russelle467cde2007-10-22 11:03:38 +1000758 if (!vblk) {
759 err = -ENOMEM;
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200760 goto out_free_index;
Rusty Russelle467cde2007-10-22 11:03:38 +1000761 }
762
Rusty Russelle467cde2007-10-22 11:03:38 +1000763 vblk->vdev = vdev;
Rusty Russell0864b792008-12-30 09:26:05 -0600764 vblk->sg_elems = sg_elems;
Asias Hea98755c2012-08-08 16:07:04 +0800765
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100766 INIT_WORK(&vblk->config_work, virtblk_config_changed_work);
Rusty Russelle467cde2007-10-22 11:03:38 +1000767
Amit Shah6abd6e52011-12-22 16:58:29 +0530768 err = init_vq(vblk);
769 if (err)
Rusty Russelle467cde2007-10-22 11:03:38 +1000770 goto out_free_vblk;
Rusty Russelle467cde2007-10-22 11:03:38 +1000771
Rusty Russelle467cde2007-10-22 11:03:38 +1000772 /* FIXME: How many partitions? How long is a piece of string? */
Christian Borntraeger4f3bf192008-01-31 15:53:53 +0100773 vblk->disk = alloc_disk(1 << PART_BITS);
Rusty Russelle467cde2007-10-22 11:03:38 +1000774 if (!vblk->disk) {
775 err = -ENOMEM;
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600776 goto out_free_vq;
Rusty Russelle467cde2007-10-22 11:03:38 +1000777 }
778
Rusty Russellfc4324b2014-03-19 17:08:24 +1030779 /* Default queue sizing is to fill the ring. */
Christoph Hellwig24d2f902014-04-15 14:14:00 -0600780 if (!virtblk_queue_depth) {
Ming Lei6a27b652014-06-26 17:41:48 +0800781 virtblk_queue_depth = vblk->vqs[0].vq->num_free;
Rusty Russellfc4324b2014-03-19 17:08:24 +1030782 /* ... but without indirect descs, we use 2 descs per req */
783 if (!virtio_has_feature(vdev, VIRTIO_RING_F_INDIRECT_DESC))
Christoph Hellwig24d2f902014-04-15 14:14:00 -0600784 virtblk_queue_depth /= 2;
Rusty Russellfc4324b2014-03-19 17:08:24 +1030785 }
Christoph Hellwig24d2f902014-04-15 14:14:00 -0600786
787 memset(&vblk->tag_set, 0, sizeof(vblk->tag_set));
788 vblk->tag_set.ops = &virtio_mq_ops;
Christoph Hellwig24d2f902014-04-15 14:14:00 -0600789 vblk->tag_set.queue_depth = virtblk_queue_depth;
790 vblk->tag_set.numa_node = NUMA_NO_NODE;
791 vblk->tag_set.flags = BLK_MQ_F_SHOULD_MERGE;
792 vblk->tag_set.cmd_size =
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600793 sizeof(struct virtblk_req) +
794 sizeof(struct scatterlist) * sg_elems;
Christoph Hellwig24d2f902014-04-15 14:14:00 -0600795 vblk->tag_set.driver_data = vblk;
Ming Lei6a27b652014-06-26 17:41:48 +0800796 vblk->tag_set.nr_hw_queues = vblk->num_vqs;
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600797
Christoph Hellwig24d2f902014-04-15 14:14:00 -0600798 err = blk_mq_alloc_tag_set(&vblk->tag_set);
799 if (err)
800 goto out_put_disk;
801
Omar Sandoval6bf6b0a2017-01-09 11:44:12 -0800802 q = blk_mq_init_queue(&vblk->tag_set);
Ming Lei35b489d2015-01-02 14:25:27 +0000803 if (IS_ERR(q)) {
Rusty Russelle467cde2007-10-22 11:03:38 +1000804 err = -ENOMEM;
Christoph Hellwig24d2f902014-04-15 14:14:00 -0600805 goto out_free_tags;
Rusty Russelle467cde2007-10-22 11:03:38 +1000806 }
Omar Sandoval6bf6b0a2017-01-09 11:44:12 -0800807 vblk->disk->queue = q;
Rusty Russelle467cde2007-10-22 11:03:38 +1000808
Christoph Hellwig69740c82010-02-24 14:22:25 -0600809 q->queuedata = vblk;
Fernando Luis Vázquez Cao7d116b62008-10-27 18:45:15 +0900810
Ren Mingxinc0aa3e02012-04-10 15:28:05 +0800811 virtblk_name_format("vd", index, vblk->disk->disk_name, DISK_NAME_LEN);
Christian Borntraegerd50ed902008-02-01 09:05:00 +0100812
Rusty Russelle467cde2007-10-22 11:03:38 +1000813 vblk->disk->major = major;
Christian Borntraegerd50ed902008-02-01 09:05:00 +0100814 vblk->disk->first_minor = index_to_minor(index);
Rusty Russelle467cde2007-10-22 11:03:38 +1000815 vblk->disk->private_data = vblk;
816 vblk->disk->fops = &virtblk_fops;
Fam Zheng5fa31422015-09-06 17:05:42 +0800817 vblk->disk->flags |= GENHD_FL_EXT_DEVT;
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200818 vblk->index = index;
Christian Borntraeger4f3bf192008-01-31 15:53:53 +0100819
Tejun Heo02c42b72010-09-03 11:56:18 +0200820 /* configure queue flush support */
Paolo Bonzinicd5d5032012-07-03 15:19:37 +0200821 virtblk_update_cache_mode(vdev);
Rusty Russelle467cde2007-10-22 11:03:38 +1000822
Christian Borntraeger3ef53602008-05-16 11:17:03 +0200823 /* If disk is read-only in the host, the guest should obey */
824 if (virtio_has_feature(vdev, VIRTIO_BLK_F_RO))
825 set_disk_ro(vblk->disk, 1);
826
Rusty Russell0864b792008-12-30 09:26:05 -0600827 /* We can handle whatever the host told us to handle. */
Martin K. Petersenee714f22010-03-10 00:48:32 -0500828 blk_queue_max_segments(q, vblk->sg_elems-2);
Rusty Russell0864b792008-12-30 09:26:05 -0600829
Rusty Russell4b7f7e22008-12-30 09:26:04 -0600830 /* No real sector limit. */
Martin K. Petersenee714f22010-03-10 00:48:32 -0500831 blk_queue_max_hw_sectors(q, -1U);
Rusty Russell4b7f7e22008-12-30 09:26:04 -0600832
Joerg Roedelfd1068e2019-02-07 12:59:17 +0100833 max_size = virtio_max_dma_size(vdev);
834
Rusty Russella586d4f2008-02-04 23:49:56 -0500835 /* Host can optionally specify maximum segment size and number of
836 * segments. */
Rusty Russell855e0c52013-10-14 18:11:51 +1030837 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_SIZE_MAX,
838 struct virtio_blk_config, size_max, &v);
Rusty Russelle467cde2007-10-22 11:03:38 +1000839 if (!err)
Joerg Roedelfd1068e2019-02-07 12:59:17 +0100840 max_size = min(max_size, v);
841
842 blk_queue_max_segment_size(q, max_size);
Rusty Russelle467cde2007-10-22 11:03:38 +1000843
Christian Borntraeger066f4d82008-05-29 11:08:26 +0200844 /* Host can optionally specify the block size of the device */
Rusty Russell855e0c52013-10-14 18:11:51 +1030845 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_BLK_SIZE,
846 struct virtio_blk_config, blk_size,
847 &blk_size);
Christian Borntraeger066f4d82008-05-29 11:08:26 +0200848 if (!err)
Christoph Hellwig69740c82010-02-24 14:22:25 -0600849 blk_queue_logical_block_size(q, blk_size);
850 else
851 blk_size = queue_logical_block_size(q);
852
853 /* Use topology information if available */
Rusty Russell855e0c52013-10-14 18:11:51 +1030854 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_TOPOLOGY,
855 struct virtio_blk_config, physical_block_exp,
856 &physical_block_exp);
Christoph Hellwig69740c82010-02-24 14:22:25 -0600857 if (!err && physical_block_exp)
858 blk_queue_physical_block_size(q,
859 blk_size * (1 << physical_block_exp));
860
Rusty Russell855e0c52013-10-14 18:11:51 +1030861 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_TOPOLOGY,
862 struct virtio_blk_config, alignment_offset,
863 &alignment_offset);
Christoph Hellwig69740c82010-02-24 14:22:25 -0600864 if (!err && alignment_offset)
865 blk_queue_alignment_offset(q, blk_size * alignment_offset);
866
Rusty Russell855e0c52013-10-14 18:11:51 +1030867 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_TOPOLOGY,
868 struct virtio_blk_config, min_io_size,
869 &min_io_size);
Christoph Hellwig69740c82010-02-24 14:22:25 -0600870 if (!err && min_io_size)
871 blk_queue_io_min(q, blk_size * min_io_size);
872
Rusty Russell855e0c52013-10-14 18:11:51 +1030873 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_TOPOLOGY,
874 struct virtio_blk_config, opt_io_size,
875 &opt_io_size);
Christoph Hellwig69740c82010-02-24 14:22:25 -0600876 if (!err && opt_io_size)
877 blk_queue_io_opt(q, blk_size * opt_io_size);
878
Changpeng Liu1f238162018-11-01 15:40:35 -0700879 if (virtio_has_feature(vdev, VIRTIO_BLK_F_DISCARD)) {
880 q->limits.discard_granularity = blk_size;
881
882 virtio_cread(vdev, struct virtio_blk_config,
883 discard_sector_alignment, &v);
884 q->limits.discard_alignment = v ? v << SECTOR_SHIFT : 0;
885
886 virtio_cread(vdev, struct virtio_blk_config,
887 max_discard_sectors, &v);
888 blk_queue_max_discard_sectors(q, v ? v : UINT_MAX);
889
890 virtio_cread(vdev, struct virtio_blk_config, max_discard_seg,
891 &v);
892 blk_queue_max_discard_segments(q,
893 min_not_zero(v,
894 MAX_DISCARD_SEGMENTS));
895
896 blk_queue_flag_set(QUEUE_FLAG_DISCARD, q);
897 }
898
899 if (virtio_has_feature(vdev, VIRTIO_BLK_F_WRITE_ZEROES)) {
900 virtio_cread(vdev, struct virtio_blk_config,
901 max_write_zeroes_sectors, &v);
902 blk_queue_max_write_zeroes_sectors(q, v ? v : UINT_MAX);
903 }
904
Stefan Hajnoczidaf2a502018-01-03 16:03:39 +0000905 virtblk_update_capacity(vblk, false);
Michael S. Tsirkin7a113702014-10-15 10:22:30 +1030906 virtio_device_ready(vdev);
907
Hannes Reineckee982c4d2018-09-28 08:17:23 +0200908 device_add_disk(&vdev->dev, vblk->disk, virtblk_attr_groups);
Rusty Russelle467cde2007-10-22 11:03:38 +1000909 return 0;
910
Christoph Hellwig24d2f902014-04-15 14:14:00 -0600911out_free_tags:
912 blk_mq_free_tag_set(&vblk->tag_set);
Rusty Russelle467cde2007-10-22 11:03:38 +1000913out_put_disk:
914 put_disk(vblk->disk);
Rusty Russelle467cde2007-10-22 11:03:38 +1000915out_free_vq:
Michael S. Tsirkind2a7ddd2009-06-12 22:16:36 -0600916 vdev->config->del_vqs(vdev);
Rusty Russelle467cde2007-10-22 11:03:38 +1000917out_free_vblk:
918 kfree(vblk);
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200919out_free_index:
920 ida_simple_remove(&vd_index_ida, index);
Rusty Russelle467cde2007-10-22 11:03:38 +1000921out:
922 return err;
923}
924
Greg Kroah-Hartman8d85fce2012-12-21 15:13:49 -0800925static void virtblk_remove(struct virtio_device *vdev)
Rusty Russelle467cde2007-10-22 11:03:38 +1000926{
927 struct virtio_blk *vblk = vdev->priv;
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200928 int index = vblk->index;
Alexander Graff4953fe2013-01-02 15:37:17 +1030929 int refc;
Rusty Russelle467cde2007-10-22 11:03:38 +1000930
Michael S. Tsirkincc74f712014-10-15 10:22:26 +1030931 /* Make sure no work handler is accessing the device. */
932 flush_work(&vblk->config_work);
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100933
Asias He02e2b122012-05-25 10:34:47 +0800934 del_gendisk(vblk->disk);
Asias He483001c2012-05-25 10:34:48 +0800935 blk_cleanup_queue(vblk->disk->queue);
Asias He02e2b122012-05-25 10:34:47 +0800936
Christoph Hellwig24d2f902014-04-15 14:14:00 -0600937 blk_mq_free_tag_set(&vblk->tag_set);
938
Rusty Russell6e5aa7e2008-02-04 23:50:03 -0500939 /* Stop all the virtqueues. */
940 vdev->config->reset(vdev);
941
Peter Zijlstra2c935bc2016-11-14 17:29:48 +0100942 refc = kref_read(&disk_to_dev(vblk->disk)->kobj.kref);
Rusty Russelle467cde2007-10-22 11:03:38 +1000943 put_disk(vblk->disk);
Michael S. Tsirkind2a7ddd2009-06-12 22:16:36 -0600944 vdev->config->del_vqs(vdev);
Ming Lei6a27b652014-06-26 17:41:48 +0800945 kfree(vblk->vqs);
Rusty Russelle467cde2007-10-22 11:03:38 +1000946 kfree(vblk);
Alexander Graff4953fe2013-01-02 15:37:17 +1030947
948 /* Only free device id if we don't have any users */
949 if (refc == 1)
950 ida_simple_remove(&vd_index_ida, index);
Rusty Russelle467cde2007-10-22 11:03:38 +1000951}
952
Aaron Lu89107002013-09-17 09:25:23 +0930953#ifdef CONFIG_PM_SLEEP
Amit Shahf8fb5bc2011-12-22 16:58:30 +0530954static int virtblk_freeze(struct virtio_device *vdev)
955{
956 struct virtio_blk *vblk = vdev->priv;
957
958 /* Ensure we don't receive any more interrupts */
959 vdev->config->reset(vdev);
960
Michael S. Tsirkincc74f712014-10-15 10:22:26 +1030961 /* Make sure no work handler is accessing the device. */
Amit Shahf8fb5bc2011-12-22 16:58:30 +0530962 flush_work(&vblk->config_work);
963
Sagi Grimberg9b3e9902017-07-04 10:03:03 +0300964 blk_mq_quiesce_queue(vblk->disk->queue);
Amit Shahf8fb5bc2011-12-22 16:58:30 +0530965
966 vdev->config->del_vqs(vdev);
967 return 0;
968}
969
970static int virtblk_restore(struct virtio_device *vdev)
971{
972 struct virtio_blk *vblk = vdev->priv;
973 int ret;
974
Amit Shahf8fb5bc2011-12-22 16:58:30 +0530975 ret = init_vq(vdev->priv);
Michael S. Tsirkin6d62c372014-10-15 10:22:32 +1030976 if (ret)
977 return ret;
Jens Axboe1cf7e9c2013-11-01 10:52:52 -0600978
Michael S. Tsirkin6d62c372014-10-15 10:22:32 +1030979 virtio_device_ready(vdev);
980
Sagi Grimberg9b3e9902017-07-04 10:03:03 +0300981 blk_mq_unquiesce_queue(vblk->disk->queue);
Michael S. Tsirkin6d62c372014-10-15 10:22:32 +1030982 return 0;
Amit Shahf8fb5bc2011-12-22 16:58:30 +0530983}
984#endif
985
Márton Németh47483e22010-01-10 13:40:02 +0100986static const struct virtio_device_id id_table[] = {
Rusty Russelle467cde2007-10-22 11:03:38 +1000987 { VIRTIO_ID_BLOCK, VIRTIO_DEV_ANY_ID },
988 { 0 },
989};
990
Michael S. Tsirkin19c1c5a2014-10-07 16:39:49 +0200991static unsigned int features_legacy[] = {
Tejun Heo02c42b72010-09-03 11:56:18 +0200992 VIRTIO_BLK_F_SEG_MAX, VIRTIO_BLK_F_SIZE_MAX, VIRTIO_BLK_F_GEOMETRY,
Christoph Hellwig97b50a62017-01-28 09:32:53 +0100993 VIRTIO_BLK_F_RO, VIRTIO_BLK_F_BLK_SIZE,
994#ifdef CONFIG_VIRTIO_BLK_SCSI
995 VIRTIO_BLK_F_SCSI,
996#endif
Michael S. Tsirkin592002f2016-02-24 17:07:27 +0200997 VIRTIO_BLK_F_FLUSH, VIRTIO_BLK_F_TOPOLOGY, VIRTIO_BLK_F_CONFIG_WCE,
Changpeng Liu1f238162018-11-01 15:40:35 -0700998 VIRTIO_BLK_F_MQ, VIRTIO_BLK_F_DISCARD, VIRTIO_BLK_F_WRITE_ZEROES,
Michael S. Tsirkin19c1c5a2014-10-07 16:39:49 +0200999}
1000;
1001static unsigned int features[] = {
1002 VIRTIO_BLK_F_SEG_MAX, VIRTIO_BLK_F_SIZE_MAX, VIRTIO_BLK_F_GEOMETRY,
1003 VIRTIO_BLK_F_RO, VIRTIO_BLK_F_BLK_SIZE,
Michael S. Tsirkin592002f2016-02-24 17:07:27 +02001004 VIRTIO_BLK_F_FLUSH, VIRTIO_BLK_F_TOPOLOGY, VIRTIO_BLK_F_CONFIG_WCE,
Changpeng Liu1f238162018-11-01 15:40:35 -07001005 VIRTIO_BLK_F_MQ, VIRTIO_BLK_F_DISCARD, VIRTIO_BLK_F_WRITE_ZEROES,
Rusty Russellc45a6812008-05-02 21:50:50 -05001006};
1007
Greg Kroah-Hartman8d85fce2012-12-21 15:13:49 -08001008static struct virtio_driver virtio_blk = {
Michael S. Tsirkin19c1c5a2014-10-07 16:39:49 +02001009 .feature_table = features,
1010 .feature_table_size = ARRAY_SIZE(features),
1011 .feature_table_legacy = features_legacy,
1012 .feature_table_size_legacy = ARRAY_SIZE(features_legacy),
1013 .driver.name = KBUILD_MODNAME,
1014 .driver.owner = THIS_MODULE,
1015 .id_table = id_table,
1016 .probe = virtblk_probe,
1017 .remove = virtblk_remove,
1018 .config_changed = virtblk_config_changed,
Aaron Lu89107002013-09-17 09:25:23 +09301019#ifdef CONFIG_PM_SLEEP
Michael S. Tsirkin19c1c5a2014-10-07 16:39:49 +02001020 .freeze = virtblk_freeze,
1021 .restore = virtblk_restore,
Amit Shahf8fb5bc2011-12-22 16:58:30 +05301022#endif
Rusty Russelle467cde2007-10-22 11:03:38 +10001023};
1024
1025static int __init init(void)
1026{
Christoph Hellwig7a7c9242011-02-01 21:43:48 +01001027 int error;
1028
1029 virtblk_wq = alloc_workqueue("virtio-blk", 0, 0);
1030 if (!virtblk_wq)
1031 return -ENOMEM;
1032
Christian Borntraeger4f3bf192008-01-31 15:53:53 +01001033 major = register_blkdev(0, "virtblk");
Christoph Hellwig7a7c9242011-02-01 21:43:48 +01001034 if (major < 0) {
1035 error = major;
1036 goto out_destroy_workqueue;
1037 }
1038
1039 error = register_virtio_driver(&virtio_blk);
1040 if (error)
1041 goto out_unregister_blkdev;
1042 return 0;
1043
1044out_unregister_blkdev:
1045 unregister_blkdev(major, "virtblk");
1046out_destroy_workqueue:
1047 destroy_workqueue(virtblk_wq);
1048 return error;
Rusty Russelle467cde2007-10-22 11:03:38 +10001049}
1050
1051static void __exit fini(void)
1052{
Rusty Russelle467cde2007-10-22 11:03:38 +10001053 unregister_virtio_driver(&virtio_blk);
Michael S. Tsirkin38f37b52014-10-23 18:57:19 +03001054 unregister_blkdev(major, "virtblk");
Christoph Hellwig7a7c9242011-02-01 21:43:48 +01001055 destroy_workqueue(virtblk_wq);
Rusty Russelle467cde2007-10-22 11:03:38 +10001056}
1057module_init(init);
1058module_exit(fini);
1059
1060MODULE_DEVICE_TABLE(virtio, id_table);
1061MODULE_DESCRIPTION("Virtio block driver");
1062MODULE_LICENSE("GPL");