blob: d2fe679519e441818f77e851ef33ce47371844ae [file] [log] [blame]
Rusty Russelle467cde2007-10-22 11:03:38 +10001//#define DEBUG
2#include <linux/spinlock.h>
3#include <linux/blkdev.h>
4#include <linux/hdreg.h>
5#include <linux/virtio.h>
6#include <linux/virtio_blk.h>
Jens Axboe3d1266c2007-10-24 13:21:21 +02007#include <linux/scatterlist.h>
8
/*
 * Number of entries in the per-device scatterlist: the block layer's
 * MAX_PHYS_SEGMENTS data segments plus three spare entries.  do_req() uses
 * two of the spare entries for the request's out and in headers.
 */
#define VIRTIO_MAX_SG (MAX_PHYS_SEGMENTS + 3)

/* Letter appended to "vd" to name the next disk that gets probed. */
static unsigned char virtblk_index = 'a';
12struct virtio_blk
13{
14 spinlock_t lock;
15
16 struct virtio_device *vdev;
17 struct virtqueue *vq;
18
19 /* The disk structure for the kernel. */
20 struct gendisk *disk;
21
22 /* Request tracking. */
23 struct list_head reqs;
24
25 mempool_t *pool;
26
27 /* Scatterlist: can be too big for stack. */
Jens Axboe3d1266c2007-10-24 13:21:21 +020028 struct scatterlist sg[VIRTIO_MAX_SG];
Rusty Russelle467cde2007-10-22 11:03:38 +100029};
30
31struct virtblk_req
32{
33 struct list_head list;
34 struct request *req;
35 struct virtio_blk_outhdr out_hdr;
36 struct virtio_blk_inhdr in_hdr;
37};
38
Rusty Russell18445c42008-02-04 23:49:57 -050039static void blk_done(struct virtqueue *vq)
Rusty Russelle467cde2007-10-22 11:03:38 +100040{
41 struct virtio_blk *vblk = vq->vdev->priv;
42 struct virtblk_req *vbr;
43 unsigned int len;
44 unsigned long flags;
45
46 spin_lock_irqsave(&vblk->lock, flags);
47 while ((vbr = vblk->vq->vq_ops->get_buf(vblk->vq, &len)) != NULL) {
48 int uptodate;
49 switch (vbr->in_hdr.status) {
50 case VIRTIO_BLK_S_OK:
51 uptodate = 1;
52 break;
53 case VIRTIO_BLK_S_UNSUPP:
54 uptodate = -ENOTTY;
55 break;
56 default:
57 uptodate = 0;
58 break;
59 }
60
61 end_dequeued_request(vbr->req, uptodate);
62 list_del(&vbr->list);
63 mempool_free(vbr, vblk->pool);
64 }
65 /* In case queue is stopped waiting for more buffers. */
66 blk_start_queue(vblk->disk->queue);
67 spin_unlock_irqrestore(&vblk->lock, flags);
Rusty Russelle467cde2007-10-22 11:03:38 +100068}
69
70static bool do_req(struct request_queue *q, struct virtio_blk *vblk,
71 struct request *req)
72{
73 unsigned long num, out, in;
74 struct virtblk_req *vbr;
75
76 vbr = mempool_alloc(vblk->pool, GFP_ATOMIC);
77 if (!vbr)
78 /* When another request finishes we'll try again. */
79 return false;
80
81 vbr->req = req;
82 if (blk_fs_request(vbr->req)) {
83 vbr->out_hdr.type = 0;
84 vbr->out_hdr.sector = vbr->req->sector;
85 vbr->out_hdr.ioprio = vbr->req->ioprio;
86 } else if (blk_pc_request(vbr->req)) {
87 vbr->out_hdr.type = VIRTIO_BLK_T_SCSI_CMD;
88 vbr->out_hdr.sector = 0;
89 vbr->out_hdr.ioprio = vbr->req->ioprio;
90 } else {
91 /* We don't put anything else in the queue. */
92 BUG();
93 }
94
95 if (blk_barrier_rq(vbr->req))
96 vbr->out_hdr.type |= VIRTIO_BLK_T_BARRIER;
97
Jens Axboe3d1266c2007-10-24 13:21:21 +020098 /* This init could be done at vblk creation time */
99 sg_init_table(vblk->sg, VIRTIO_MAX_SG);
Rusty Russelle467cde2007-10-22 11:03:38 +1000100 sg_set_buf(&vblk->sg[0], &vbr->out_hdr, sizeof(vbr->out_hdr));
101 num = blk_rq_map_sg(q, vbr->req, vblk->sg+1);
102 sg_set_buf(&vblk->sg[num+1], &vbr->in_hdr, sizeof(vbr->in_hdr));
103
104 if (rq_data_dir(vbr->req) == WRITE) {
105 vbr->out_hdr.type |= VIRTIO_BLK_T_OUT;
106 out = 1 + num;
107 in = 1;
108 } else {
109 vbr->out_hdr.type |= VIRTIO_BLK_T_IN;
110 out = 1;
111 in = 1 + num;
112 }
113
114 if (vblk->vq->vq_ops->add_buf(vblk->vq, vblk->sg, out, in, vbr)) {
115 mempool_free(vbr, vblk->pool);
116 return false;
117 }
118
119 list_add_tail(&vbr->list, &vblk->reqs);
120 return true;
121}
122
123static void do_virtblk_request(struct request_queue *q)
124{
125 struct virtio_blk *vblk = NULL;
126 struct request *req;
127 unsigned int issued = 0;
128
129 while ((req = elv_next_request(q)) != NULL) {
130 vblk = req->rq_disk->private_data;
131 BUG_ON(req->nr_phys_segments > ARRAY_SIZE(vblk->sg));
132
133 /* If this request fails, stop queue and wait for something to
134 finish to restart it. */
135 if (!do_req(q, vblk, req)) {
136 blk_stop_queue(q);
137 break;
138 }
139 blkdev_dequeue_request(req);
140 issued++;
141 }
142
143 if (issued)
144 vblk->vq->vq_ops->kick(vblk->vq);
145}
146
147static int virtblk_ioctl(struct inode *inode, struct file *filp,
148 unsigned cmd, unsigned long data)
149{
150 return scsi_cmd_ioctl(filp, inode->i_bdev->bd_disk->queue,
151 inode->i_bdev->bd_disk, cmd,
152 (void __user *)data);
153}
154
Christian Borntraeger135da0b2008-01-23 17:56:50 +0100155/* We provide getgeo only to please some old bootloader/partitioning tools */
156static int virtblk_getgeo(struct block_device *bd, struct hd_geometry *geo)
157{
158 /* some standard values, similar to sd */
159 geo->heads = 1 << 6;
160 geo->sectors = 1 << 5;
161 geo->cylinders = get_capacity(bd->bd_disk) >> 11;
162 return 0;
163}
164
Rusty Russelle467cde2007-10-22 11:03:38 +1000165static struct block_device_operations virtblk_fops = {
Christian Borntraeger135da0b2008-01-23 17:56:50 +0100166 .ioctl = virtblk_ioctl,
167 .owner = THIS_MODULE,
168 .getgeo = virtblk_getgeo,
Rusty Russelle467cde2007-10-22 11:03:38 +1000169};
170
171static int virtblk_probe(struct virtio_device *vdev)
172{
173 struct virtio_blk *vblk;
174 int err, major;
Rusty Russelle467cde2007-10-22 11:03:38 +1000175 u64 cap;
176 u32 v;
177
178 vdev->priv = vblk = kmalloc(sizeof(*vblk), GFP_KERNEL);
179 if (!vblk) {
180 err = -ENOMEM;
181 goto out;
182 }
183
184 INIT_LIST_HEAD(&vblk->reqs);
185 spin_lock_init(&vblk->lock);
186 vblk->vdev = vdev;
187
188 /* We expect one virtqueue, for output. */
Rusty Russella586d4f2008-02-04 23:49:56 -0500189 vblk->vq = vdev->config->find_vq(vdev, 0, blk_done);
Rusty Russelle467cde2007-10-22 11:03:38 +1000190 if (IS_ERR(vblk->vq)) {
191 err = PTR_ERR(vblk->vq);
192 goto out_free_vblk;
193 }
194
195 vblk->pool = mempool_create_kmalloc_pool(1,sizeof(struct virtblk_req));
196 if (!vblk->pool) {
197 err = -ENOMEM;
198 goto out_free_vq;
199 }
200
201 major = register_blkdev(0, "virtblk");
202 if (major < 0) {
203 err = major;
204 goto out_mempool;
205 }
206
207 /* FIXME: How many partitions? How long is a piece of string? */
208 vblk->disk = alloc_disk(1 << 4);
209 if (!vblk->disk) {
210 err = -ENOMEM;
211 goto out_unregister_blkdev;
212 }
213
214 vblk->disk->queue = blk_init_queue(do_virtblk_request, &vblk->lock);
215 if (!vblk->disk->queue) {
216 err = -ENOMEM;
217 goto out_put_disk;
218 }
219
220 sprintf(vblk->disk->disk_name, "vd%c", virtblk_index++);
221 vblk->disk->major = major;
222 vblk->disk->first_minor = 0;
223 vblk->disk->private_data = vblk;
224 vblk->disk->fops = &virtblk_fops;
225
226 /* If barriers are supported, tell block layer that queue is ordered */
Rusty Russella586d4f2008-02-04 23:49:56 -0500227 if (vdev->config->feature(vdev, VIRTIO_BLK_F_BARRIER))
Rusty Russelle467cde2007-10-22 11:03:38 +1000228 blk_queue_ordered(vblk->disk->queue, QUEUE_ORDERED_TAG, NULL);
229
Rusty Russella586d4f2008-02-04 23:49:56 -0500230 /* Host must always specify the capacity. */
231 __virtio_config_val(vdev, offsetof(struct virtio_blk_config, capacity),
232 &cap);
Rusty Russelle467cde2007-10-22 11:03:38 +1000233
234 /* If capacity is too big, truncate with warning. */
235 if ((sector_t)cap != cap) {
236 dev_warn(&vdev->dev, "Capacity %llu too large: truncating\n",
237 (unsigned long long)cap);
238 cap = (sector_t)-1;
239 }
240 set_capacity(vblk->disk, cap);
241
Rusty Russella586d4f2008-02-04 23:49:56 -0500242 /* Host can optionally specify maximum segment size and number of
243 * segments. */
244 err = virtio_config_val(vdev, VIRTIO_BLK_F_SIZE_MAX,
245 offsetof(struct virtio_blk_config, size_max),
246 &v);
Rusty Russelle467cde2007-10-22 11:03:38 +1000247 if (!err)
248 blk_queue_max_segment_size(vblk->disk->queue, v);
Rusty Russelle467cde2007-10-22 11:03:38 +1000249
Rusty Russella586d4f2008-02-04 23:49:56 -0500250 err = virtio_config_val(vdev, VIRTIO_BLK_F_SEG_MAX,
251 offsetof(struct virtio_blk_config, seg_max),
252 &v);
Rusty Russelle467cde2007-10-22 11:03:38 +1000253 if (!err)
254 blk_queue_max_hw_segments(vblk->disk->queue, v);
Rusty Russelle467cde2007-10-22 11:03:38 +1000255
256 add_disk(vblk->disk);
257 return 0;
258
259out_put_disk:
260 put_disk(vblk->disk);
261out_unregister_blkdev:
262 unregister_blkdev(major, "virtblk");
263out_mempool:
264 mempool_destroy(vblk->pool);
265out_free_vq:
266 vdev->config->del_vq(vblk->vq);
267out_free_vblk:
268 kfree(vblk);
269out:
270 return err;
271}
272
273static void virtblk_remove(struct virtio_device *vdev)
274{
275 struct virtio_blk *vblk = vdev->priv;
276 int major = vblk->disk->major;
277
Rusty Russell6e5aa7e2008-02-04 23:50:03 -0500278 /* Nothing should be pending. */
Rusty Russelle467cde2007-10-22 11:03:38 +1000279 BUG_ON(!list_empty(&vblk->reqs));
Rusty Russell6e5aa7e2008-02-04 23:50:03 -0500280
281 /* Stop all the virtqueues. */
282 vdev->config->reset(vdev);
283
Rusty Russelle467cde2007-10-22 11:03:38 +1000284 blk_cleanup_queue(vblk->disk->queue);
285 put_disk(vblk->disk);
286 unregister_blkdev(major, "virtblk");
287 mempool_destroy(vblk->pool);
Rusty Russell74b25532007-11-19 11:20:42 -0500288 vdev->config->del_vq(vblk->vq);
Rusty Russelle467cde2007-10-22 11:03:38 +1000289 kfree(vblk);
290}
291
292static struct virtio_device_id id_table[] = {
293 { VIRTIO_ID_BLOCK, VIRTIO_DEV_ANY_ID },
294 { 0 },
295};
296
297static struct virtio_driver virtio_blk = {
298 .driver.name = KBUILD_MODNAME,
299 .driver.owner = THIS_MODULE,
300 .id_table = id_table,
301 .probe = virtblk_probe,
302 .remove = __devexit_p(virtblk_remove),
303};
304
305static int __init init(void)
306{
307 return register_virtio_driver(&virtio_blk);
308}
309
310static void __exit fini(void)
311{
312 unregister_virtio_driver(&virtio_blk);
313}
314module_init(init);
315module_exit(fini);
316
317MODULE_DEVICE_TABLE(virtio, id_table);
318MODULE_DESCRIPTION("Virtio block driver");
319MODULE_LICENSE("GPL");