]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blame - drivers/block/virtio_blk.c
virtio_ring: add new function virtqueue_is_broken()
[mirror_ubuntu-artful-kernel.git] / drivers / block / virtio_blk.c
CommitLineData
e467cde2
RR
1//#define DEBUG
2#include <linux/spinlock.h>
5a0e3ad6 3#include <linux/slab.h>
e467cde2
RR
4#include <linux/blkdev.h>
5#include <linux/hdreg.h>
0c8d44f2 6#include <linux/module.h>
4678d6f9 7#include <linux/mutex.h>
e467cde2
RR
8#include <linux/virtio.h>
9#include <linux/virtio_blk.h>
3d1266c7 10#include <linux/scatterlist.h>
7a7c924c 11#include <linux/string_helpers.h>
6917f83f 12#include <scsi/scsi_cmnd.h>
5087a50e 13#include <linux/idr.h>
3d1266c7 14
4f3bf19c 15#define PART_BITS 4
e467cde2 16
a98755c5
AH
17static bool use_bio;
18module_param(use_bio, bool, S_IRUGO);
19
5087a50e
MT
20static int major;
21static DEFINE_IDA(vd_index_ida);
22
2a647bfe 23static struct workqueue_struct *virtblk_wq;
4f3bf19c 24
e467cde2
RR
25struct virtio_blk
26{
e467cde2
RR
27 struct virtio_device *vdev;
28 struct virtqueue *vq;
a98755c5 29 wait_queue_head_t queue_wait;
e467cde2
RR
30
31 /* The disk structure for the kernel. */
32 struct gendisk *disk;
33
e467cde2
RR
34 mempool_t *pool;
35
7a7c924c
CH
36 /* Process context for config space updates */
37 struct work_struct config_work;
38
4678d6f9
MT
39 /* Lock for config space updates */
40 struct mutex config_lock;
41
42 /* enable config space updates */
43 bool config_enable;
44
0864b79a
RR
45 /* What host tells us, plus 2 for header & tailer. */
46 unsigned int sg_elems;
47
5087a50e
MT
48 /* Ida index - used to track minor number allocations. */
49 int index;
50
e467cde2 51 /* Scatterlist: can be too big for stack. */
0864b79a 52 struct scatterlist sg[/*sg_elems*/];
e467cde2
RR
53};
54
55struct virtblk_req
56{
e467cde2 57 struct request *req;
a98755c5 58 struct bio *bio;
e467cde2 59 struct virtio_blk_outhdr out_hdr;
1cde26f9 60 struct virtio_scsi_inhdr in_hdr;
c85a1f91
AH
61 struct work_struct work;
62 struct virtio_blk *vblk;
63 int flags;
cb38fa23 64 u8 status;
a98755c5 65 struct scatterlist sg[];
e467cde2
RR
66};
67
c85a1f91
AH
/* Bits stored in virtblk_req.flags by the bio path. */
enum {
	VBLK_IS_FLUSH	= 1 << 0,	/* the command currently queued is a flush */
	VBLK_REQ_FLUSH	= 1 << 1,	/* the bio carried REQ_FLUSH */
	VBLK_REQ_DATA	= 1 << 2,	/* the bio has a non-zero bi_size */
	VBLK_REQ_FUA	= 1 << 3,	/* the bio carried REQ_FUA */
};
74
a98755c5
AH
75static inline int virtblk_result(struct virtblk_req *vbr)
76{
77 switch (vbr->status) {
78 case VIRTIO_BLK_S_OK:
79 return 0;
80 case VIRTIO_BLK_S_UNSUPP:
81 return -ENOTTY;
82 default:
83 return -EIO;
84 }
85}
86
c85a1f91
AH
87static inline struct virtblk_req *virtblk_alloc_req(struct virtio_blk *vblk,
88 gfp_t gfp_mask)
89{
90 struct virtblk_req *vbr;
91
92 vbr = mempool_alloc(vblk->pool, gfp_mask);
f22cf8eb
DC
93 if (!vbr)
94 return NULL;
c85a1f91
AH
95
96 vbr->vblk = vblk;
f22cf8eb
DC
97 if (use_bio)
98 sg_init_table(vbr->sg, vblk->sg_elems);
c85a1f91
AH
99
100 return vbr;
101}
102
8f39db9d 103static int __virtblk_add_req(struct virtqueue *vq,
20af3cfd
PB
104 struct virtblk_req *vbr,
105 struct scatterlist *data_sg,
0a11cc36 106 bool have_data)
c85a1f91 107{
20af3cfd 108 struct scatterlist hdr, status, cmd, sense, inhdr, *sgs[6];
8f39db9d 109 unsigned int num_out = 0, num_in = 0;
20af3cfd 110 int type = vbr->out_hdr.type & ~VIRTIO_BLK_T_OUT;
8f39db9d
PB
111
112 sg_init_one(&hdr, &vbr->out_hdr, sizeof(vbr->out_hdr));
113 sgs[num_out++] = &hdr;
114
20af3cfd
PB
115 /*
116 * If this is a packet command we need a couple of additional headers.
117 * Behind the normal outhdr we put a segment with the scsi command
118 * block, and before the normal inhdr we put the sense data and the
119 * inhdr with additional status information.
120 */
121 if (type == VIRTIO_BLK_T_SCSI_CMD) {
122 sg_init_one(&cmd, vbr->req->cmd, vbr->req->cmd_len);
123 sgs[num_out++] = &cmd;
124 }
125
0a11cc36 126 if (have_data) {
8f39db9d 127 if (vbr->out_hdr.type & VIRTIO_BLK_T_OUT)
20af3cfd 128 sgs[num_out++] = data_sg;
8f39db9d 129 else
20af3cfd
PB
130 sgs[num_out + num_in++] = data_sg;
131 }
132
133 if (type == VIRTIO_BLK_T_SCSI_CMD) {
134 sg_init_one(&sense, vbr->req->sense, SCSI_SENSE_BUFFERSIZE);
135 sgs[num_out + num_in++] = &sense;
136 sg_init_one(&inhdr, &vbr->in_hdr, sizeof(vbr->in_hdr));
137 sgs[num_out + num_in++] = &inhdr;
8f39db9d
PB
138 }
139
140 sg_init_one(&status, &vbr->status, sizeof(vbr->status));
141 sgs[num_out + num_in++] = &status;
142
143 return virtqueue_add_sgs(vq, sgs, num_out, num_in, vbr, GFP_ATOMIC);
5ee21a52
PB
144}
145
0a11cc36 146static void virtblk_add_req(struct virtblk_req *vbr, bool have_data)
5ee21a52
PB
147{
148 struct virtio_blk *vblk = vbr->vblk;
c85a1f91 149 DEFINE_WAIT(wait);
5ee21a52 150 int ret;
c85a1f91 151
5ee21a52 152 spin_lock_irq(vblk->disk->queue->queue_lock);
20af3cfd 153 while (unlikely((ret = __virtblk_add_req(vblk->vq, vbr, vbr->sg,
0a11cc36 154 have_data)) < 0)) {
c85a1f91
AH
155 prepare_to_wait_exclusive(&vblk->queue_wait, &wait,
156 TASK_UNINTERRUPTIBLE);
157
5ee21a52
PB
158 spin_unlock_irq(vblk->disk->queue->queue_lock);
159 io_schedule();
c85a1f91 160 spin_lock_irq(vblk->disk->queue->queue_lock);
c85a1f91 161
5ee21a52 162 finish_wait(&vblk->queue_wait, &wait);
c85a1f91
AH
163 }
164
c85a1f91
AH
165 virtqueue_kick(vblk->vq);
166 spin_unlock_irq(vblk->disk->queue->queue_lock);
167}
168
5ee21a52 169static void virtblk_bio_send_flush(struct virtblk_req *vbr)
c85a1f91 170{
c85a1f91
AH
171 vbr->flags |= VBLK_IS_FLUSH;
172 vbr->out_hdr.type = VIRTIO_BLK_T_FLUSH;
173 vbr->out_hdr.sector = 0;
174 vbr->out_hdr.ioprio = 0;
c85a1f91 175
0a11cc36 176 virtblk_add_req(vbr, false);
c85a1f91
AH
177}
178
5ee21a52 179static void virtblk_bio_send_data(struct virtblk_req *vbr)
c85a1f91
AH
180{
181 struct virtio_blk *vblk = vbr->vblk;
c85a1f91 182 struct bio *bio = vbr->bio;
0a11cc36 183 bool have_data;
c85a1f91
AH
184
185 vbr->flags &= ~VBLK_IS_FLUSH;
186 vbr->out_hdr.type = 0;
187 vbr->out_hdr.sector = bio->bi_sector;
188 vbr->out_hdr.ioprio = bio_prio(bio);
189
0a11cc36
RR
190 if (blk_bio_map_sg(vblk->disk->queue, bio, vbr->sg)) {
191 have_data = true;
8f39db9d 192 if (bio->bi_rw & REQ_WRITE)
c85a1f91 193 vbr->out_hdr.type |= VIRTIO_BLK_T_OUT;
8f39db9d 194 else
c85a1f91 195 vbr->out_hdr.type |= VIRTIO_BLK_T_IN;
0a11cc36
RR
196 } else
197 have_data = false;
c85a1f91 198
0a11cc36 199 virtblk_add_req(vbr, have_data);
c85a1f91
AH
200}
201
202static void virtblk_bio_send_data_work(struct work_struct *work)
203{
204 struct virtblk_req *vbr;
205
206 vbr = container_of(work, struct virtblk_req, work);
207
208 virtblk_bio_send_data(vbr);
209}
210
211static void virtblk_bio_send_flush_work(struct work_struct *work)
212{
213 struct virtblk_req *vbr;
214
215 vbr = container_of(work, struct virtblk_req, work);
216
217 virtblk_bio_send_flush(vbr);
218}
219
220static inline void virtblk_request_done(struct virtblk_req *vbr)
a98755c5 221{
c85a1f91 222 struct virtio_blk *vblk = vbr->vblk;
a98755c5
AH
223 struct request *req = vbr->req;
224 int error = virtblk_result(vbr);
225
226 if (req->cmd_type == REQ_TYPE_BLOCK_PC) {
227 req->resid_len = vbr->in_hdr.residual;
228 req->sense_len = vbr->in_hdr.sense_len;
229 req->errors = vbr->in_hdr.errors;
230 } else if (req->cmd_type == REQ_TYPE_SPECIAL) {
231 req->errors = (error != 0);
232 }
233
234 __blk_end_request_all(req, error);
235 mempool_free(vbr, vblk->pool);
236}
237
c85a1f91 238static inline void virtblk_bio_flush_done(struct virtblk_req *vbr)
a98755c5 239{
c85a1f91
AH
240 struct virtio_blk *vblk = vbr->vblk;
241
242 if (vbr->flags & VBLK_REQ_DATA) {
243 /* Send out the actual write data */
244 INIT_WORK(&vbr->work, virtblk_bio_send_data_work);
245 queue_work(virtblk_wq, &vbr->work);
246 } else {
247 bio_endio(vbr->bio, virtblk_result(vbr));
248 mempool_free(vbr, vblk->pool);
249 }
250}
251
252static inline void virtblk_bio_data_done(struct virtblk_req *vbr)
253{
254 struct virtio_blk *vblk = vbr->vblk;
255
256 if (unlikely(vbr->flags & VBLK_REQ_FUA)) {
257 /* Send out a flush before end the bio */
258 vbr->flags &= ~VBLK_REQ_DATA;
259 INIT_WORK(&vbr->work, virtblk_bio_send_flush_work);
260 queue_work(virtblk_wq, &vbr->work);
261 } else {
262 bio_endio(vbr->bio, virtblk_result(vbr));
263 mempool_free(vbr, vblk->pool);
264 }
265}
266
267static inline void virtblk_bio_done(struct virtblk_req *vbr)
268{
269 if (unlikely(vbr->flags & VBLK_IS_FLUSH))
270 virtblk_bio_flush_done(vbr);
271 else
272 virtblk_bio_data_done(vbr);
a98755c5
AH
273}
274
275static void virtblk_done(struct virtqueue *vq)
e467cde2
RR
276{
277 struct virtio_blk *vblk = vq->vdev->priv;
c85a1f91 278 bool bio_done = false, req_done = false;
e467cde2 279 struct virtblk_req *vbr;
e467cde2 280 unsigned long flags;
a98755c5 281 unsigned int len;
e467cde2 282
2c95a329 283 spin_lock_irqsave(vblk->disk->queue->queue_lock, flags);
bb811108
AH
284 do {
285 virtqueue_disable_cb(vq);
286 while ((vbr = virtqueue_get_buf(vblk->vq, &len)) != NULL) {
287 if (vbr->bio) {
288 virtblk_bio_done(vbr);
289 bio_done = true;
290 } else {
291 virtblk_request_done(vbr);
292 req_done = true;
293 }
33659ebb 294 }
bb811108 295 } while (!virtqueue_enable_cb(vq));
e467cde2 296 /* In case queue is stopped waiting for more buffers. */
a98755c5
AH
297 if (req_done)
298 blk_start_queue(vblk->disk->queue);
2c95a329 299 spin_unlock_irqrestore(vblk->disk->queue->queue_lock, flags);
a98755c5
AH
300
301 if (bio_done)
302 wake_up(&vblk->queue_wait);
303}
304
e467cde2
RR
305static bool do_req(struct request_queue *q, struct virtio_blk *vblk,
306 struct request *req)
307{
20af3cfd 308 unsigned int num;
e467cde2
RR
309 struct virtblk_req *vbr;
310
a98755c5 311 vbr = virtblk_alloc_req(vblk, GFP_ATOMIC);
e467cde2
RR
312 if (!vbr)
313 /* When another request finishes we'll try again. */
314 return false;
315
316 vbr->req = req;
a98755c5 317 vbr->bio = NULL;
dd40e456
FT
318 if (req->cmd_flags & REQ_FLUSH) {
319 vbr->out_hdr.type = VIRTIO_BLK_T_FLUSH;
4cb2ea28 320 vbr->out_hdr.sector = 0;
321 vbr->out_hdr.ioprio = req_get_ioprio(vbr->req);
dd40e456
FT
322 } else {
323 switch (req->cmd_type) {
324 case REQ_TYPE_FS:
325 vbr->out_hdr.type = 0;
326 vbr->out_hdr.sector = blk_rq_pos(vbr->req);
327 vbr->out_hdr.ioprio = req_get_ioprio(vbr->req);
328 break;
329 case REQ_TYPE_BLOCK_PC:
330 vbr->out_hdr.type = VIRTIO_BLK_T_SCSI_CMD;
f1b0ef06
CH
331 vbr->out_hdr.sector = 0;
332 vbr->out_hdr.ioprio = req_get_ioprio(vbr->req);
333 break;
dd40e456
FT
334 case REQ_TYPE_SPECIAL:
335 vbr->out_hdr.type = VIRTIO_BLK_T_GET_ID;
336 vbr->out_hdr.sector = 0;
337 vbr->out_hdr.ioprio = req_get_ioprio(vbr->req);
338 break;
339 default:
340 /* We don't put anything else in the queue. */
341 BUG();
f1b0ef06 342 }
e467cde2
RR
343 }
344
20af3cfd 345 num = blk_rq_map_sg(q, vbr->req, vblk->sg);
1cde26f9 346 if (num) {
20af3cfd 347 if (rq_data_dir(vbr->req) == WRITE)
1cde26f9 348 vbr->out_hdr.type |= VIRTIO_BLK_T_OUT;
20af3cfd 349 else
1cde26f9 350 vbr->out_hdr.type |= VIRTIO_BLK_T_IN;
e467cde2
RR
351 }
352
20af3cfd 353 if (__virtblk_add_req(vblk->vq, vbr, vblk->sg, num) < 0) {
e467cde2
RR
354 mempool_free(vbr, vblk->pool);
355 return false;
356 }
357
e467cde2
RR
358 return true;
359}
360
a98755c5 361static void virtblk_request(struct request_queue *q)
e467cde2 362{
6c3b46f7 363 struct virtio_blk *vblk = q->queuedata;
e467cde2
RR
364 struct request *req;
365 unsigned int issued = 0;
366
9934c8c0 367 while ((req = blk_peek_request(q)) != NULL) {
0864b79a 368 BUG_ON(req->nr_phys_segments + 2 > vblk->sg_elems);
e467cde2
RR
369
370 /* If this request fails, stop queue and wait for something to
371 finish to restart it. */
372 if (!do_req(q, vblk, req)) {
373 blk_stop_queue(q);
374 break;
375 }
9934c8c0 376 blk_start_request(req);
e467cde2
RR
377 issued++;
378 }
379
380 if (issued)
09ec6b69 381 virtqueue_kick(vblk->vq);
e467cde2
RR
382}
383
a98755c5
AH
384static void virtblk_make_request(struct request_queue *q, struct bio *bio)
385{
386 struct virtio_blk *vblk = q->queuedata;
a98755c5
AH
387 struct virtblk_req *vbr;
388
389 BUG_ON(bio->bi_phys_segments + 2 > vblk->sg_elems);
a98755c5
AH
390
391 vbr = virtblk_alloc_req(vblk, GFP_NOIO);
392 if (!vbr) {
393 bio_endio(bio, -ENOMEM);
394 return;
395 }
396
397 vbr->bio = bio;
c85a1f91
AH
398 vbr->flags = 0;
399 if (bio->bi_rw & REQ_FLUSH)
400 vbr->flags |= VBLK_REQ_FLUSH;
401 if (bio->bi_rw & REQ_FUA)
402 vbr->flags |= VBLK_REQ_FUA;
403 if (bio->bi_size)
404 vbr->flags |= VBLK_REQ_DATA;
405
406 if (unlikely(vbr->flags & VBLK_REQ_FLUSH))
407 virtblk_bio_send_flush(vbr);
408 else
409 virtblk_bio_send_data(vbr);
a98755c5
AH
410}
411
4cb2ea28 412/* return id (s/n) string for *disk to *id_str
413 */
414static int virtblk_get_id(struct gendisk *disk, char *id_str)
415{
416 struct virtio_blk *vblk = disk->private_data;
417 struct request *req;
418 struct bio *bio;
e4c4776d 419 int err;
4cb2ea28 420
421 bio = bio_map_kern(vblk->disk->queue, id_str, VIRTIO_BLK_ID_BYTES,
422 GFP_KERNEL);
423 if (IS_ERR(bio))
424 return PTR_ERR(bio);
425
426 req = blk_make_request(vblk->disk->queue, bio, GFP_KERNEL);
427 if (IS_ERR(req)) {
428 bio_put(bio);
429 return PTR_ERR(req);
430 }
431
432 req->cmd_type = REQ_TYPE_SPECIAL;
e4c4776d
MS
433 err = blk_execute_rq(vblk->disk->queue, vblk->disk, req, false);
434 blk_put_request(req);
435
436 return err;
4cb2ea28 437}
438
fe5a50a1
CH
439static int virtblk_ioctl(struct block_device *bdev, fmode_t mode,
440 unsigned int cmd, unsigned long data)
e467cde2 441{
1cde26f9
HR
442 struct gendisk *disk = bdev->bd_disk;
443 struct virtio_blk *vblk = disk->private_data;
444
445 /*
446 * Only allow the generic SCSI ioctls if the host can support it.
447 */
448 if (!virtio_has_feature(vblk->vdev, VIRTIO_BLK_F_SCSI))
d9ecdea7 449 return -ENOTTY;
1cde26f9 450
577ebb37
PB
451 return scsi_cmd_blk_ioctl(bdev, mode, cmd,
452 (void __user *)data);
e467cde2
RR
453}
454
135da0b0
CB
455/* We provide getgeo only to please some old bootloader/partitioning tools */
456static int virtblk_getgeo(struct block_device *bd, struct hd_geometry *geo)
457{
48e4043d 458 struct virtio_blk *vblk = bd->bd_disk->private_data;
48e4043d
RH
459
460 /* see if the host passed in geometry config */
855e0c52
RR
461 if (virtio_has_feature(vblk->vdev, VIRTIO_BLK_F_GEOMETRY)) {
462 virtio_cread(vblk->vdev, struct virtio_blk_config,
463 geometry.cylinders, &geo->cylinders);
464 virtio_cread(vblk->vdev, struct virtio_blk_config,
465 geometry.heads, &geo->heads);
466 virtio_cread(vblk->vdev, struct virtio_blk_config,
467 geometry.sectors, &geo->sectors);
48e4043d
RH
468 } else {
469 /* some standard values, similar to sd */
470 geo->heads = 1 << 6;
471 geo->sectors = 1 << 5;
472 geo->cylinders = get_capacity(bd->bd_disk) >> 11;
473 }
135da0b0
CB
474 return 0;
475}
476
83d5cde4 477static const struct block_device_operations virtblk_fops = {
8a6cfeb6 478 .ioctl = virtblk_ioctl,
135da0b0
CB
479 .owner = THIS_MODULE,
480 .getgeo = virtblk_getgeo,
e467cde2
RR
481};
482
d50ed907
CB
483static int index_to_minor(int index)
484{
485 return index << PART_BITS;
486}
487
5087a50e
MT
488static int minor_to_index(int minor)
489{
490 return minor >> PART_BITS;
491}
492
a5eb9e4f
RH
493static ssize_t virtblk_serial_show(struct device *dev,
494 struct device_attribute *attr, char *buf)
495{
496 struct gendisk *disk = dev_to_disk(dev);
497 int err;
498
499 /* sysfs gives us a PAGE_SIZE buffer */
500 BUILD_BUG_ON(PAGE_SIZE < VIRTIO_BLK_ID_BYTES);
501
502 buf[VIRTIO_BLK_ID_BYTES] = '\0';
503 err = virtblk_get_id(disk, buf);
504 if (!err)
505 return strlen(buf);
506
507 if (err == -EIO) /* Unsupported? Make it empty. */
508 return 0;
509
510 return err;
511}
512DEVICE_ATTR(serial, S_IRUGO, virtblk_serial_show, NULL);
513
7a7c924c
CH
514static void virtblk_config_changed_work(struct work_struct *work)
515{
516 struct virtio_blk *vblk =
517 container_of(work, struct virtio_blk, config_work);
518 struct virtio_device *vdev = vblk->vdev;
519 struct request_queue *q = vblk->disk->queue;
520 char cap_str_2[10], cap_str_10[10];
9d9598b8 521 char *envp[] = { "RESIZE=1", NULL };
7a7c924c
CH
522 u64 capacity, size;
523
4678d6f9
MT
524 mutex_lock(&vblk->config_lock);
525 if (!vblk->config_enable)
526 goto done;
527
7a7c924c 528 /* Host must always specify the capacity. */
855e0c52 529 virtio_cread(vdev, struct virtio_blk_config, capacity, &capacity);
7a7c924c
CH
530
531 /* If capacity is too big, truncate with warning. */
532 if ((sector_t)capacity != capacity) {
533 dev_warn(&vdev->dev, "Capacity %llu too large: truncating\n",
534 (unsigned long long)capacity);
535 capacity = (sector_t)-1;
536 }
537
538 size = capacity * queue_logical_block_size(q);
539 string_get_size(size, STRING_UNITS_2, cap_str_2, sizeof(cap_str_2));
540 string_get_size(size, STRING_UNITS_10, cap_str_10, sizeof(cap_str_10));
541
542 dev_notice(&vdev->dev,
543 "new size: %llu %d-byte logical blocks (%s/%s)\n",
544 (unsigned long long)capacity,
545 queue_logical_block_size(q),
546 cap_str_10, cap_str_2);
547
548 set_capacity(vblk->disk, capacity);
e9986f30 549 revalidate_disk(vblk->disk);
9d9598b8 550 kobject_uevent_env(&disk_to_dev(vblk->disk)->kobj, KOBJ_CHANGE, envp);
4678d6f9
MT
551done:
552 mutex_unlock(&vblk->config_lock);
7a7c924c
CH
553}
554
555static void virtblk_config_changed(struct virtio_device *vdev)
556{
557 struct virtio_blk *vblk = vdev->priv;
558
559 queue_work(virtblk_wq, &vblk->config_work);
560}
561
6abd6e5a
AS
562static int init_vq(struct virtio_blk *vblk)
563{
564 int err = 0;
565
566 /* We expect one virtqueue, for output. */
a98755c5 567 vblk->vq = virtio_find_single_vq(vblk->vdev, virtblk_done, "requests");
6abd6e5a
AS
568 if (IS_ERR(vblk->vq))
569 err = PTR_ERR(vblk->vq);
570
571 return err;
572}
573
c0aa3e09
RM
/*
 * Legacy naming scheme used for virtio devices. We are stuck with it for
 * virtio blk but don't ever use it for any new driver.
 *
 * Writes @prefix followed by a letter suffix for @index into @buf:
 * 0 -> "a", 25 -> "z", 26 -> "aa", 27 -> "ab", and so on.  The suffix is
 * built backwards from the end of the buffer and then moved up behind the
 * prefix.  Returns -EINVAL when @buflen is too small for the name.
 */
static int virtblk_name_format(char *prefix, int index, char *buf, int buflen)
{
	const int nletters = 'z' - 'a' + 1;
	const size_t prefix_len = strlen(prefix);
	char *const suffix_start = buf + prefix_len;
	char *const buf_end = buf + buflen;
	char *cur = buf_end - 1;

	*cur = '\0';
	for (;;) {
		/* No room left in front of what was already emitted. */
		if (cur == suffix_start)
			return -EINVAL;

		*--cur = 'a' + (index % nletters);
		index = index / nletters - 1;
		if (index < 0)
			break;
	}

	/* Slide the suffix (with its terminator) right behind the prefix. */
	memmove(suffix_start, cur, buf_end - cur);
	memcpy(buf, prefix, prefix_len);

	return 0;
}
601
cd5d5038
PB
602static int virtblk_get_cache_mode(struct virtio_device *vdev)
603{
604 u8 writeback;
605 int err;
606
855e0c52
RR
607 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_CONFIG_WCE,
608 struct virtio_blk_config, wce,
609 &writeback);
cd5d5038
PB
610 if (err)
611 writeback = virtio_has_feature(vdev, VIRTIO_BLK_F_WCE);
612
613 return writeback;
614}
615
616static void virtblk_update_cache_mode(struct virtio_device *vdev)
617{
618 u8 writeback = virtblk_get_cache_mode(vdev);
619 struct virtio_blk *vblk = vdev->priv;
620
c85a1f91 621 if (writeback)
cd5d5038
PB
622 blk_queue_flush(vblk->disk->queue, REQ_FLUSH);
623 else
624 blk_queue_flush(vblk->disk->queue, 0);
625
626 revalidate_disk(vblk->disk);
627}
628
/* sysfs names of the cache modes, indexed by virtblk_get_cache_mode(). */
static const char *const virtblk_cache_types[] = {
	[0] = "write through",
	[1] = "write back",
};
632
633static ssize_t
634virtblk_cache_type_store(struct device *dev, struct device_attribute *attr,
635 const char *buf, size_t count)
636{
637 struct gendisk *disk = dev_to_disk(dev);
638 struct virtio_blk *vblk = disk->private_data;
639 struct virtio_device *vdev = vblk->vdev;
640 int i;
cd5d5038
PB
641
642 BUG_ON(!virtio_has_feature(vblk->vdev, VIRTIO_BLK_F_CONFIG_WCE));
643 for (i = ARRAY_SIZE(virtblk_cache_types); --i >= 0; )
644 if (sysfs_streq(buf, virtblk_cache_types[i]))
645 break;
646
647 if (i < 0)
648 return -EINVAL;
649
855e0c52 650 virtio_cwrite8(vdev, offsetof(struct virtio_blk_config, wce), i);
cd5d5038
PB
651 virtblk_update_cache_mode(vdev);
652 return count;
653}
654
655static ssize_t
656virtblk_cache_type_show(struct device *dev, struct device_attribute *attr,
657 char *buf)
658{
659 struct gendisk *disk = dev_to_disk(dev);
660 struct virtio_blk *vblk = disk->private_data;
661 u8 writeback = virtblk_get_cache_mode(vblk->vdev);
662
663 BUG_ON(writeback >= ARRAY_SIZE(virtblk_cache_types));
664 return snprintf(buf, 40, "%s\n", virtblk_cache_types[writeback]);
665}
666
667static const struct device_attribute dev_attr_cache_type_ro =
668 __ATTR(cache_type, S_IRUGO,
669 virtblk_cache_type_show, NULL);
670static const struct device_attribute dev_attr_cache_type_rw =
671 __ATTR(cache_type, S_IRUGO|S_IWUSR,
672 virtblk_cache_type_show, virtblk_cache_type_store);
673
8d85fce7 674static int virtblk_probe(struct virtio_device *vdev)
e467cde2
RR
675{
676 struct virtio_blk *vblk;
69740c8b 677 struct request_queue *q;
5087a50e 678 int err, index;
a98755c5
AH
679 int pool_size;
680
e467cde2 681 u64 cap;
69740c8b
CH
682 u32 v, blk_size, sg_elems, opt_io_size;
683 u16 min_io_size;
684 u8 physical_block_exp, alignment_offset;
e467cde2 685
5087a50e
MT
686 err = ida_simple_get(&vd_index_ida, 0, minor_to_index(1 << MINORBITS),
687 GFP_KERNEL);
688 if (err < 0)
689 goto out;
690 index = err;
4f3bf19c 691
0864b79a 692 /* We need to know how many segments before we allocate. */
855e0c52
RR
693 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_SEG_MAX,
694 struct virtio_blk_config, seg_max,
695 &sg_elems);
a5b365a6
CH
696
697 /* We need at least one SG element, whatever they say. */
698 if (err || !sg_elems)
0864b79a
RR
699 sg_elems = 1;
700
701 /* We need an extra sg elements at head and tail. */
702 sg_elems += 2;
703 vdev->priv = vblk = kmalloc(sizeof(*vblk) +
704 sizeof(vblk->sg[0]) * sg_elems, GFP_KERNEL);
e467cde2
RR
705 if (!vblk) {
706 err = -ENOMEM;
5087a50e 707 goto out_free_index;
e467cde2
RR
708 }
709
a98755c5 710 init_waitqueue_head(&vblk->queue_wait);
e467cde2 711 vblk->vdev = vdev;
0864b79a
RR
712 vblk->sg_elems = sg_elems;
713 sg_init_table(vblk->sg, vblk->sg_elems);
4678d6f9 714 mutex_init(&vblk->config_lock);
a98755c5 715
7a7c924c 716 INIT_WORK(&vblk->config_work, virtblk_config_changed_work);
4678d6f9 717 vblk->config_enable = true;
e467cde2 718
6abd6e5a
AS
719 err = init_vq(vblk);
720 if (err)
e467cde2 721 goto out_free_vblk;
e467cde2 722
a98755c5
AH
723 pool_size = sizeof(struct virtblk_req);
724 if (use_bio)
725 pool_size += sizeof(struct scatterlist) * sg_elems;
726 vblk->pool = mempool_create_kmalloc_pool(1, pool_size);
e467cde2
RR
727 if (!vblk->pool) {
728 err = -ENOMEM;
729 goto out_free_vq;
730 }
731
e467cde2 732 /* FIXME: How many partitions? How long is a piece of string? */
4f3bf19c 733 vblk->disk = alloc_disk(1 << PART_BITS);
e467cde2
RR
734 if (!vblk->disk) {
735 err = -ENOMEM;
4f3bf19c 736 goto out_mempool;
e467cde2
RR
737 }
738
a98755c5 739 q = vblk->disk->queue = blk_init_queue(virtblk_request, NULL);
69740c8b 740 if (!q) {
e467cde2
RR
741 err = -ENOMEM;
742 goto out_put_disk;
743 }
744
a98755c5
AH
745 if (use_bio)
746 blk_queue_make_request(q, virtblk_make_request);
69740c8b 747 q->queuedata = vblk;
7d116b62 748
c0aa3e09 749 virtblk_name_format("vd", index, vblk->disk->disk_name, DISK_NAME_LEN);
d50ed907 750
e467cde2 751 vblk->disk->major = major;
d50ed907 752 vblk->disk->first_minor = index_to_minor(index);
e467cde2
RR
753 vblk->disk->private_data = vblk;
754 vblk->disk->fops = &virtblk_fops;
c4839346 755 vblk->disk->driverfs_dev = &vdev->dev;
5087a50e 756 vblk->index = index;
4f3bf19c 757
02c42b7a 758 /* configure queue flush support */
cd5d5038 759 virtblk_update_cache_mode(vdev);
e467cde2 760
3ef53609
CB
761 /* If disk is read-only in the host, the guest should obey */
762 if (virtio_has_feature(vdev, VIRTIO_BLK_F_RO))
763 set_disk_ro(vblk->disk, 1);
764
a586d4f6 765 /* Host must always specify the capacity. */
855e0c52 766 virtio_cread(vdev, struct virtio_blk_config, capacity, &cap);
e467cde2
RR
767
768 /* If capacity is too big, truncate with warning. */
769 if ((sector_t)cap != cap) {
770 dev_warn(&vdev->dev, "Capacity %llu too large: truncating\n",
771 (unsigned long long)cap);
772 cap = (sector_t)-1;
773 }
774 set_capacity(vblk->disk, cap);
775
0864b79a 776 /* We can handle whatever the host told us to handle. */
ee714f2d 777 blk_queue_max_segments(q, vblk->sg_elems-2);
0864b79a 778
4eff3cae 779 /* No need to bounce any requests */
69740c8b 780 blk_queue_bounce_limit(q, BLK_BOUNCE_ANY);
4eff3cae 781
4b7f7e20 782 /* No real sector limit. */
ee714f2d 783 blk_queue_max_hw_sectors(q, -1U);
4b7f7e20 784
a586d4f6
RR
785 /* Host can optionally specify maximum segment size and number of
786 * segments. */
855e0c52
RR
787 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_SIZE_MAX,
788 struct virtio_blk_config, size_max, &v);
e467cde2 789 if (!err)
69740c8b 790 blk_queue_max_segment_size(q, v);
4b7f7e20 791 else
69740c8b 792 blk_queue_max_segment_size(q, -1U);
e467cde2 793
066f4d82 794 /* Host can optionally specify the block size of the device */
855e0c52
RR
795 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_BLK_SIZE,
796 struct virtio_blk_config, blk_size,
797 &blk_size);
066f4d82 798 if (!err)
69740c8b
CH
799 blk_queue_logical_block_size(q, blk_size);
800 else
801 blk_size = queue_logical_block_size(q);
802
803 /* Use topology information if available */
855e0c52
RR
804 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_TOPOLOGY,
805 struct virtio_blk_config, physical_block_exp,
806 &physical_block_exp);
69740c8b
CH
807 if (!err && physical_block_exp)
808 blk_queue_physical_block_size(q,
809 blk_size * (1 << physical_block_exp));
810
855e0c52
RR
811 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_TOPOLOGY,
812 struct virtio_blk_config, alignment_offset,
813 &alignment_offset);
69740c8b
CH
814 if (!err && alignment_offset)
815 blk_queue_alignment_offset(q, blk_size * alignment_offset);
816
855e0c52
RR
817 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_TOPOLOGY,
818 struct virtio_blk_config, min_io_size,
819 &min_io_size);
69740c8b
CH
820 if (!err && min_io_size)
821 blk_queue_io_min(q, blk_size * min_io_size);
822
855e0c52
RR
823 err = virtio_cread_feature(vdev, VIRTIO_BLK_F_TOPOLOGY,
824 struct virtio_blk_config, opt_io_size,
825 &opt_io_size);
69740c8b
CH
826 if (!err && opt_io_size)
827 blk_queue_io_opt(q, blk_size * opt_io_size);
828
e467cde2 829 add_disk(vblk->disk);
a5eb9e4f
RH
830 err = device_create_file(disk_to_dev(vblk->disk), &dev_attr_serial);
831 if (err)
832 goto out_del_disk;
833
cd5d5038
PB
834 if (virtio_has_feature(vdev, VIRTIO_BLK_F_CONFIG_WCE))
835 err = device_create_file(disk_to_dev(vblk->disk),
836 &dev_attr_cache_type_rw);
837 else
838 err = device_create_file(disk_to_dev(vblk->disk),
839 &dev_attr_cache_type_ro);
840 if (err)
841 goto out_del_disk;
e467cde2
RR
842 return 0;
843
a5eb9e4f
RH
844out_del_disk:
845 del_gendisk(vblk->disk);
846 blk_cleanup_queue(vblk->disk->queue);
e467cde2
RR
847out_put_disk:
848 put_disk(vblk->disk);
e467cde2
RR
849out_mempool:
850 mempool_destroy(vblk->pool);
851out_free_vq:
d2a7ddda 852 vdev->config->del_vqs(vdev);
e467cde2
RR
853out_free_vblk:
854 kfree(vblk);
5087a50e
MT
855out_free_index:
856 ida_simple_remove(&vd_index_ida, index);
e467cde2
RR
857out:
858 return err;
859}
860
8d85fce7 861static void virtblk_remove(struct virtio_device *vdev)
e467cde2
RR
862{
863 struct virtio_blk *vblk = vdev->priv;
5087a50e 864 int index = vblk->index;
f4953fe6 865 int refc;
e467cde2 866
4678d6f9
MT
867 /* Prevent config work handler from accessing the device. */
868 mutex_lock(&vblk->config_lock);
869 vblk->config_enable = false;
870 mutex_unlock(&vblk->config_lock);
7a7c924c 871
02e2b124 872 del_gendisk(vblk->disk);
483001c7 873 blk_cleanup_queue(vblk->disk->queue);
02e2b124 874
6e5aa7ef
RR
875 /* Stop all the virtqueues. */
876 vdev->config->reset(vdev);
877
4678d6f9
MT
878 flush_work(&vblk->config_work);
879
f4953fe6 880 refc = atomic_read(&disk_to_dev(vblk->disk)->kobj.kref.refcount);
e467cde2 881 put_disk(vblk->disk);
e467cde2 882 mempool_destroy(vblk->pool);
d2a7ddda 883 vdev->config->del_vqs(vdev);
e467cde2 884 kfree(vblk);
f4953fe6
AG
885
886 /* Only free device id if we don't have any users */
887 if (refc == 1)
888 ida_simple_remove(&vd_index_ida, index);
e467cde2
RR
889}
890
89107000 891#ifdef CONFIG_PM_SLEEP
f8fb5bc2
AS
892static int virtblk_freeze(struct virtio_device *vdev)
893{
894 struct virtio_blk *vblk = vdev->priv;
895
896 /* Ensure we don't receive any more interrupts */
897 vdev->config->reset(vdev);
898
899 /* Prevent config work handler from accessing the device. */
900 mutex_lock(&vblk->config_lock);
901 vblk->config_enable = false;
902 mutex_unlock(&vblk->config_lock);
903
904 flush_work(&vblk->config_work);
905
906 spin_lock_irq(vblk->disk->queue->queue_lock);
907 blk_stop_queue(vblk->disk->queue);
908 spin_unlock_irq(vblk->disk->queue->queue_lock);
909 blk_sync_queue(vblk->disk->queue);
910
911 vdev->config->del_vqs(vdev);
912 return 0;
913}
914
915static int virtblk_restore(struct virtio_device *vdev)
916{
917 struct virtio_blk *vblk = vdev->priv;
918 int ret;
919
920 vblk->config_enable = true;
921 ret = init_vq(vdev->priv);
922 if (!ret) {
923 spin_lock_irq(vblk->disk->queue->queue_lock);
924 blk_start_queue(vblk->disk->queue);
925 spin_unlock_irq(vblk->disk->queue->queue_lock);
926 }
927 return ret;
928}
929#endif
930
47483e25 931static const struct virtio_device_id id_table[] = {
e467cde2
RR
932 { VIRTIO_ID_BLOCK, VIRTIO_DEV_ANY_ID },
933 { 0 },
934};
935
c45a6816 936static unsigned int features[] = {
02c42b7a
TH
937 VIRTIO_BLK_F_SEG_MAX, VIRTIO_BLK_F_SIZE_MAX, VIRTIO_BLK_F_GEOMETRY,
938 VIRTIO_BLK_F_RO, VIRTIO_BLK_F_BLK_SIZE, VIRTIO_BLK_F_SCSI,
cd5d5038 939 VIRTIO_BLK_F_WCE, VIRTIO_BLK_F_TOPOLOGY, VIRTIO_BLK_F_CONFIG_WCE
c45a6816
RR
940};
941
8d85fce7 942static struct virtio_driver virtio_blk = {
7a7c924c
CH
943 .feature_table = features,
944 .feature_table_size = ARRAY_SIZE(features),
945 .driver.name = KBUILD_MODNAME,
946 .driver.owner = THIS_MODULE,
947 .id_table = id_table,
948 .probe = virtblk_probe,
8d85fce7 949 .remove = virtblk_remove,
7a7c924c 950 .config_changed = virtblk_config_changed,
89107000 951#ifdef CONFIG_PM_SLEEP
f8fb5bc2
AS
952 .freeze = virtblk_freeze,
953 .restore = virtblk_restore,
954#endif
e467cde2
RR
955};
956
957static int __init init(void)
958{
7a7c924c
CH
959 int error;
960
961 virtblk_wq = alloc_workqueue("virtio-blk", 0, 0);
962 if (!virtblk_wq)
963 return -ENOMEM;
964
4f3bf19c 965 major = register_blkdev(0, "virtblk");
7a7c924c
CH
966 if (major < 0) {
967 error = major;
968 goto out_destroy_workqueue;
969 }
970
971 error = register_virtio_driver(&virtio_blk);
972 if (error)
973 goto out_unregister_blkdev;
974 return 0;
975
976out_unregister_blkdev:
977 unregister_blkdev(major, "virtblk");
978out_destroy_workqueue:
979 destroy_workqueue(virtblk_wq);
980 return error;
e467cde2
RR
981}
982
983static void __exit fini(void)
984{
4f3bf19c 985 unregister_blkdev(major, "virtblk");
e467cde2 986 unregister_virtio_driver(&virtio_blk);
7a7c924c 987 destroy_workqueue(virtblk_wq);
e467cde2
RR
988}
989module_init(init);
990module_exit(fini);
991
992MODULE_DEVICE_TABLE(virtio, id_table);
993MODULE_DESCRIPTION("Virtio block driver");
994MODULE_LICENSE("GPL");