root / hw / virtio-blk.c @ b0cd712c
History | View | Annotate | Download (14.7 kB)
1 | 6e02c38d | aliguori | /*
|
---|---|---|---|
2 | 6e02c38d | aliguori | * Virtio Block Device
|
3 | 6e02c38d | aliguori | *
|
4 | 6e02c38d | aliguori | * Copyright IBM, Corp. 2007
|
5 | 6e02c38d | aliguori | *
|
6 | 6e02c38d | aliguori | * Authors:
|
7 | 6e02c38d | aliguori | * Anthony Liguori <aliguori@us.ibm.com>
|
8 | 6e02c38d | aliguori | *
|
9 | 6e02c38d | aliguori | * This work is licensed under the terms of the GNU GPL, version 2. See
|
10 | 6e02c38d | aliguori | * the COPYING file in the top-level directory.
|
11 | 6e02c38d | aliguori | *
|
12 | 6e02c38d | aliguori | */
|
13 | 6e02c38d | aliguori | |
14 | 869a5c6d | aliguori | #include <qemu-common.h> |
15 | d75d25e3 | Markus Armbruster | #include "qemu-error.h" |
16 | 6d519a5f | Stefan Hajnoczi | #include "trace.h" |
17 | 2446333c | Blue Swirl | #include "blockdev.h" |
18 | 6e02c38d | aliguori | #include "virtio-blk.h" |
19 | 1063b8b1 | Christoph Hellwig | #ifdef __linux__
|
20 | 1063b8b1 | Christoph Hellwig | # include <scsi/sg.h> |
21 | 1063b8b1 | Christoph Hellwig | #endif
|
22 | 6e02c38d | aliguori | |
23 | 6e02c38d | aliguori | typedef struct VirtIOBlock |
24 | 6e02c38d | aliguori | { |
25 | 6e02c38d | aliguori | VirtIODevice vdev; |
26 | 6e02c38d | aliguori | BlockDriverState *bs; |
27 | 6e02c38d | aliguori | VirtQueue *vq; |
28 | 869a5c6d | aliguori | void *rq;
|
29 | 213189ab | Markus Armbruster | QEMUBH *bh; |
30 | 9752c371 | Christoph Hellwig | BlockConf *conf; |
31 | 8cfacf07 | Christoph Hellwig | unsigned short sector_mask; |
32 | 2930b313 | john cooper | char sn[BLOCK_SERIAL_STRLEN];
|
33 | 9d0d3138 | Alex Williamson | DeviceState *qdev; |
34 | 6e02c38d | aliguori | } VirtIOBlock; |
35 | 6e02c38d | aliguori | |
36 | 6e02c38d | aliguori | static VirtIOBlock *to_virtio_blk(VirtIODevice *vdev)
|
37 | 6e02c38d | aliguori | { |
38 | 6e02c38d | aliguori | return (VirtIOBlock *)vdev;
|
39 | 6e02c38d | aliguori | } |
40 | 6e02c38d | aliguori | |
41 | 6e02c38d | aliguori | typedef struct VirtIOBlockReq |
42 | 6e02c38d | aliguori | { |
43 | 6e02c38d | aliguori | VirtIOBlock *dev; |
44 | 6e02c38d | aliguori | VirtQueueElement elem; |
45 | 6e02c38d | aliguori | struct virtio_blk_inhdr *in;
|
46 | 6e02c38d | aliguori | struct virtio_blk_outhdr *out;
|
47 | 1063b8b1 | Christoph Hellwig | struct virtio_scsi_inhdr *scsi;
|
48 | d28a1b6e | aliguori | QEMUIOVector qiov; |
49 | 869a5c6d | aliguori | struct VirtIOBlockReq *next;
|
50 | 6e02c38d | aliguori | } VirtIOBlockReq; |
51 | 6e02c38d | aliguori | |
52 | 869a5c6d | aliguori | static void virtio_blk_req_complete(VirtIOBlockReq *req, int status) |
53 | 869a5c6d | aliguori | { |
54 | 869a5c6d | aliguori | VirtIOBlock *s = req->dev; |
55 | 869a5c6d | aliguori | |
56 | 6d519a5f | Stefan Hajnoczi | trace_virtio_blk_req_complete(req, status); |
57 | 6d519a5f | Stefan Hajnoczi | |
58 | 869a5c6d | aliguori | req->in->status = status; |
59 | d28a1b6e | aliguori | virtqueue_push(s->vq, &req->elem, req->qiov.size + sizeof(*req->in));
|
60 | 869a5c6d | aliguori | virtio_notify(&s->vdev, s->vq); |
61 | 869a5c6d | aliguori | |
62 | 869a5c6d | aliguori | qemu_free(req); |
63 | 869a5c6d | aliguori | } |
64 | 869a5c6d | aliguori | |
65 | f35d68f0 | Kevin Wolf | static int virtio_blk_handle_rw_error(VirtIOBlockReq *req, int error, |
66 | f35d68f0 | Kevin Wolf | int is_read)
|
67 | 869a5c6d | aliguori | { |
68 | abd7f68d | Markus Armbruster | BlockErrorAction action = bdrv_get_on_error(req->dev->bs, is_read); |
69 | 869a5c6d | aliguori | VirtIOBlock *s = req->dev; |
70 | 869a5c6d | aliguori | |
71 | eaa6c85f | Luiz Capitulino | if (action == BLOCK_ERR_IGNORE) {
|
72 | 908bb949 | Kevin Wolf | bdrv_mon_event(s->bs, BDRV_ACTION_IGNORE, is_read); |
73 | 869a5c6d | aliguori | return 0; |
74 | eaa6c85f | Luiz Capitulino | } |
75 | 869a5c6d | aliguori | |
76 | 869a5c6d | aliguori | if ((error == ENOSPC && action == BLOCK_ERR_STOP_ENOSPC)
|
77 | 869a5c6d | aliguori | || action == BLOCK_ERR_STOP_ANY) { |
78 | 869a5c6d | aliguori | req->next = s->rq; |
79 | 869a5c6d | aliguori | s->rq = req; |
80 | 908bb949 | Kevin Wolf | bdrv_mon_event(s->bs, BDRV_ACTION_STOP, is_read); |
81 | 554a310b | Luiz Capitulino | vm_stop(0);
|
82 | 869a5c6d | aliguori | } else {
|
83 | 869a5c6d | aliguori | virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); |
84 | 908bb949 | Kevin Wolf | bdrv_mon_event(s->bs, BDRV_ACTION_REPORT, is_read); |
85 | 869a5c6d | aliguori | } |
86 | 869a5c6d | aliguori | |
87 | 869a5c6d | aliguori | return 1; |
88 | 869a5c6d | aliguori | } |
89 | 869a5c6d | aliguori | |
90 | 6e02c38d | aliguori | static void virtio_blk_rw_complete(void *opaque, int ret) |
91 | 6e02c38d | aliguori | { |
92 | 6e02c38d | aliguori | VirtIOBlockReq *req = opaque; |
93 | 6e02c38d | aliguori | |
94 | 6d519a5f | Stefan Hajnoczi | trace_virtio_blk_rw_complete(req, ret); |
95 | 6d519a5f | Stefan Hajnoczi | |
96 | f35d68f0 | Kevin Wolf | if (ret) {
|
97 | f35d68f0 | Kevin Wolf | int is_read = !(req->out->type & VIRTIO_BLK_T_OUT);
|
98 | f35d68f0 | Kevin Wolf | if (virtio_blk_handle_rw_error(req, -ret, is_read))
|
99 | 869a5c6d | aliguori | return;
|
100 | 6e02c38d | aliguori | } |
101 | 6e02c38d | aliguori | |
102 | f35d68f0 | Kevin Wolf | virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); |
103 | 869a5c6d | aliguori | } |
104 | 6e02c38d | aliguori | |
105 | aa659be3 | Christoph Hellwig | static void virtio_blk_flush_complete(void *opaque, int ret) |
106 | aa659be3 | Christoph Hellwig | { |
107 | aa659be3 | Christoph Hellwig | VirtIOBlockReq *req = opaque; |
108 | aa659be3 | Christoph Hellwig | |
109 | aa659be3 | Christoph Hellwig | virtio_blk_req_complete(req, ret ? VIRTIO_BLK_S_IOERR : VIRTIO_BLK_S_OK); |
110 | aa659be3 | Christoph Hellwig | } |
111 | aa659be3 | Christoph Hellwig | |
112 | 869a5c6d | aliguori | static VirtIOBlockReq *virtio_blk_alloc_request(VirtIOBlock *s)
|
113 | 869a5c6d | aliguori | { |
114 | de6c8042 | Stefan Hajnoczi | VirtIOBlockReq *req = qemu_malloc(sizeof(*req));
|
115 | 487414f1 | aliguori | req->dev = s; |
116 | de6c8042 | Stefan Hajnoczi | req->qiov.size = 0;
|
117 | de6c8042 | Stefan Hajnoczi | req->next = NULL;
|
118 | 869a5c6d | aliguori | return req;
|
119 | 6e02c38d | aliguori | } |
120 | 6e02c38d | aliguori | |
121 | 6e02c38d | aliguori | static VirtIOBlockReq *virtio_blk_get_request(VirtIOBlock *s)
|
122 | 6e02c38d | aliguori | { |
123 | 869a5c6d | aliguori | VirtIOBlockReq *req = virtio_blk_alloc_request(s); |
124 | 6e02c38d | aliguori | |
125 | 869a5c6d | aliguori | if (req != NULL) { |
126 | 869a5c6d | aliguori | if (!virtqueue_pop(s->vq, &req->elem)) {
|
127 | 869a5c6d | aliguori | qemu_free(req); |
128 | 869a5c6d | aliguori | return NULL; |
129 | 869a5c6d | aliguori | } |
130 | 6e02c38d | aliguori | } |
131 | 6e02c38d | aliguori | |
132 | 6e02c38d | aliguori | return req;
|
133 | 6e02c38d | aliguori | } |
134 | 6e02c38d | aliguori | |
135 | 1063b8b1 | Christoph Hellwig | #ifdef __linux__
|
136 | 1063b8b1 | Christoph Hellwig | static void virtio_blk_handle_scsi(VirtIOBlockReq *req) |
137 | 1063b8b1 | Christoph Hellwig | { |
138 | 1063b8b1 | Christoph Hellwig | struct sg_io_hdr hdr;
|
139 | 4277906d | Christoph Hellwig | int ret;
|
140 | 1063b8b1 | Christoph Hellwig | int status;
|
141 | 1063b8b1 | Christoph Hellwig | int i;
|
142 | 1063b8b1 | Christoph Hellwig | |
143 | 1063b8b1 | Christoph Hellwig | /*
|
144 | 1063b8b1 | Christoph Hellwig | * We require at least one output segment each for the virtio_blk_outhdr
|
145 | 1063b8b1 | Christoph Hellwig | * and the SCSI command block.
|
146 | 1063b8b1 | Christoph Hellwig | *
|
147 | 1063b8b1 | Christoph Hellwig | * We also at least require the virtio_blk_inhdr, the virtio_scsi_inhdr
|
148 | 1063b8b1 | Christoph Hellwig | * and the sense buffer pointer in the input segments.
|
149 | 1063b8b1 | Christoph Hellwig | */
|
150 | 1063b8b1 | Christoph Hellwig | if (req->elem.out_num < 2 || req->elem.in_num < 3) { |
151 | 1063b8b1 | Christoph Hellwig | virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); |
152 | 1063b8b1 | Christoph Hellwig | return;
|
153 | 1063b8b1 | Christoph Hellwig | } |
154 | 1063b8b1 | Christoph Hellwig | |
155 | 1063b8b1 | Christoph Hellwig | /*
|
156 | 1063b8b1 | Christoph Hellwig | * No support for bidirection commands yet.
|
157 | 1063b8b1 | Christoph Hellwig | */
|
158 | 1063b8b1 | Christoph Hellwig | if (req->elem.out_num > 2 && req->elem.in_num > 3) { |
159 | 1063b8b1 | Christoph Hellwig | virtio_blk_req_complete(req, VIRTIO_BLK_S_UNSUPP); |
160 | 1063b8b1 | Christoph Hellwig | return;
|
161 | 1063b8b1 | Christoph Hellwig | } |
162 | 1063b8b1 | Christoph Hellwig | |
163 | 1063b8b1 | Christoph Hellwig | /*
|
164 | 1063b8b1 | Christoph Hellwig | * The scsi inhdr is placed in the second-to-last input segment, just
|
165 | 1063b8b1 | Christoph Hellwig | * before the regular inhdr.
|
166 | 1063b8b1 | Christoph Hellwig | */
|
167 | 1063b8b1 | Christoph Hellwig | req->scsi = (void *)req->elem.in_sg[req->elem.in_num - 2].iov_base; |
168 | 1063b8b1 | Christoph Hellwig | |
169 | 1063b8b1 | Christoph Hellwig | memset(&hdr, 0, sizeof(struct sg_io_hdr)); |
170 | 1063b8b1 | Christoph Hellwig | hdr.interface_id = 'S';
|
171 | 1063b8b1 | Christoph Hellwig | hdr.cmd_len = req->elem.out_sg[1].iov_len;
|
172 | 1063b8b1 | Christoph Hellwig | hdr.cmdp = req->elem.out_sg[1].iov_base;
|
173 | 1063b8b1 | Christoph Hellwig | hdr.dxfer_len = 0;
|
174 | 1063b8b1 | Christoph Hellwig | |
175 | 1063b8b1 | Christoph Hellwig | if (req->elem.out_num > 2) { |
176 | 1063b8b1 | Christoph Hellwig | /*
|
177 | 1063b8b1 | Christoph Hellwig | * If there are more than the minimally required 2 output segments
|
178 | 1063b8b1 | Christoph Hellwig | * there is write payload starting from the third iovec.
|
179 | 1063b8b1 | Christoph Hellwig | */
|
180 | 1063b8b1 | Christoph Hellwig | hdr.dxfer_direction = SG_DXFER_TO_DEV; |
181 | 1063b8b1 | Christoph Hellwig | hdr.iovec_count = req->elem.out_num - 2;
|
182 | 1063b8b1 | Christoph Hellwig | |
183 | 1063b8b1 | Christoph Hellwig | for (i = 0; i < hdr.iovec_count; i++) |
184 | 1063b8b1 | Christoph Hellwig | hdr.dxfer_len += req->elem.out_sg[i + 2].iov_len;
|
185 | 1063b8b1 | Christoph Hellwig | |
186 | 1063b8b1 | Christoph Hellwig | hdr.dxferp = req->elem.out_sg + 2;
|
187 | 1063b8b1 | Christoph Hellwig | |
188 | 1063b8b1 | Christoph Hellwig | } else if (req->elem.in_num > 3) { |
189 | 1063b8b1 | Christoph Hellwig | /*
|
190 | 1063b8b1 | Christoph Hellwig | * If we have more than 3 input segments the guest wants to actually
|
191 | 1063b8b1 | Christoph Hellwig | * read data.
|
192 | 1063b8b1 | Christoph Hellwig | */
|
193 | 1063b8b1 | Christoph Hellwig | hdr.dxfer_direction = SG_DXFER_FROM_DEV; |
194 | 1063b8b1 | Christoph Hellwig | hdr.iovec_count = req->elem.in_num - 3;
|
195 | 1063b8b1 | Christoph Hellwig | for (i = 0; i < hdr.iovec_count; i++) |
196 | 1063b8b1 | Christoph Hellwig | hdr.dxfer_len += req->elem.in_sg[i].iov_len; |
197 | 1063b8b1 | Christoph Hellwig | |
198 | 1063b8b1 | Christoph Hellwig | hdr.dxferp = req->elem.in_sg; |
199 | 1063b8b1 | Christoph Hellwig | } else {
|
200 | 1063b8b1 | Christoph Hellwig | /*
|
201 | 1063b8b1 | Christoph Hellwig | * Some SCSI commands don't actually transfer any data.
|
202 | 1063b8b1 | Christoph Hellwig | */
|
203 | 1063b8b1 | Christoph Hellwig | hdr.dxfer_direction = SG_DXFER_NONE; |
204 | 1063b8b1 | Christoph Hellwig | } |
205 | 1063b8b1 | Christoph Hellwig | |
206 | 1063b8b1 | Christoph Hellwig | hdr.sbp = req->elem.in_sg[req->elem.in_num - 3].iov_base;
|
207 | 1063b8b1 | Christoph Hellwig | hdr.mx_sb_len = req->elem.in_sg[req->elem.in_num - 3].iov_len;
|
208 | 1063b8b1 | Christoph Hellwig | |
209 | 1063b8b1 | Christoph Hellwig | ret = bdrv_ioctl(req->dev->bs, SG_IO, &hdr); |
210 | 1063b8b1 | Christoph Hellwig | if (ret) {
|
211 | 1063b8b1 | Christoph Hellwig | status = VIRTIO_BLK_S_UNSUPP; |
212 | 1063b8b1 | Christoph Hellwig | hdr.status = ret; |
213 | 1063b8b1 | Christoph Hellwig | hdr.resid = hdr.dxfer_len; |
214 | 1063b8b1 | Christoph Hellwig | } else if (hdr.status) { |
215 | 1063b8b1 | Christoph Hellwig | status = VIRTIO_BLK_S_IOERR; |
216 | 1063b8b1 | Christoph Hellwig | } else {
|
217 | 1063b8b1 | Christoph Hellwig | status = VIRTIO_BLK_S_OK; |
218 | 1063b8b1 | Christoph Hellwig | } |
219 | 1063b8b1 | Christoph Hellwig | |
220 | 1063b8b1 | Christoph Hellwig | req->scsi->errors = hdr.status; |
221 | 1063b8b1 | Christoph Hellwig | req->scsi->residual = hdr.resid; |
222 | 1063b8b1 | Christoph Hellwig | req->scsi->sense_len = hdr.sb_len_wr; |
223 | 1063b8b1 | Christoph Hellwig | req->scsi->data_len = hdr.dxfer_len; |
224 | 1063b8b1 | Christoph Hellwig | |
225 | 1063b8b1 | Christoph Hellwig | virtio_blk_req_complete(req, status); |
226 | 1063b8b1 | Christoph Hellwig | } |
227 | 1063b8b1 | Christoph Hellwig | #else
|
228 | 1063b8b1 | Christoph Hellwig | static void virtio_blk_handle_scsi(VirtIOBlockReq *req) |
229 | 1063b8b1 | Christoph Hellwig | { |
230 | 1063b8b1 | Christoph Hellwig | virtio_blk_req_complete(req, VIRTIO_BLK_S_UNSUPP); |
231 | 1063b8b1 | Christoph Hellwig | } |
232 | 1063b8b1 | Christoph Hellwig | #endif /* __linux__ */ |
233 | 1063b8b1 | Christoph Hellwig | |
234 | c20fd872 | Christoph Hellwig | typedef struct MultiReqBuffer { |
235 | c20fd872 | Christoph Hellwig | BlockRequest blkreq[32];
|
236 | c20fd872 | Christoph Hellwig | unsigned int num_writes; |
237 | c20fd872 | Christoph Hellwig | } MultiReqBuffer; |
238 | c20fd872 | Christoph Hellwig | |
239 | c20fd872 | Christoph Hellwig | static void virtio_submit_multiwrite(BlockDriverState *bs, MultiReqBuffer *mrb) |
240 | 869a5c6d | aliguori | { |
241 | 91553dcc | Kevin Wolf | int i, ret;
|
242 | 91553dcc | Kevin Wolf | |
243 | c20fd872 | Christoph Hellwig | if (!mrb->num_writes) {
|
244 | c20fd872 | Christoph Hellwig | return;
|
245 | c20fd872 | Christoph Hellwig | } |
246 | c20fd872 | Christoph Hellwig | |
247 | c20fd872 | Christoph Hellwig | ret = bdrv_aio_multiwrite(bs, mrb->blkreq, mrb->num_writes); |
248 | 91553dcc | Kevin Wolf | if (ret != 0) { |
249 | c20fd872 | Christoph Hellwig | for (i = 0; i < mrb->num_writes; i++) { |
250 | c20fd872 | Christoph Hellwig | if (mrb->blkreq[i].error) {
|
251 | c20fd872 | Christoph Hellwig | virtio_blk_rw_complete(mrb->blkreq[i].opaque, -EIO); |
252 | 91553dcc | Kevin Wolf | } |
253 | 91553dcc | Kevin Wolf | } |
254 | 91553dcc | Kevin Wolf | } |
255 | c20fd872 | Christoph Hellwig | |
256 | c20fd872 | Christoph Hellwig | mrb->num_writes = 0;
|
257 | 91553dcc | Kevin Wolf | } |
258 | 87b245db | Christoph Hellwig | |
259 | c20fd872 | Christoph Hellwig | static void virtio_blk_handle_flush(VirtIOBlockReq *req, MultiReqBuffer *mrb) |
260 | aa659be3 | Christoph Hellwig | { |
261 | aa659be3 | Christoph Hellwig | BlockDriverAIOCB *acb; |
262 | aa659be3 | Christoph Hellwig | |
263 | 618fbb84 | Christoph Hellwig | /*
|
264 | 618fbb84 | Christoph Hellwig | * Make sure all outstanding writes are posted to the backing device.
|
265 | 618fbb84 | Christoph Hellwig | */
|
266 | c20fd872 | Christoph Hellwig | virtio_submit_multiwrite(req->dev->bs, mrb); |
267 | 618fbb84 | Christoph Hellwig | |
268 | aa659be3 | Christoph Hellwig | acb = bdrv_aio_flush(req->dev->bs, virtio_blk_flush_complete, req); |
269 | aa659be3 | Christoph Hellwig | if (!acb) {
|
270 | aa659be3 | Christoph Hellwig | virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); |
271 | aa659be3 | Christoph Hellwig | } |
272 | aa659be3 | Christoph Hellwig | } |
273 | aa659be3 | Christoph Hellwig | |
274 | c20fd872 | Christoph Hellwig | static void virtio_blk_handle_write(VirtIOBlockReq *req, MultiReqBuffer *mrb) |
275 | 91553dcc | Kevin Wolf | { |
276 | c20fd872 | Christoph Hellwig | BlockRequest *blkreq; |
277 | c20fd872 | Christoph Hellwig | |
278 | 6d519a5f | Stefan Hajnoczi | trace_virtio_blk_handle_write(req, req->out->sector, req->qiov.size / 512);
|
279 | 6d519a5f | Stefan Hajnoczi | |
280 | 8cfacf07 | Christoph Hellwig | if (req->out->sector & req->dev->sector_mask) {
|
281 | 8cfacf07 | Christoph Hellwig | virtio_blk_rw_complete(req, -EIO); |
282 | 8cfacf07 | Christoph Hellwig | return;
|
283 | 8cfacf07 | Christoph Hellwig | } |
284 | 8cfacf07 | Christoph Hellwig | |
285 | c20fd872 | Christoph Hellwig | if (mrb->num_writes == 32) { |
286 | c20fd872 | Christoph Hellwig | virtio_submit_multiwrite(req->dev->bs, mrb); |
287 | 87b245db | Christoph Hellwig | } |
288 | 91553dcc | Kevin Wolf | |
289 | c20fd872 | Christoph Hellwig | blkreq = &mrb->blkreq[mrb->num_writes]; |
290 | c20fd872 | Christoph Hellwig | blkreq->sector = req->out->sector; |
291 | c20fd872 | Christoph Hellwig | blkreq->nb_sectors = req->qiov.size / BDRV_SECTOR_SIZE; |
292 | c20fd872 | Christoph Hellwig | blkreq->qiov = &req->qiov; |
293 | c20fd872 | Christoph Hellwig | blkreq->cb = virtio_blk_rw_complete; |
294 | c20fd872 | Christoph Hellwig | blkreq->opaque = req; |
295 | c20fd872 | Christoph Hellwig | blkreq->error = 0;
|
296 | 91553dcc | Kevin Wolf | |
297 | c20fd872 | Christoph Hellwig | mrb->num_writes++; |
298 | d28a1b6e | aliguori | } |
299 | 869a5c6d | aliguori | |
300 | d28a1b6e | aliguori | static void virtio_blk_handle_read(VirtIOBlockReq *req) |
301 | d28a1b6e | aliguori | { |
302 | 87b245db | Christoph Hellwig | BlockDriverAIOCB *acb; |
303 | 87b245db | Christoph Hellwig | |
304 | 8cfacf07 | Christoph Hellwig | if (req->out->sector & req->dev->sector_mask) {
|
305 | 8cfacf07 | Christoph Hellwig | virtio_blk_rw_complete(req, -EIO); |
306 | 8cfacf07 | Christoph Hellwig | return;
|
307 | 8cfacf07 | Christoph Hellwig | } |
308 | 8cfacf07 | Christoph Hellwig | |
309 | 87b245db | Christoph Hellwig | acb = bdrv_aio_readv(req->dev->bs, req->out->sector, &req->qiov, |
310 | 1573a35d | Jes Sorensen | req->qiov.size / BDRV_SECTOR_SIZE, |
311 | 1573a35d | Jes Sorensen | virtio_blk_rw_complete, req); |
312 | 87b245db | Christoph Hellwig | if (!acb) {
|
313 | 6c510fbf | Kevin Wolf | virtio_blk_rw_complete(req, -EIO); |
314 | 87b245db | Christoph Hellwig | } |
315 | 869a5c6d | aliguori | } |
316 | 869a5c6d | aliguori | |
317 | bc6694d4 | Kevin Wolf | static void virtio_blk_handle_request(VirtIOBlockReq *req, |
318 | bc6694d4 | Kevin Wolf | MultiReqBuffer *mrb) |
319 | bc6694d4 | Kevin Wolf | { |
320 | bc6694d4 | Kevin Wolf | if (req->elem.out_num < 1 || req->elem.in_num < 1) { |
321 | bc6694d4 | Kevin Wolf | fprintf(stderr, "virtio-blk missing headers\n");
|
322 | bc6694d4 | Kevin Wolf | exit(1);
|
323 | bc6694d4 | Kevin Wolf | } |
324 | bc6694d4 | Kevin Wolf | |
325 | bc6694d4 | Kevin Wolf | if (req->elem.out_sg[0].iov_len < sizeof(*req->out) || |
326 | bc6694d4 | Kevin Wolf | req->elem.in_sg[req->elem.in_num - 1].iov_len < sizeof(*req->in)) { |
327 | bc6694d4 | Kevin Wolf | fprintf(stderr, "virtio-blk header not in correct element\n");
|
328 | bc6694d4 | Kevin Wolf | exit(1);
|
329 | bc6694d4 | Kevin Wolf | } |
330 | bc6694d4 | Kevin Wolf | |
331 | bc6694d4 | Kevin Wolf | req->out = (void *)req->elem.out_sg[0].iov_base; |
332 | bc6694d4 | Kevin Wolf | req->in = (void *)req->elem.in_sg[req->elem.in_num - 1].iov_base; |
333 | bc6694d4 | Kevin Wolf | |
334 | bc6694d4 | Kevin Wolf | if (req->out->type & VIRTIO_BLK_T_FLUSH) {
|
335 | c20fd872 | Christoph Hellwig | virtio_blk_handle_flush(req, mrb); |
336 | bc6694d4 | Kevin Wolf | } else if (req->out->type & VIRTIO_BLK_T_SCSI_CMD) { |
337 | bc6694d4 | Kevin Wolf | virtio_blk_handle_scsi(req); |
338 | 2930b313 | john cooper | } else if (req->out->type & VIRTIO_BLK_T_GET_ID) { |
339 | 2930b313 | john cooper | VirtIOBlock *s = req->dev; |
340 | 2930b313 | john cooper | |
341 | 2930b313 | john cooper | memcpy(req->elem.in_sg[0].iov_base, s->sn,
|
342 | 2930b313 | john cooper | MIN(req->elem.in_sg[0].iov_len, sizeof(s->sn))); |
343 | 2930b313 | john cooper | virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); |
344 | bc6694d4 | Kevin Wolf | } else if (req->out->type & VIRTIO_BLK_T_OUT) { |
345 | bc6694d4 | Kevin Wolf | qemu_iovec_init_external(&req->qiov, &req->elem.out_sg[1],
|
346 | bc6694d4 | Kevin Wolf | req->elem.out_num - 1);
|
347 | c20fd872 | Christoph Hellwig | virtio_blk_handle_write(req, mrb); |
348 | bc6694d4 | Kevin Wolf | } else {
|
349 | bc6694d4 | Kevin Wolf | qemu_iovec_init_external(&req->qiov, &req->elem.in_sg[0],
|
350 | bc6694d4 | Kevin Wolf | req->elem.in_num - 1);
|
351 | bc6694d4 | Kevin Wolf | virtio_blk_handle_read(req); |
352 | bc6694d4 | Kevin Wolf | } |
353 | bc6694d4 | Kevin Wolf | } |
354 | bc6694d4 | Kevin Wolf | |
355 | 6e02c38d | aliguori | static void virtio_blk_handle_output(VirtIODevice *vdev, VirtQueue *vq) |
356 | 6e02c38d | aliguori | { |
357 | 6e02c38d | aliguori | VirtIOBlock *s = to_virtio_blk(vdev); |
358 | 6e02c38d | aliguori | VirtIOBlockReq *req; |
359 | bc6694d4 | Kevin Wolf | MultiReqBuffer mrb = { |
360 | bc6694d4 | Kevin Wolf | .num_writes = 0,
|
361 | bc6694d4 | Kevin Wolf | }; |
362 | 6e02c38d | aliguori | |
363 | 6e02c38d | aliguori | while ((req = virtio_blk_get_request(s))) {
|
364 | bc6694d4 | Kevin Wolf | virtio_blk_handle_request(req, &mrb); |
365 | 6e02c38d | aliguori | } |
366 | 91553dcc | Kevin Wolf | |
367 | c20fd872 | Christoph Hellwig | virtio_submit_multiwrite(s->bs, &mrb); |
368 | 91553dcc | Kevin Wolf | |
369 | 6e02c38d | aliguori | /*
|
370 | 6e02c38d | aliguori | * FIXME: Want to check for completions before returning to guest mode,
|
371 | 6e02c38d | aliguori | * so cached reads and writes are reported as quickly as possible. But
|
372 | 6e02c38d | aliguori | * that should be done in the generic block layer.
|
373 | 6e02c38d | aliguori | */
|
374 | 6e02c38d | aliguori | } |
375 | 6e02c38d | aliguori | |
376 | 213189ab | Markus Armbruster | static void virtio_blk_dma_restart_bh(void *opaque) |
377 | 869a5c6d | aliguori | { |
378 | 869a5c6d | aliguori | VirtIOBlock *s = opaque; |
379 | 869a5c6d | aliguori | VirtIOBlockReq *req = s->rq; |
380 | f1b52868 | Kevin Wolf | MultiReqBuffer mrb = { |
381 | f1b52868 | Kevin Wolf | .num_writes = 0,
|
382 | f1b52868 | Kevin Wolf | }; |
383 | 869a5c6d | aliguori | |
384 | 213189ab | Markus Armbruster | qemu_bh_delete(s->bh); |
385 | 213189ab | Markus Armbruster | s->bh = NULL;
|
386 | 869a5c6d | aliguori | |
387 | 869a5c6d | aliguori | s->rq = NULL;
|
388 | 869a5c6d | aliguori | |
389 | 869a5c6d | aliguori | while (req) {
|
390 | f1b52868 | Kevin Wolf | virtio_blk_handle_request(req, &mrb); |
391 | 869a5c6d | aliguori | req = req->next; |
392 | 869a5c6d | aliguori | } |
393 | f1b52868 | Kevin Wolf | |
394 | c20fd872 | Christoph Hellwig | virtio_submit_multiwrite(s->bs, &mrb); |
395 | 869a5c6d | aliguori | } |
396 | 869a5c6d | aliguori | |
397 | 213189ab | Markus Armbruster | static void virtio_blk_dma_restart_cb(void *opaque, int running, int reason) |
398 | 213189ab | Markus Armbruster | { |
399 | 213189ab | Markus Armbruster | VirtIOBlock *s = opaque; |
400 | 213189ab | Markus Armbruster | |
401 | 213189ab | Markus Armbruster | if (!running)
|
402 | 213189ab | Markus Armbruster | return;
|
403 | 213189ab | Markus Armbruster | |
404 | 213189ab | Markus Armbruster | if (!s->bh) {
|
405 | 213189ab | Markus Armbruster | s->bh = qemu_bh_new(virtio_blk_dma_restart_bh, s); |
406 | 213189ab | Markus Armbruster | qemu_bh_schedule(s->bh); |
407 | 213189ab | Markus Armbruster | } |
408 | 213189ab | Markus Armbruster | } |
409 | 213189ab | Markus Armbruster | |
410 | 6e02c38d | aliguori | static void virtio_blk_reset(VirtIODevice *vdev) |
411 | 6e02c38d | aliguori | { |
412 | 6e02c38d | aliguori | /*
|
413 | 6e02c38d | aliguori | * This should cancel pending requests, but can't do nicely until there
|
414 | 6e02c38d | aliguori | * are per-device request lists.
|
415 | 6e02c38d | aliguori | */
|
416 | 6e02c38d | aliguori | qemu_aio_flush(); |
417 | 6e02c38d | aliguori | } |
418 | 6e02c38d | aliguori | |
419 | bf011293 | john cooper | /* coalesce internal state, copy to pci i/o region 0
|
420 | bf011293 | john cooper | */
|
421 | 6e02c38d | aliguori | static void virtio_blk_update_config(VirtIODevice *vdev, uint8_t *config) |
422 | 6e02c38d | aliguori | { |
423 | 6e02c38d | aliguori | VirtIOBlock *s = to_virtio_blk(vdev); |
424 | 6e02c38d | aliguori | struct virtio_blk_config blkcfg;
|
425 | 6e02c38d | aliguori | uint64_t capacity; |
426 | 6e02c38d | aliguori | int cylinders, heads, secs;
|
427 | 6e02c38d | aliguori | |
428 | 6e02c38d | aliguori | bdrv_get_geometry(s->bs, &capacity); |
429 | 6e02c38d | aliguori | bdrv_get_geometry_hint(s->bs, &cylinders, &heads, &secs); |
430 | 5c5dafdc | Gerd Hoffmann | memset(&blkcfg, 0, sizeof(blkcfg)); |
431 | 6e02c38d | aliguori | stq_raw(&blkcfg.capacity, capacity); |
432 | 6e02c38d | aliguori | stl_raw(&blkcfg.seg_max, 128 - 2); |
433 | 6e02c38d | aliguori | stw_raw(&blkcfg.cylinders, cylinders); |
434 | 6e02c38d | aliguori | blkcfg.heads = heads; |
435 | 8cfacf07 | Christoph Hellwig | blkcfg.sectors = secs & ~s->sector_mask; |
436 | 8cfacf07 | Christoph Hellwig | blkcfg.blk_size = s->conf->logical_block_size; |
437 | c7085da7 | Blue Swirl | blkcfg.size_max = 0;
|
438 | 9752c371 | Christoph Hellwig | blkcfg.physical_block_exp = get_physical_block_exp(s->conf); |
439 | 9752c371 | Christoph Hellwig | blkcfg.alignment_offset = 0;
|
440 | 8cfacf07 | Christoph Hellwig | blkcfg.min_io_size = s->conf->min_io_size / blkcfg.blk_size; |
441 | 8cfacf07 | Christoph Hellwig | blkcfg.opt_io_size = s->conf->opt_io_size / blkcfg.blk_size; |
442 | 37d5ddd6 | hch@lst.de | memcpy(config, &blkcfg, sizeof(struct virtio_blk_config)); |
443 | 6e02c38d | aliguori | } |
444 | 6e02c38d | aliguori | |
445 | 8172539d | Michael S. Tsirkin | static uint32_t virtio_blk_get_features(VirtIODevice *vdev, uint32_t features)
|
446 | 6e02c38d | aliguori | { |
447 | bf011293 | john cooper | VirtIOBlock *s = to_virtio_blk(vdev); |
448 | 1063b8b1 | Christoph Hellwig | |
449 | 1063b8b1 | Christoph Hellwig | features |= (1 << VIRTIO_BLK_F_SEG_MAX);
|
450 | 1063b8b1 | Christoph Hellwig | features |= (1 << VIRTIO_BLK_F_GEOMETRY);
|
451 | 9752c371 | Christoph Hellwig | features |= (1 << VIRTIO_BLK_F_TOPOLOGY);
|
452 | 8cfacf07 | Christoph Hellwig | features |= (1 << VIRTIO_BLK_F_BLK_SIZE);
|
453 | aa659be3 | Christoph Hellwig | |
454 | aa659be3 | Christoph Hellwig | if (bdrv_enable_write_cache(s->bs))
|
455 | aa659be3 | Christoph Hellwig | features |= (1 << VIRTIO_BLK_F_WCACHE);
|
456 | c79662f7 | Naphtali Sprei | |
457 | c79662f7 | Naphtali Sprei | if (bdrv_is_read_only(s->bs))
|
458 | c79662f7 | Naphtali Sprei | features |= 1 << VIRTIO_BLK_F_RO;
|
459 | 1063b8b1 | Christoph Hellwig | |
460 | 1063b8b1 | Christoph Hellwig | return features;
|
461 | 6e02c38d | aliguori | } |
462 | 6e02c38d | aliguori | |
463 | 6e02c38d | aliguori | static void virtio_blk_save(QEMUFile *f, void *opaque) |
464 | 6e02c38d | aliguori | { |
465 | 6e02c38d | aliguori | VirtIOBlock *s = opaque; |
466 | 869a5c6d | aliguori | VirtIOBlockReq *req = s->rq; |
467 | 869a5c6d | aliguori | |
468 | 6e02c38d | aliguori | virtio_save(&s->vdev, f); |
469 | 869a5c6d | aliguori | |
470 | 869a5c6d | aliguori | while (req) {
|
471 | 869a5c6d | aliguori | qemu_put_sbyte(f, 1);
|
472 | 869a5c6d | aliguori | qemu_put_buffer(f, (unsigned char*)&req->elem, sizeof(req->elem)); |
473 | 869a5c6d | aliguori | req = req->next; |
474 | 869a5c6d | aliguori | } |
475 | 869a5c6d | aliguori | qemu_put_sbyte(f, 0);
|
476 | 6e02c38d | aliguori | } |
477 | 6e02c38d | aliguori | |
478 | 6e02c38d | aliguori | static int virtio_blk_load(QEMUFile *f, void *opaque, int version_id) |
479 | 6e02c38d | aliguori | { |
480 | 6e02c38d | aliguori | VirtIOBlock *s = opaque; |
481 | 6e02c38d | aliguori | |
482 | 869a5c6d | aliguori | if (version_id != 2) |
483 | 6e02c38d | aliguori | return -EINVAL;
|
484 | 6e02c38d | aliguori | |
485 | 6e02c38d | aliguori | virtio_load(&s->vdev, f); |
486 | 869a5c6d | aliguori | while (qemu_get_sbyte(f)) {
|
487 | 869a5c6d | aliguori | VirtIOBlockReq *req = virtio_blk_alloc_request(s); |
488 | 869a5c6d | aliguori | qemu_get_buffer(f, (unsigned char*)&req->elem, sizeof(req->elem)); |
489 | 869a5c6d | aliguori | req->next = s->rq; |
490 | 20a81e4d | Yoshiaki Tamura | s->rq = req; |
491 | b6a4805b | Kevin Wolf | |
492 | b6a4805b | Kevin Wolf | virtqueue_map_sg(req->elem.in_sg, req->elem.in_addr, |
493 | b6a4805b | Kevin Wolf | req->elem.in_num, 1);
|
494 | b6a4805b | Kevin Wolf | virtqueue_map_sg(req->elem.out_sg, req->elem.out_addr, |
495 | b6a4805b | Kevin Wolf | req->elem.out_num, 0);
|
496 | 869a5c6d | aliguori | } |
497 | 6e02c38d | aliguori | |
498 | 6e02c38d | aliguori | return 0; |
499 | 6e02c38d | aliguori | } |
500 | 6e02c38d | aliguori | |
501 | 428c149b | Christoph Hellwig | VirtIODevice *virtio_blk_init(DeviceState *dev, BlockConf *conf) |
502 | 6e02c38d | aliguori | { |
503 | 6e02c38d | aliguori | VirtIOBlock *s; |
504 | 6e02c38d | aliguori | int cylinders, heads, secs;
|
505 | 6e02c38d | aliguori | static int virtio_blk_id; |
506 | 2930b313 | john cooper | DriveInfo *dinfo; |
507 | cf21e106 | Paul Brook | |
508 | d75d25e3 | Markus Armbruster | if (!conf->bs) {
|
509 | d75d25e3 | Markus Armbruster | error_report("virtio-blk-pci: drive property not set");
|
510 | d75d25e3 | Markus Armbruster | return NULL; |
511 | d75d25e3 | Markus Armbruster | } |
512 | 98f28ad7 | Markus Armbruster | if (!bdrv_is_inserted(conf->bs)) {
|
513 | 98f28ad7 | Markus Armbruster | error_report("Device needs media, but drive is empty");
|
514 | 98f28ad7 | Markus Armbruster | return NULL; |
515 | 98f28ad7 | Markus Armbruster | } |
516 | d75d25e3 | Markus Armbruster | |
517 | 53c25cea | Paul Brook | s = (VirtIOBlock *)virtio_common_init("virtio-blk", VIRTIO_ID_BLOCK,
|
518 | 37d5ddd6 | hch@lst.de | sizeof(struct virtio_blk_config), |
519 | 53c25cea | Paul Brook | sizeof(VirtIOBlock));
|
520 | 6e02c38d | aliguori | |
521 | 6e02c38d | aliguori | s->vdev.get_config = virtio_blk_update_config; |
522 | 6e02c38d | aliguori | s->vdev.get_features = virtio_blk_get_features; |
523 | 6e02c38d | aliguori | s->vdev.reset = virtio_blk_reset; |
524 | f8b6cc00 | Markus Armbruster | s->bs = conf->bs; |
525 | 9752c371 | Christoph Hellwig | s->conf = conf; |
526 | 869a5c6d | aliguori | s->rq = NULL;
|
527 | 1573a35d | Jes Sorensen | s->sector_mask = (s->conf->logical_block_size / BDRV_SECTOR_SIZE) - 1;
|
528 | 6e02c38d | aliguori | bdrv_guess_geometry(s->bs, &cylinders, &heads, &secs); |
529 | 6e02c38d | aliguori | |
530 | 2930b313 | john cooper | /* NB: per existing s/n string convention the string is terminated
|
531 | 2930b313 | john cooper | * by '\0' only when less than sizeof (s->sn)
|
532 | 2930b313 | john cooper | */
|
533 | 2930b313 | john cooper | dinfo = drive_get_by_blockdev(s->bs); |
534 | 2930b313 | john cooper | strncpy(s->sn, dinfo->serial, sizeof (s->sn));
|
535 | 2930b313 | john cooper | |
536 | 6e02c38d | aliguori | s->vq = virtio_add_queue(&s->vdev, 128, virtio_blk_handle_output);
|
537 | 6e02c38d | aliguori | |
538 | 869a5c6d | aliguori | qemu_add_vm_change_state_handler(virtio_blk_dma_restart_cb, s); |
539 | 9d0d3138 | Alex Williamson | s->qdev = dev; |
540 | 0be71e32 | Alex Williamson | register_savevm(dev, "virtio-blk", virtio_blk_id++, 2, |
541 | 6e02c38d | aliguori | virtio_blk_save, virtio_blk_load, s); |
542 | 7d0d6950 | Markus Armbruster | bdrv_set_removable(s->bs, 0);
|
543 | 316a7af3 | Christoph Hellwig | s->bs->buffer_alignment = conf->logical_block_size; |
544 | 6e02c38d | aliguori | |
545 | 53c25cea | Paul Brook | return &s->vdev;
|
546 | 6e02c38d | aliguori | } |
547 | 9d0d3138 | Alex Williamson | |
548 | 9d0d3138 | Alex Williamson | void virtio_blk_exit(VirtIODevice *vdev)
|
549 | 9d0d3138 | Alex Williamson | { |
550 | 9d0d3138 | Alex Williamson | VirtIOBlock *s = to_virtio_blk(vdev); |
551 | 9d0d3138 | Alex Williamson | unregister_savevm(s->qdev, "virtio-blk", s);
|
552 | 9d0d3138 | Alex Williamson | } |