root / hw / virtio-blk.c @ 508240c0
History | View | Annotate | Download (15.2 kB)
1 | 6e02c38d | aliguori | /*
|
---|---|---|---|
2 | 6e02c38d | aliguori | * Virtio Block Device
|
3 | 6e02c38d | aliguori | *
|
4 | 6e02c38d | aliguori | * Copyright IBM, Corp. 2007
|
5 | 6e02c38d | aliguori | *
|
6 | 6e02c38d | aliguori | * Authors:
|
7 | 6e02c38d | aliguori | * Anthony Liguori <aliguori@us.ibm.com>
|
8 | 6e02c38d | aliguori | *
|
9 | 6e02c38d | aliguori | * This work is licensed under the terms of the GNU GPL, version 2. See
|
10 | 6e02c38d | aliguori | * the COPYING file in the top-level directory.
|
11 | 6e02c38d | aliguori | *
|
12 | 6e02c38d | aliguori | */
|
13 | 6e02c38d | aliguori | |
14 | 869a5c6d | aliguori | #include <qemu-common.h> |
15 | d75d25e3 | Markus Armbruster | #include "qemu-error.h" |
16 | 6d519a5f | Stefan Hajnoczi | #include "trace.h" |
17 | 2446333c | Blue Swirl | #include "blockdev.h" |
18 | 6e02c38d | aliguori | #include "virtio-blk.h" |
19 | 1063b8b1 | Christoph Hellwig | #ifdef __linux__
|
20 | 1063b8b1 | Christoph Hellwig | # include <scsi/sg.h> |
21 | 1063b8b1 | Christoph Hellwig | #endif
|
22 | 6e02c38d | aliguori | |
23 | 6e02c38d | aliguori | typedef struct VirtIOBlock |
24 | 6e02c38d | aliguori | { |
25 | 6e02c38d | aliguori | VirtIODevice vdev; |
26 | 6e02c38d | aliguori | BlockDriverState *bs; |
27 | 6e02c38d | aliguori | VirtQueue *vq; |
28 | 869a5c6d | aliguori | void *rq;
|
29 | 213189ab | Markus Armbruster | QEMUBH *bh; |
30 | 9752c371 | Christoph Hellwig | BlockConf *conf; |
31 | 8cfacf07 | Christoph Hellwig | unsigned short sector_mask; |
32 | 2930b313 | john cooper | char sn[BLOCK_SERIAL_STRLEN];
|
33 | 9d0d3138 | Alex Williamson | DeviceState *qdev; |
34 | 6e02c38d | aliguori | } VirtIOBlock; |
35 | 6e02c38d | aliguori | |
36 | 6e02c38d | aliguori | static VirtIOBlock *to_virtio_blk(VirtIODevice *vdev)
|
37 | 6e02c38d | aliguori | { |
38 | 6e02c38d | aliguori | return (VirtIOBlock *)vdev;
|
39 | 6e02c38d | aliguori | } |
40 | 6e02c38d | aliguori | |
41 | 6e02c38d | aliguori | typedef struct VirtIOBlockReq |
42 | 6e02c38d | aliguori | { |
43 | 6e02c38d | aliguori | VirtIOBlock *dev; |
44 | 6e02c38d | aliguori | VirtQueueElement elem; |
45 | 6e02c38d | aliguori | struct virtio_blk_inhdr *in;
|
46 | 6e02c38d | aliguori | struct virtio_blk_outhdr *out;
|
47 | 1063b8b1 | Christoph Hellwig | struct virtio_scsi_inhdr *scsi;
|
48 | d28a1b6e | aliguori | QEMUIOVector qiov; |
49 | 869a5c6d | aliguori | struct VirtIOBlockReq *next;
|
50 | 6e02c38d | aliguori | } VirtIOBlockReq; |
51 | 6e02c38d | aliguori | |
52 | 869a5c6d | aliguori | static void virtio_blk_req_complete(VirtIOBlockReq *req, int status) |
53 | 869a5c6d | aliguori | { |
54 | 869a5c6d | aliguori | VirtIOBlock *s = req->dev; |
55 | 869a5c6d | aliguori | |
56 | 6d519a5f | Stefan Hajnoczi | trace_virtio_blk_req_complete(req, status); |
57 | 6d519a5f | Stefan Hajnoczi | |
58 | 92e3c2a3 | Aurelien Jarno | stb_p(&req->in->status, status); |
59 | d28a1b6e | aliguori | virtqueue_push(s->vq, &req->elem, req->qiov.size + sizeof(*req->in));
|
60 | 869a5c6d | aliguori | virtio_notify(&s->vdev, s->vq); |
61 | 869a5c6d | aliguori | |
62 | 869a5c6d | aliguori | qemu_free(req); |
63 | 869a5c6d | aliguori | } |
64 | 869a5c6d | aliguori | |
65 | f35d68f0 | Kevin Wolf | static int virtio_blk_handle_rw_error(VirtIOBlockReq *req, int error, |
66 | f35d68f0 | Kevin Wolf | int is_read)
|
67 | 869a5c6d | aliguori | { |
68 | abd7f68d | Markus Armbruster | BlockErrorAction action = bdrv_get_on_error(req->dev->bs, is_read); |
69 | 869a5c6d | aliguori | VirtIOBlock *s = req->dev; |
70 | 869a5c6d | aliguori | |
71 | eaa6c85f | Luiz Capitulino | if (action == BLOCK_ERR_IGNORE) {
|
72 | 908bb949 | Kevin Wolf | bdrv_mon_event(s->bs, BDRV_ACTION_IGNORE, is_read); |
73 | 869a5c6d | aliguori | return 0; |
74 | eaa6c85f | Luiz Capitulino | } |
75 | 869a5c6d | aliguori | |
76 | 869a5c6d | aliguori | if ((error == ENOSPC && action == BLOCK_ERR_STOP_ENOSPC)
|
77 | 869a5c6d | aliguori | || action == BLOCK_ERR_STOP_ANY) { |
78 | 869a5c6d | aliguori | req->next = s->rq; |
79 | 869a5c6d | aliguori | s->rq = req; |
80 | 908bb949 | Kevin Wolf | bdrv_mon_event(s->bs, BDRV_ACTION_STOP, is_read); |
81 | e07bbac5 | Jan Kiszka | vm_stop(VMSTOP_DISKFULL); |
82 | 869a5c6d | aliguori | } else {
|
83 | 869a5c6d | aliguori | virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); |
84 | 908bb949 | Kevin Wolf | bdrv_mon_event(s->bs, BDRV_ACTION_REPORT, is_read); |
85 | 869a5c6d | aliguori | } |
86 | 869a5c6d | aliguori | |
87 | 869a5c6d | aliguori | return 1; |
88 | 869a5c6d | aliguori | } |
89 | 869a5c6d | aliguori | |
90 | 6e02c38d | aliguori | static void virtio_blk_rw_complete(void *opaque, int ret) |
91 | 6e02c38d | aliguori | { |
92 | 6e02c38d | aliguori | VirtIOBlockReq *req = opaque; |
93 | 6e02c38d | aliguori | |
94 | 6d519a5f | Stefan Hajnoczi | trace_virtio_blk_rw_complete(req, ret); |
95 | 6d519a5f | Stefan Hajnoczi | |
96 | f35d68f0 | Kevin Wolf | if (ret) {
|
97 | 92e3c2a3 | Aurelien Jarno | int is_read = !(ldl_p(&req->out->type) & VIRTIO_BLK_T_OUT);
|
98 | f35d68f0 | Kevin Wolf | if (virtio_blk_handle_rw_error(req, -ret, is_read))
|
99 | 869a5c6d | aliguori | return;
|
100 | 6e02c38d | aliguori | } |
101 | 6e02c38d | aliguori | |
102 | f35d68f0 | Kevin Wolf | virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); |
103 | 869a5c6d | aliguori | } |
104 | 6e02c38d | aliguori | |
105 | aa659be3 | Christoph Hellwig | static void virtio_blk_flush_complete(void *opaque, int ret) |
106 | aa659be3 | Christoph Hellwig | { |
107 | aa659be3 | Christoph Hellwig | VirtIOBlockReq *req = opaque; |
108 | aa659be3 | Christoph Hellwig | |
109 | 8c269b54 | Kevin Wolf | if (ret) {
|
110 | 8c269b54 | Kevin Wolf | if (virtio_blk_handle_rw_error(req, -ret, 0)) { |
111 | 8c269b54 | Kevin Wolf | return;
|
112 | 8c269b54 | Kevin Wolf | } |
113 | 8c269b54 | Kevin Wolf | } |
114 | 8c269b54 | Kevin Wolf | |
115 | 8c269b54 | Kevin Wolf | virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); |
116 | aa659be3 | Christoph Hellwig | } |
117 | aa659be3 | Christoph Hellwig | |
118 | 869a5c6d | aliguori | static VirtIOBlockReq *virtio_blk_alloc_request(VirtIOBlock *s)
|
119 | 869a5c6d | aliguori | { |
120 | de6c8042 | Stefan Hajnoczi | VirtIOBlockReq *req = qemu_malloc(sizeof(*req));
|
121 | 487414f1 | aliguori | req->dev = s; |
122 | de6c8042 | Stefan Hajnoczi | req->qiov.size = 0;
|
123 | de6c8042 | Stefan Hajnoczi | req->next = NULL;
|
124 | 869a5c6d | aliguori | return req;
|
125 | 6e02c38d | aliguori | } |
126 | 6e02c38d | aliguori | |
127 | 6e02c38d | aliguori | static VirtIOBlockReq *virtio_blk_get_request(VirtIOBlock *s)
|
128 | 6e02c38d | aliguori | { |
129 | 869a5c6d | aliguori | VirtIOBlockReq *req = virtio_blk_alloc_request(s); |
130 | 6e02c38d | aliguori | |
131 | 869a5c6d | aliguori | if (req != NULL) { |
132 | 869a5c6d | aliguori | if (!virtqueue_pop(s->vq, &req->elem)) {
|
133 | 869a5c6d | aliguori | qemu_free(req); |
134 | 869a5c6d | aliguori | return NULL; |
135 | 869a5c6d | aliguori | } |
136 | 6e02c38d | aliguori | } |
137 | 6e02c38d | aliguori | |
138 | 6e02c38d | aliguori | return req;
|
139 | 6e02c38d | aliguori | } |
140 | 6e02c38d | aliguori | |
141 | 1063b8b1 | Christoph Hellwig | #ifdef __linux__
|
142 | 1063b8b1 | Christoph Hellwig | static void virtio_blk_handle_scsi(VirtIOBlockReq *req) |
143 | 1063b8b1 | Christoph Hellwig | { |
144 | 1063b8b1 | Christoph Hellwig | struct sg_io_hdr hdr;
|
145 | 4277906d | Christoph Hellwig | int ret;
|
146 | 1063b8b1 | Christoph Hellwig | int status;
|
147 | 1063b8b1 | Christoph Hellwig | int i;
|
148 | 1063b8b1 | Christoph Hellwig | |
149 | 1063b8b1 | Christoph Hellwig | /*
|
150 | 1063b8b1 | Christoph Hellwig | * We require at least one output segment each for the virtio_blk_outhdr
|
151 | 1063b8b1 | Christoph Hellwig | * and the SCSI command block.
|
152 | 1063b8b1 | Christoph Hellwig | *
|
153 | 1063b8b1 | Christoph Hellwig | * We also at least require the virtio_blk_inhdr, the virtio_scsi_inhdr
|
154 | 1063b8b1 | Christoph Hellwig | * and the sense buffer pointer in the input segments.
|
155 | 1063b8b1 | Christoph Hellwig | */
|
156 | 1063b8b1 | Christoph Hellwig | if (req->elem.out_num < 2 || req->elem.in_num < 3) { |
157 | 1063b8b1 | Christoph Hellwig | virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); |
158 | 1063b8b1 | Christoph Hellwig | return;
|
159 | 1063b8b1 | Christoph Hellwig | } |
160 | 1063b8b1 | Christoph Hellwig | |
161 | 1063b8b1 | Christoph Hellwig | /*
|
162 | 1063b8b1 | Christoph Hellwig | * No support for bidirection commands yet.
|
163 | 1063b8b1 | Christoph Hellwig | */
|
164 | 1063b8b1 | Christoph Hellwig | if (req->elem.out_num > 2 && req->elem.in_num > 3) { |
165 | 1063b8b1 | Christoph Hellwig | virtio_blk_req_complete(req, VIRTIO_BLK_S_UNSUPP); |
166 | 1063b8b1 | Christoph Hellwig | return;
|
167 | 1063b8b1 | Christoph Hellwig | } |
168 | 1063b8b1 | Christoph Hellwig | |
169 | 1063b8b1 | Christoph Hellwig | /*
|
170 | 1063b8b1 | Christoph Hellwig | * The scsi inhdr is placed in the second-to-last input segment, just
|
171 | 1063b8b1 | Christoph Hellwig | * before the regular inhdr.
|
172 | 1063b8b1 | Christoph Hellwig | */
|
173 | 1063b8b1 | Christoph Hellwig | req->scsi = (void *)req->elem.in_sg[req->elem.in_num - 2].iov_base; |
174 | 1063b8b1 | Christoph Hellwig | |
175 | 1063b8b1 | Christoph Hellwig | memset(&hdr, 0, sizeof(struct sg_io_hdr)); |
176 | 1063b8b1 | Christoph Hellwig | hdr.interface_id = 'S';
|
177 | 1063b8b1 | Christoph Hellwig | hdr.cmd_len = req->elem.out_sg[1].iov_len;
|
178 | 1063b8b1 | Christoph Hellwig | hdr.cmdp = req->elem.out_sg[1].iov_base;
|
179 | 1063b8b1 | Christoph Hellwig | hdr.dxfer_len = 0;
|
180 | 1063b8b1 | Christoph Hellwig | |
181 | 1063b8b1 | Christoph Hellwig | if (req->elem.out_num > 2) { |
182 | 1063b8b1 | Christoph Hellwig | /*
|
183 | 1063b8b1 | Christoph Hellwig | * If there are more than the minimally required 2 output segments
|
184 | 1063b8b1 | Christoph Hellwig | * there is write payload starting from the third iovec.
|
185 | 1063b8b1 | Christoph Hellwig | */
|
186 | 1063b8b1 | Christoph Hellwig | hdr.dxfer_direction = SG_DXFER_TO_DEV; |
187 | 1063b8b1 | Christoph Hellwig | hdr.iovec_count = req->elem.out_num - 2;
|
188 | 1063b8b1 | Christoph Hellwig | |
189 | 1063b8b1 | Christoph Hellwig | for (i = 0; i < hdr.iovec_count; i++) |
190 | 1063b8b1 | Christoph Hellwig | hdr.dxfer_len += req->elem.out_sg[i + 2].iov_len;
|
191 | 1063b8b1 | Christoph Hellwig | |
192 | 1063b8b1 | Christoph Hellwig | hdr.dxferp = req->elem.out_sg + 2;
|
193 | 1063b8b1 | Christoph Hellwig | |
194 | 1063b8b1 | Christoph Hellwig | } else if (req->elem.in_num > 3) { |
195 | 1063b8b1 | Christoph Hellwig | /*
|
196 | 1063b8b1 | Christoph Hellwig | * If we have more than 3 input segments the guest wants to actually
|
197 | 1063b8b1 | Christoph Hellwig | * read data.
|
198 | 1063b8b1 | Christoph Hellwig | */
|
199 | 1063b8b1 | Christoph Hellwig | hdr.dxfer_direction = SG_DXFER_FROM_DEV; |
200 | 1063b8b1 | Christoph Hellwig | hdr.iovec_count = req->elem.in_num - 3;
|
201 | 1063b8b1 | Christoph Hellwig | for (i = 0; i < hdr.iovec_count; i++) |
202 | 1063b8b1 | Christoph Hellwig | hdr.dxfer_len += req->elem.in_sg[i].iov_len; |
203 | 1063b8b1 | Christoph Hellwig | |
204 | 1063b8b1 | Christoph Hellwig | hdr.dxferp = req->elem.in_sg; |
205 | 1063b8b1 | Christoph Hellwig | } else {
|
206 | 1063b8b1 | Christoph Hellwig | /*
|
207 | 1063b8b1 | Christoph Hellwig | * Some SCSI commands don't actually transfer any data.
|
208 | 1063b8b1 | Christoph Hellwig | */
|
209 | 1063b8b1 | Christoph Hellwig | hdr.dxfer_direction = SG_DXFER_NONE; |
210 | 1063b8b1 | Christoph Hellwig | } |
211 | 1063b8b1 | Christoph Hellwig | |
212 | 1063b8b1 | Christoph Hellwig | hdr.sbp = req->elem.in_sg[req->elem.in_num - 3].iov_base;
|
213 | 1063b8b1 | Christoph Hellwig | hdr.mx_sb_len = req->elem.in_sg[req->elem.in_num - 3].iov_len;
|
214 | 1063b8b1 | Christoph Hellwig | |
215 | 1063b8b1 | Christoph Hellwig | ret = bdrv_ioctl(req->dev->bs, SG_IO, &hdr); |
216 | 1063b8b1 | Christoph Hellwig | if (ret) {
|
217 | 1063b8b1 | Christoph Hellwig | status = VIRTIO_BLK_S_UNSUPP; |
218 | 1063b8b1 | Christoph Hellwig | hdr.status = ret; |
219 | 1063b8b1 | Christoph Hellwig | hdr.resid = hdr.dxfer_len; |
220 | 1063b8b1 | Christoph Hellwig | } else if (hdr.status) { |
221 | 1063b8b1 | Christoph Hellwig | status = VIRTIO_BLK_S_IOERR; |
222 | 1063b8b1 | Christoph Hellwig | } else {
|
223 | 1063b8b1 | Christoph Hellwig | status = VIRTIO_BLK_S_OK; |
224 | 1063b8b1 | Christoph Hellwig | } |
225 | 1063b8b1 | Christoph Hellwig | |
226 | 92e3c2a3 | Aurelien Jarno | stl_p(&req->scsi->errors, hdr.status); |
227 | 92e3c2a3 | Aurelien Jarno | stl_p(&req->scsi->residual, hdr.resid); |
228 | 92e3c2a3 | Aurelien Jarno | stl_p(&req->scsi->sense_len, hdr.sb_len_wr); |
229 | 92e3c2a3 | Aurelien Jarno | stl_p(&req->scsi->data_len, hdr.dxfer_len); |
230 | 1063b8b1 | Christoph Hellwig | |
231 | 1063b8b1 | Christoph Hellwig | virtio_blk_req_complete(req, status); |
232 | 1063b8b1 | Christoph Hellwig | } |
233 | 1063b8b1 | Christoph Hellwig | #else
|
234 | 1063b8b1 | Christoph Hellwig | static void virtio_blk_handle_scsi(VirtIOBlockReq *req) |
235 | 1063b8b1 | Christoph Hellwig | { |
236 | 1063b8b1 | Christoph Hellwig | virtio_blk_req_complete(req, VIRTIO_BLK_S_UNSUPP); |
237 | 1063b8b1 | Christoph Hellwig | } |
238 | 1063b8b1 | Christoph Hellwig | #endif /* __linux__ */ |
239 | 1063b8b1 | Christoph Hellwig | |
240 | c20fd872 | Christoph Hellwig | typedef struct MultiReqBuffer { |
241 | c20fd872 | Christoph Hellwig | BlockRequest blkreq[32];
|
242 | c20fd872 | Christoph Hellwig | unsigned int num_writes; |
243 | c20fd872 | Christoph Hellwig | } MultiReqBuffer; |
244 | c20fd872 | Christoph Hellwig | |
245 | c20fd872 | Christoph Hellwig | static void virtio_submit_multiwrite(BlockDriverState *bs, MultiReqBuffer *mrb) |
246 | 869a5c6d | aliguori | { |
247 | 91553dcc | Kevin Wolf | int i, ret;
|
248 | 91553dcc | Kevin Wolf | |
249 | c20fd872 | Christoph Hellwig | if (!mrb->num_writes) {
|
250 | c20fd872 | Christoph Hellwig | return;
|
251 | c20fd872 | Christoph Hellwig | } |
252 | c20fd872 | Christoph Hellwig | |
253 | c20fd872 | Christoph Hellwig | ret = bdrv_aio_multiwrite(bs, mrb->blkreq, mrb->num_writes); |
254 | 91553dcc | Kevin Wolf | if (ret != 0) { |
255 | c20fd872 | Christoph Hellwig | for (i = 0; i < mrb->num_writes; i++) { |
256 | c20fd872 | Christoph Hellwig | if (mrb->blkreq[i].error) {
|
257 | c20fd872 | Christoph Hellwig | virtio_blk_rw_complete(mrb->blkreq[i].opaque, -EIO); |
258 | 91553dcc | Kevin Wolf | } |
259 | 91553dcc | Kevin Wolf | } |
260 | 91553dcc | Kevin Wolf | } |
261 | c20fd872 | Christoph Hellwig | |
262 | c20fd872 | Christoph Hellwig | mrb->num_writes = 0;
|
263 | 91553dcc | Kevin Wolf | } |
264 | 87b245db | Christoph Hellwig | |
265 | c20fd872 | Christoph Hellwig | static void virtio_blk_handle_flush(VirtIOBlockReq *req, MultiReqBuffer *mrb) |
266 | aa659be3 | Christoph Hellwig | { |
267 | aa659be3 | Christoph Hellwig | BlockDriverAIOCB *acb; |
268 | aa659be3 | Christoph Hellwig | |
269 | 618fbb84 | Christoph Hellwig | /*
|
270 | 618fbb84 | Christoph Hellwig | * Make sure all outstanding writes are posted to the backing device.
|
271 | 618fbb84 | Christoph Hellwig | */
|
272 | c20fd872 | Christoph Hellwig | virtio_submit_multiwrite(req->dev->bs, mrb); |
273 | 618fbb84 | Christoph Hellwig | |
274 | aa659be3 | Christoph Hellwig | acb = bdrv_aio_flush(req->dev->bs, virtio_blk_flush_complete, req); |
275 | aa659be3 | Christoph Hellwig | if (!acb) {
|
276 | 18a8d421 | Kevin Wolf | virtio_blk_flush_complete(req, -EIO); |
277 | aa659be3 | Christoph Hellwig | } |
278 | aa659be3 | Christoph Hellwig | } |
279 | aa659be3 | Christoph Hellwig | |
280 | c20fd872 | Christoph Hellwig | static void virtio_blk_handle_write(VirtIOBlockReq *req, MultiReqBuffer *mrb) |
281 | 91553dcc | Kevin Wolf | { |
282 | c20fd872 | Christoph Hellwig | BlockRequest *blkreq; |
283 | 92e3c2a3 | Aurelien Jarno | uint64_t sector; |
284 | c20fd872 | Christoph Hellwig | |
285 | 92e3c2a3 | Aurelien Jarno | sector = ldq_p(&req->out->sector); |
286 | 6d519a5f | Stefan Hajnoczi | |
287 | 92e3c2a3 | Aurelien Jarno | trace_virtio_blk_handle_write(req, sector, req->qiov.size / 512);
|
288 | 92e3c2a3 | Aurelien Jarno | |
289 | 92e3c2a3 | Aurelien Jarno | if (sector & req->dev->sector_mask) {
|
290 | 8cfacf07 | Christoph Hellwig | virtio_blk_rw_complete(req, -EIO); |
291 | 8cfacf07 | Christoph Hellwig | return;
|
292 | 8cfacf07 | Christoph Hellwig | } |
293 | 8cfacf07 | Christoph Hellwig | |
294 | c20fd872 | Christoph Hellwig | if (mrb->num_writes == 32) { |
295 | c20fd872 | Christoph Hellwig | virtio_submit_multiwrite(req->dev->bs, mrb); |
296 | 87b245db | Christoph Hellwig | } |
297 | 91553dcc | Kevin Wolf | |
298 | c20fd872 | Christoph Hellwig | blkreq = &mrb->blkreq[mrb->num_writes]; |
299 | 92e3c2a3 | Aurelien Jarno | blkreq->sector = sector; |
300 | c20fd872 | Christoph Hellwig | blkreq->nb_sectors = req->qiov.size / BDRV_SECTOR_SIZE; |
301 | c20fd872 | Christoph Hellwig | blkreq->qiov = &req->qiov; |
302 | c20fd872 | Christoph Hellwig | blkreq->cb = virtio_blk_rw_complete; |
303 | c20fd872 | Christoph Hellwig | blkreq->opaque = req; |
304 | c20fd872 | Christoph Hellwig | blkreq->error = 0;
|
305 | 91553dcc | Kevin Wolf | |
306 | c20fd872 | Christoph Hellwig | mrb->num_writes++; |
307 | d28a1b6e | aliguori | } |
308 | 869a5c6d | aliguori | |
309 | d28a1b6e | aliguori | static void virtio_blk_handle_read(VirtIOBlockReq *req) |
310 | d28a1b6e | aliguori | { |
311 | 87b245db | Christoph Hellwig | BlockDriverAIOCB *acb; |
312 | 92e3c2a3 | Aurelien Jarno | uint64_t sector; |
313 | 92e3c2a3 | Aurelien Jarno | |
314 | 92e3c2a3 | Aurelien Jarno | sector = ldq_p(&req->out->sector); |
315 | 87b245db | Christoph Hellwig | |
316 | 92e3c2a3 | Aurelien Jarno | if (sector & req->dev->sector_mask) {
|
317 | 8cfacf07 | Christoph Hellwig | virtio_blk_rw_complete(req, -EIO); |
318 | 8cfacf07 | Christoph Hellwig | return;
|
319 | 8cfacf07 | Christoph Hellwig | } |
320 | 8cfacf07 | Christoph Hellwig | |
321 | 92e3c2a3 | Aurelien Jarno | acb = bdrv_aio_readv(req->dev->bs, sector, &req->qiov, |
322 | 1573a35d | Jes Sorensen | req->qiov.size / BDRV_SECTOR_SIZE, |
323 | 1573a35d | Jes Sorensen | virtio_blk_rw_complete, req); |
324 | 87b245db | Christoph Hellwig | if (!acb) {
|
325 | 6c510fbf | Kevin Wolf | virtio_blk_rw_complete(req, -EIO); |
326 | 87b245db | Christoph Hellwig | } |
327 | 869a5c6d | aliguori | } |
328 | 869a5c6d | aliguori | |
329 | bc6694d4 | Kevin Wolf | static void virtio_blk_handle_request(VirtIOBlockReq *req, |
330 | bc6694d4 | Kevin Wolf | MultiReqBuffer *mrb) |
331 | bc6694d4 | Kevin Wolf | { |
332 | 92e3c2a3 | Aurelien Jarno | uint32_t type; |
333 | 92e3c2a3 | Aurelien Jarno | |
334 | bc6694d4 | Kevin Wolf | if (req->elem.out_num < 1 || req->elem.in_num < 1) { |
335 | 870cef1d | Stefan Hajnoczi | error_report("virtio-blk missing headers");
|
336 | bc6694d4 | Kevin Wolf | exit(1);
|
337 | bc6694d4 | Kevin Wolf | } |
338 | bc6694d4 | Kevin Wolf | |
339 | bc6694d4 | Kevin Wolf | if (req->elem.out_sg[0].iov_len < sizeof(*req->out) || |
340 | bc6694d4 | Kevin Wolf | req->elem.in_sg[req->elem.in_num - 1].iov_len < sizeof(*req->in)) { |
341 | 870cef1d | Stefan Hajnoczi | error_report("virtio-blk header not in correct element");
|
342 | bc6694d4 | Kevin Wolf | exit(1);
|
343 | bc6694d4 | Kevin Wolf | } |
344 | bc6694d4 | Kevin Wolf | |
345 | bc6694d4 | Kevin Wolf | req->out = (void *)req->elem.out_sg[0].iov_base; |
346 | bc6694d4 | Kevin Wolf | req->in = (void *)req->elem.in_sg[req->elem.in_num - 1].iov_base; |
347 | bc6694d4 | Kevin Wolf | |
348 | 92e3c2a3 | Aurelien Jarno | type = ldl_p(&req->out->type); |
349 | 92e3c2a3 | Aurelien Jarno | |
350 | 92e3c2a3 | Aurelien Jarno | if (type & VIRTIO_BLK_T_FLUSH) {
|
351 | c20fd872 | Christoph Hellwig | virtio_blk_handle_flush(req, mrb); |
352 | 92e3c2a3 | Aurelien Jarno | } else if (type & VIRTIO_BLK_T_SCSI_CMD) { |
353 | bc6694d4 | Kevin Wolf | virtio_blk_handle_scsi(req); |
354 | 92e3c2a3 | Aurelien Jarno | } else if (type & VIRTIO_BLK_T_GET_ID) { |
355 | 2930b313 | john cooper | VirtIOBlock *s = req->dev; |
356 | 2930b313 | john cooper | |
357 | 2930b313 | john cooper | memcpy(req->elem.in_sg[0].iov_base, s->sn,
|
358 | 2930b313 | john cooper | MIN(req->elem.in_sg[0].iov_len, sizeof(s->sn))); |
359 | 2930b313 | john cooper | virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); |
360 | 92e3c2a3 | Aurelien Jarno | } else if (type & VIRTIO_BLK_T_OUT) { |
361 | bc6694d4 | Kevin Wolf | qemu_iovec_init_external(&req->qiov, &req->elem.out_sg[1],
|
362 | bc6694d4 | Kevin Wolf | req->elem.out_num - 1);
|
363 | c20fd872 | Christoph Hellwig | virtio_blk_handle_write(req, mrb); |
364 | bc6694d4 | Kevin Wolf | } else {
|
365 | bc6694d4 | Kevin Wolf | qemu_iovec_init_external(&req->qiov, &req->elem.in_sg[0],
|
366 | bc6694d4 | Kevin Wolf | req->elem.in_num - 1);
|
367 | bc6694d4 | Kevin Wolf | virtio_blk_handle_read(req); |
368 | bc6694d4 | Kevin Wolf | } |
369 | bc6694d4 | Kevin Wolf | } |
370 | bc6694d4 | Kevin Wolf | |
371 | 6e02c38d | aliguori | static void virtio_blk_handle_output(VirtIODevice *vdev, VirtQueue *vq) |
372 | 6e02c38d | aliguori | { |
373 | 6e02c38d | aliguori | VirtIOBlock *s = to_virtio_blk(vdev); |
374 | 6e02c38d | aliguori | VirtIOBlockReq *req; |
375 | bc6694d4 | Kevin Wolf | MultiReqBuffer mrb = { |
376 | bc6694d4 | Kevin Wolf | .num_writes = 0,
|
377 | bc6694d4 | Kevin Wolf | }; |
378 | 6e02c38d | aliguori | |
379 | 6e02c38d | aliguori | while ((req = virtio_blk_get_request(s))) {
|
380 | bc6694d4 | Kevin Wolf | virtio_blk_handle_request(req, &mrb); |
381 | 6e02c38d | aliguori | } |
382 | 91553dcc | Kevin Wolf | |
383 | c20fd872 | Christoph Hellwig | virtio_submit_multiwrite(s->bs, &mrb); |
384 | 91553dcc | Kevin Wolf | |
385 | 6e02c38d | aliguori | /*
|
386 | 6e02c38d | aliguori | * FIXME: Want to check for completions before returning to guest mode,
|
387 | 6e02c38d | aliguori | * so cached reads and writes are reported as quickly as possible. But
|
388 | 6e02c38d | aliguori | * that should be done in the generic block layer.
|
389 | 6e02c38d | aliguori | */
|
390 | 6e02c38d | aliguori | } |
391 | 6e02c38d | aliguori | |
392 | 213189ab | Markus Armbruster | static void virtio_blk_dma_restart_bh(void *opaque) |
393 | 869a5c6d | aliguori | { |
394 | 869a5c6d | aliguori | VirtIOBlock *s = opaque; |
395 | 869a5c6d | aliguori | VirtIOBlockReq *req = s->rq; |
396 | f1b52868 | Kevin Wolf | MultiReqBuffer mrb = { |
397 | f1b52868 | Kevin Wolf | .num_writes = 0,
|
398 | f1b52868 | Kevin Wolf | }; |
399 | 869a5c6d | aliguori | |
400 | 213189ab | Markus Armbruster | qemu_bh_delete(s->bh); |
401 | 213189ab | Markus Armbruster | s->bh = NULL;
|
402 | 869a5c6d | aliguori | |
403 | 869a5c6d | aliguori | s->rq = NULL;
|
404 | 869a5c6d | aliguori | |
405 | 869a5c6d | aliguori | while (req) {
|
406 | f1b52868 | Kevin Wolf | virtio_blk_handle_request(req, &mrb); |
407 | 869a5c6d | aliguori | req = req->next; |
408 | 869a5c6d | aliguori | } |
409 | f1b52868 | Kevin Wolf | |
410 | c20fd872 | Christoph Hellwig | virtio_submit_multiwrite(s->bs, &mrb); |
411 | 869a5c6d | aliguori | } |
412 | 869a5c6d | aliguori | |
413 | 213189ab | Markus Armbruster | static void virtio_blk_dma_restart_cb(void *opaque, int running, int reason) |
414 | 213189ab | Markus Armbruster | { |
415 | 213189ab | Markus Armbruster | VirtIOBlock *s = opaque; |
416 | 213189ab | Markus Armbruster | |
417 | 213189ab | Markus Armbruster | if (!running)
|
418 | 213189ab | Markus Armbruster | return;
|
419 | 213189ab | Markus Armbruster | |
420 | 213189ab | Markus Armbruster | if (!s->bh) {
|
421 | 213189ab | Markus Armbruster | s->bh = qemu_bh_new(virtio_blk_dma_restart_bh, s); |
422 | 213189ab | Markus Armbruster | qemu_bh_schedule(s->bh); |
423 | 213189ab | Markus Armbruster | } |
424 | 213189ab | Markus Armbruster | } |
425 | 213189ab | Markus Armbruster | |
426 | 6e02c38d | aliguori | static void virtio_blk_reset(VirtIODevice *vdev) |
427 | 6e02c38d | aliguori | { |
428 | 6e02c38d | aliguori | /*
|
429 | 6e02c38d | aliguori | * This should cancel pending requests, but can't do nicely until there
|
430 | 6e02c38d | aliguori | * are per-device request lists.
|
431 | 6e02c38d | aliguori | */
|
432 | 6e02c38d | aliguori | qemu_aio_flush(); |
433 | 6e02c38d | aliguori | } |
434 | 6e02c38d | aliguori | |
435 | bf011293 | john cooper | /* coalesce internal state, copy to pci i/o region 0
|
436 | bf011293 | john cooper | */
|
437 | 6e02c38d | aliguori | static void virtio_blk_update_config(VirtIODevice *vdev, uint8_t *config) |
438 | 6e02c38d | aliguori | { |
439 | 6e02c38d | aliguori | VirtIOBlock *s = to_virtio_blk(vdev); |
440 | 6e02c38d | aliguori | struct virtio_blk_config blkcfg;
|
441 | 6e02c38d | aliguori | uint64_t capacity; |
442 | 6e02c38d | aliguori | int cylinders, heads, secs;
|
443 | 6e02c38d | aliguori | |
444 | 6e02c38d | aliguori | bdrv_get_geometry(s->bs, &capacity); |
445 | 6e02c38d | aliguori | bdrv_get_geometry_hint(s->bs, &cylinders, &heads, &secs); |
446 | 5c5dafdc | Gerd Hoffmann | memset(&blkcfg, 0, sizeof(blkcfg)); |
447 | 6e02c38d | aliguori | stq_raw(&blkcfg.capacity, capacity); |
448 | 6e02c38d | aliguori | stl_raw(&blkcfg.seg_max, 128 - 2); |
449 | 6e02c38d | aliguori | stw_raw(&blkcfg.cylinders, cylinders); |
450 | 6e02c38d | aliguori | blkcfg.heads = heads; |
451 | 8cfacf07 | Christoph Hellwig | blkcfg.sectors = secs & ~s->sector_mask; |
452 | 8cfacf07 | Christoph Hellwig | blkcfg.blk_size = s->conf->logical_block_size; |
453 | c7085da7 | Blue Swirl | blkcfg.size_max = 0;
|
454 | 9752c371 | Christoph Hellwig | blkcfg.physical_block_exp = get_physical_block_exp(s->conf); |
455 | 9752c371 | Christoph Hellwig | blkcfg.alignment_offset = 0;
|
456 | 8cfacf07 | Christoph Hellwig | blkcfg.min_io_size = s->conf->min_io_size / blkcfg.blk_size; |
457 | 8cfacf07 | Christoph Hellwig | blkcfg.opt_io_size = s->conf->opt_io_size / blkcfg.blk_size; |
458 | 37d5ddd6 | hch@lst.de | memcpy(config, &blkcfg, sizeof(struct virtio_blk_config)); |
459 | 6e02c38d | aliguori | } |
460 | 6e02c38d | aliguori | |
461 | 8172539d | Michael S. Tsirkin | static uint32_t virtio_blk_get_features(VirtIODevice *vdev, uint32_t features)
|
462 | 6e02c38d | aliguori | { |
463 | bf011293 | john cooper | VirtIOBlock *s = to_virtio_blk(vdev); |
464 | 1063b8b1 | Christoph Hellwig | |
465 | 1063b8b1 | Christoph Hellwig | features |= (1 << VIRTIO_BLK_F_SEG_MAX);
|
466 | 1063b8b1 | Christoph Hellwig | features |= (1 << VIRTIO_BLK_F_GEOMETRY);
|
467 | 9752c371 | Christoph Hellwig | features |= (1 << VIRTIO_BLK_F_TOPOLOGY);
|
468 | 8cfacf07 | Christoph Hellwig | features |= (1 << VIRTIO_BLK_F_BLK_SIZE);
|
469 | aa659be3 | Christoph Hellwig | |
470 | aa659be3 | Christoph Hellwig | if (bdrv_enable_write_cache(s->bs))
|
471 | aa659be3 | Christoph Hellwig | features |= (1 << VIRTIO_BLK_F_WCACHE);
|
472 | c79662f7 | Naphtali Sprei | |
473 | c79662f7 | Naphtali Sprei | if (bdrv_is_read_only(s->bs))
|
474 | c79662f7 | Naphtali Sprei | features |= 1 << VIRTIO_BLK_F_RO;
|
475 | 1063b8b1 | Christoph Hellwig | |
476 | 1063b8b1 | Christoph Hellwig | return features;
|
477 | 6e02c38d | aliguori | } |
478 | 6e02c38d | aliguori | |
479 | 6e02c38d | aliguori | static void virtio_blk_save(QEMUFile *f, void *opaque) |
480 | 6e02c38d | aliguori | { |
481 | 6e02c38d | aliguori | VirtIOBlock *s = opaque; |
482 | 869a5c6d | aliguori | VirtIOBlockReq *req = s->rq; |
483 | 869a5c6d | aliguori | |
484 | 6e02c38d | aliguori | virtio_save(&s->vdev, f); |
485 | 869a5c6d | aliguori | |
486 | 869a5c6d | aliguori | while (req) {
|
487 | 869a5c6d | aliguori | qemu_put_sbyte(f, 1);
|
488 | 869a5c6d | aliguori | qemu_put_buffer(f, (unsigned char*)&req->elem, sizeof(req->elem)); |
489 | 869a5c6d | aliguori | req = req->next; |
490 | 869a5c6d | aliguori | } |
491 | 869a5c6d | aliguori | qemu_put_sbyte(f, 0);
|
492 | 6e02c38d | aliguori | } |
493 | 6e02c38d | aliguori | |
494 | 6e02c38d | aliguori | static int virtio_blk_load(QEMUFile *f, void *opaque, int version_id) |
495 | 6e02c38d | aliguori | { |
496 | 6e02c38d | aliguori | VirtIOBlock *s = opaque; |
497 | 6e02c38d | aliguori | |
498 | 869a5c6d | aliguori | if (version_id != 2) |
499 | 6e02c38d | aliguori | return -EINVAL;
|
500 | 6e02c38d | aliguori | |
501 | 6e02c38d | aliguori | virtio_load(&s->vdev, f); |
502 | 869a5c6d | aliguori | while (qemu_get_sbyte(f)) {
|
503 | 869a5c6d | aliguori | VirtIOBlockReq *req = virtio_blk_alloc_request(s); |
504 | 869a5c6d | aliguori | qemu_get_buffer(f, (unsigned char*)&req->elem, sizeof(req->elem)); |
505 | 869a5c6d | aliguori | req->next = s->rq; |
506 | 20a81e4d | Yoshiaki Tamura | s->rq = req; |
507 | b6a4805b | Kevin Wolf | |
508 | b6a4805b | Kevin Wolf | virtqueue_map_sg(req->elem.in_sg, req->elem.in_addr, |
509 | b6a4805b | Kevin Wolf | req->elem.in_num, 1);
|
510 | b6a4805b | Kevin Wolf | virtqueue_map_sg(req->elem.out_sg, req->elem.out_addr, |
511 | b6a4805b | Kevin Wolf | req->elem.out_num, 0);
|
512 | 869a5c6d | aliguori | } |
513 | 6e02c38d | aliguori | |
514 | 6e02c38d | aliguori | return 0; |
515 | 6e02c38d | aliguori | } |
516 | 6e02c38d | aliguori | |
517 | e5051fc7 | Christoph Hellwig | static void virtio_blk_change_cb(void *opaque, int reason) |
518 | e5051fc7 | Christoph Hellwig | { |
519 | e5051fc7 | Christoph Hellwig | VirtIOBlock *s = opaque; |
520 | e5051fc7 | Christoph Hellwig | |
521 | e5051fc7 | Christoph Hellwig | if (reason & CHANGE_SIZE) {
|
522 | e5051fc7 | Christoph Hellwig | virtio_notify_config(&s->vdev); |
523 | e5051fc7 | Christoph Hellwig | } |
524 | e5051fc7 | Christoph Hellwig | } |
525 | e5051fc7 | Christoph Hellwig | |
526 | 428c149b | Christoph Hellwig | VirtIODevice *virtio_blk_init(DeviceState *dev, BlockConf *conf) |
527 | 6e02c38d | aliguori | { |
528 | 6e02c38d | aliguori | VirtIOBlock *s; |
529 | 6e02c38d | aliguori | int cylinders, heads, secs;
|
530 | 6e02c38d | aliguori | static int virtio_blk_id; |
531 | 2930b313 | john cooper | DriveInfo *dinfo; |
532 | cf21e106 | Paul Brook | |
533 | d75d25e3 | Markus Armbruster | if (!conf->bs) {
|
534 | d75d25e3 | Markus Armbruster | error_report("virtio-blk-pci: drive property not set");
|
535 | d75d25e3 | Markus Armbruster | return NULL; |
536 | d75d25e3 | Markus Armbruster | } |
537 | 98f28ad7 | Markus Armbruster | if (!bdrv_is_inserted(conf->bs)) {
|
538 | 98f28ad7 | Markus Armbruster | error_report("Device needs media, but drive is empty");
|
539 | 98f28ad7 | Markus Armbruster | return NULL; |
540 | 98f28ad7 | Markus Armbruster | } |
541 | d75d25e3 | Markus Armbruster | |
542 | 53c25cea | Paul Brook | s = (VirtIOBlock *)virtio_common_init("virtio-blk", VIRTIO_ID_BLOCK,
|
543 | 37d5ddd6 | hch@lst.de | sizeof(struct virtio_blk_config), |
544 | 53c25cea | Paul Brook | sizeof(VirtIOBlock));
|
545 | 6e02c38d | aliguori | |
546 | 6e02c38d | aliguori | s->vdev.get_config = virtio_blk_update_config; |
547 | 6e02c38d | aliguori | s->vdev.get_features = virtio_blk_get_features; |
548 | 6e02c38d | aliguori | s->vdev.reset = virtio_blk_reset; |
549 | f8b6cc00 | Markus Armbruster | s->bs = conf->bs; |
550 | 9752c371 | Christoph Hellwig | s->conf = conf; |
551 | 869a5c6d | aliguori | s->rq = NULL;
|
552 | 1573a35d | Jes Sorensen | s->sector_mask = (s->conf->logical_block_size / BDRV_SECTOR_SIZE) - 1;
|
553 | 6e02c38d | aliguori | bdrv_guess_geometry(s->bs, &cylinders, &heads, &secs); |
554 | 6e02c38d | aliguori | |
555 | 2930b313 | john cooper | /* NB: per existing s/n string convention the string is terminated
|
556 | 2930b313 | john cooper | * by '\0' only when less than sizeof (s->sn)
|
557 | 2930b313 | john cooper | */
|
558 | 2930b313 | john cooper | dinfo = drive_get_by_blockdev(s->bs); |
559 | 2930b313 | john cooper | strncpy(s->sn, dinfo->serial, sizeof (s->sn));
|
560 | 2930b313 | john cooper | |
561 | 6e02c38d | aliguori | s->vq = virtio_add_queue(&s->vdev, 128, virtio_blk_handle_output);
|
562 | 6e02c38d | aliguori | |
563 | 869a5c6d | aliguori | qemu_add_vm_change_state_handler(virtio_blk_dma_restart_cb, s); |
564 | 9d0d3138 | Alex Williamson | s->qdev = dev; |
565 | 0be71e32 | Alex Williamson | register_savevm(dev, "virtio-blk", virtio_blk_id++, 2, |
566 | 6e02c38d | aliguori | virtio_blk_save, virtio_blk_load, s); |
567 | 7d0d6950 | Markus Armbruster | bdrv_set_removable(s->bs, 0);
|
568 | e5051fc7 | Christoph Hellwig | bdrv_set_change_cb(s->bs, virtio_blk_change_cb, s); |
569 | 316a7af3 | Christoph Hellwig | s->bs->buffer_alignment = conf->logical_block_size; |
570 | 6e02c38d | aliguori | |
571 | 1ca4d09a | Gleb Natapov | add_boot_device_path(conf->bootindex, dev, "/disk@0,0");
|
572 | 1ca4d09a | Gleb Natapov | |
573 | 53c25cea | Paul Brook | return &s->vdev;
|
574 | 6e02c38d | aliguori | } |
575 | 9d0d3138 | Alex Williamson | |
576 | 9d0d3138 | Alex Williamson | void virtio_blk_exit(VirtIODevice *vdev)
|
577 | 9d0d3138 | Alex Williamson | { |
578 | 9d0d3138 | Alex Williamson | VirtIOBlock *s = to_virtio_blk(vdev); |
579 | 9d0d3138 | Alex Williamson | unregister_savevm(s->qdev, "virtio-blk", s);
|
580 | 9d0d3138 | Alex Williamson | } |