]>
Commit | Line | Data |
---|---|---|
798bfe00 | 1 | /* |
216ee365 | 2 | * Copyright (C) 2016-2018 Red Hat, Inc. |
798bfe00 FZ |
3 | * Copyright (C) 2005 Anthony Liguori <[email protected]> |
4 | * | |
5 | * Network Block Device Client Side | |
6 | * | |
7 | * This program is free software; you can redistribute it and/or modify | |
8 | * it under the terms of the GNU General Public License as published by | |
9 | * the Free Software Foundation; under version 2 of the License. | |
10 | * | |
11 | * This program is distributed in the hope that it will be useful, | |
12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
14 | * GNU General Public License for more details. | |
15 | * | |
16 | * You should have received a copy of the GNU General Public License | |
17 | * along with this program; if not, see <http://www.gnu.org/licenses/>. | |
18 | */ | |
19 | ||
d38ea87a | 20 | #include "qemu/osdep.h" |
da34e65c | 21 | #include "qapi/error.h" |
9588463e | 22 | #include "trace.h" |
798bfe00 FZ |
23 | #include "nbd-internal.h" |
24 | ||
798bfe00 FZ |
25 | /* Definitions for opaque data types */ |
26 | ||
27 | static QTAILQ_HEAD(, NBDExport) exports = QTAILQ_HEAD_INITIALIZER(exports); | |
28 | ||
29 | /* That's all folks */ | |
30 | ||
/* Basic flow for negotiation

   Server         Client
   Negotiate

   or

   Server         Client
   Negotiate #1
                  Option
   Negotiate #2

   ----

   followed by

   Server         Client
                  Request
   Response
                  Request
   Response
                  ...
   ...
                  Request (type == 2)

*/
57 | ||
c8a3a1b6 EB |
58 | /* Send an option request. |
59 | * | |
60 | * The request is for option @opt, with @data containing @len bytes of | |
61 | * additional payload for the request (@len may be -1 to treat @data as | |
62 | * a C string; and @data may be NULL if @len is 0). | |
63 | * Return 0 if successful, -1 with errp set if it is impossible to | |
64 | * continue. */ | |
65 | static int nbd_send_option_request(QIOChannel *ioc, uint32_t opt, | |
66 | uint32_t len, const char *data, | |
67 | Error **errp) | |
68 | { | |
420a4e95 | 69 | NBDOption req; |
c8a3a1b6 EB |
70 | QEMU_BUILD_BUG_ON(sizeof(req) != 16); |
71 | ||
72 | if (len == -1) { | |
73 | req.length = len = strlen(data); | |
74 | } | |
3736cc5b | 75 | trace_nbd_send_option_request(opt, nbd_opt_lookup(opt), len); |
c8a3a1b6 EB |
76 | |
77 | stq_be_p(&req.magic, NBD_OPTS_MAGIC); | |
78 | stl_be_p(&req.option, opt); | |
79 | stl_be_p(&req.length, len); | |
80 | ||
d1fdf257 | 81 | if (nbd_write(ioc, &req, sizeof(req), errp) < 0) { |
cb6b1a3f | 82 | error_prepend(errp, "Failed to send option request header: "); |
c8a3a1b6 EB |
83 | return -1; |
84 | } | |
85 | ||
d1fdf257 | 86 | if (len && nbd_write(ioc, (char *) data, len, errp) < 0) { |
cb6b1a3f | 87 | error_prepend(errp, "Failed to send option request data: "); |
c8a3a1b6 EB |
88 | return -1; |
89 | } | |
90 | ||
91 | return 0; | |
92 | } | |
93 | ||
2cdbf413 EB |
94 | /* Send NBD_OPT_ABORT as a courtesy to let the server know that we are |
95 | * not going to attempt further negotiation. */ | |
96 | static void nbd_send_opt_abort(QIOChannel *ioc) | |
97 | { | |
98 | /* Technically, a compliant server is supposed to reply to us; but | |
99 | * older servers disconnected instead. At any rate, we're allowed | |
100 | * to disconnect without waiting for the server reply, so we don't | |
101 | * even care if the request makes it to the server, let alone | |
102 | * waiting around for whether the server replies. */ | |
103 | nbd_send_option_request(ioc, NBD_OPT_ABORT, 0, NULL, NULL); | |
104 | } | |
105 | ||
106 | ||
c8a3a1b6 EB |
107 | /* Receive the header of an option reply, which should match the given |
108 | * opt. Read through the length field, but NOT the length bytes of | |
109 | * payload. Return 0 if successful, -1 with errp set if it is | |
110 | * impossible to continue. */ | |
111 | static int nbd_receive_option_reply(QIOChannel *ioc, uint32_t opt, | |
420a4e95 | 112 | NBDOptionReply *reply, Error **errp) |
c8a3a1b6 EB |
113 | { |
114 | QEMU_BUILD_BUG_ON(sizeof(*reply) != 20); | |
d1fdf257 | 115 | if (nbd_read(ioc, reply, sizeof(*reply), errp) < 0) { |
cb6b1a3f | 116 | error_prepend(errp, "failed to read option reply: "); |
2cdbf413 | 117 | nbd_send_opt_abort(ioc); |
c8a3a1b6 EB |
118 | return -1; |
119 | } | |
80c7c2b0 PM |
120 | reply->magic = be64_to_cpu(reply->magic); |
121 | reply->option = be32_to_cpu(reply->option); | |
122 | reply->type = be32_to_cpu(reply->type); | |
123 | reply->length = be32_to_cpu(reply->length); | |
c8a3a1b6 | 124 | |
3736cc5b EB |
125 | trace_nbd_receive_option_reply(reply->option, nbd_opt_lookup(reply->option), |
126 | reply->type, nbd_rep_lookup(reply->type), | |
127 | reply->length); | |
9344e5f5 | 128 | |
c8a3a1b6 EB |
129 | if (reply->magic != NBD_REP_MAGIC) { |
130 | error_setg(errp, "Unexpected option reply magic"); | |
2cdbf413 | 131 | nbd_send_opt_abort(ioc); |
c8a3a1b6 EB |
132 | return -1; |
133 | } | |
134 | if (reply->option != opt) { | |
6c5c0351 EB |
135 | error_setg(errp, "Unexpected option type %u (%s), expected %u (%s)", |
136 | reply->option, nbd_opt_lookup(reply->option), | |
137 | opt, nbd_opt_lookup(opt)); | |
2cdbf413 | 138 | nbd_send_opt_abort(ioc); |
c8a3a1b6 EB |
139 | return -1; |
140 | } | |
141 | return 0; | |
142 | } | |
143 | ||
144 | /* If reply represents success, return 1 without further action. | |
145 | * If reply represents an error, consume the optional payload of | |
146 | * the packet on ioc. Then return 0 for unsupported (so the client | |
147 | * can fall back to other approaches), or -1 with errp set for other | |
148 | * errors. | |
6ff58164 | 149 | */ |
420a4e95 | 150 | static int nbd_handle_reply_err(QIOChannel *ioc, NBDOptionReply *reply, |
6ff58164 | 151 | Error **errp) |
9344e5f5 | 152 | { |
6ff58164 AB |
153 | char *msg = NULL; |
154 | int result = -1; | |
155 | ||
c8a3a1b6 | 156 | if (!(reply->type & (1 << 31))) { |
6ff58164 AB |
157 | return 1; |
158 | } | |
159 | ||
c8a3a1b6 EB |
160 | if (reply->length) { |
161 | if (reply->length > NBD_MAX_BUFFER_SIZE) { | |
28fb494f | 162 | error_setg(errp, "server error %" PRIu32 |
3736cc5b EB |
163 | " (%s) message is too long", |
164 | reply->type, nbd_rep_lookup(reply->type)); | |
6ff58164 AB |
165 | goto cleanup; |
166 | } | |
c8a3a1b6 | 167 | msg = g_malloc(reply->length + 1); |
d1fdf257 | 168 | if (nbd_read(ioc, msg, reply->length, errp) < 0) { |
28fb494f | 169 | error_prepend(errp, "failed to read option error %" PRIu32 |
cb6b1a3f | 170 | " (%s) message: ", |
3736cc5b | 171 | reply->type, nbd_rep_lookup(reply->type)); |
6ff58164 AB |
172 | goto cleanup; |
173 | } | |
c8a3a1b6 | 174 | msg[reply->length] = '\0'; |
bee21ef0 EB |
175 | trace_nbd_server_error_msg(reply->type, |
176 | nbd_reply_type_lookup(reply->type), msg); | |
9344e5f5 DB |
177 | } |
178 | ||
c8a3a1b6 | 179 | switch (reply->type) { |
9344e5f5 | 180 | case NBD_REP_ERR_UNSUP: |
3736cc5b | 181 | trace_nbd_reply_err_unsup(reply->option, nbd_opt_lookup(reply->option)); |
6ff58164 AB |
182 | result = 0; |
183 | goto cleanup; | |
9344e5f5 | 184 | |
f95910fe | 185 | case NBD_REP_ERR_POLICY: |
28fb494f | 186 | error_setg(errp, "Denied by server for option %" PRIu32 " (%s)", |
3736cc5b | 187 | reply->option, nbd_opt_lookup(reply->option)); |
f95910fe DB |
188 | break; |
189 | ||
9344e5f5 | 190 | case NBD_REP_ERR_INVALID: |
28fb494f | 191 | error_setg(errp, "Invalid parameters for option %" PRIu32 " (%s)", |
3736cc5b | 192 | reply->option, nbd_opt_lookup(reply->option)); |
9344e5f5 DB |
193 | break; |
194 | ||
b6f5d3b5 | 195 | case NBD_REP_ERR_PLATFORM: |
28fb494f | 196 | error_setg(errp, "Server lacks support for option %" PRIu32 " (%s)", |
3736cc5b | 197 | reply->option, nbd_opt_lookup(reply->option)); |
b6f5d3b5 EB |
198 | break; |
199 | ||
f95910fe | 200 | case NBD_REP_ERR_TLS_REQD: |
28fb494f | 201 | error_setg(errp, "TLS negotiation required before option %" PRIu32 |
3736cc5b EB |
202 | " (%s)", reply->option, nbd_opt_lookup(reply->option)); |
203 | break; | |
204 | ||
205 | case NBD_REP_ERR_UNKNOWN: | |
9a76bd78 | 206 | error_setg(errp, "Requested export not available"); |
f95910fe DB |
207 | break; |
208 | ||
b6f5d3b5 | 209 | case NBD_REP_ERR_SHUTDOWN: |
28fb494f | 210 | error_setg(errp, "Server shutting down before option %" PRIu32 " (%s)", |
3736cc5b EB |
211 | reply->option, nbd_opt_lookup(reply->option)); |
212 | break; | |
213 | ||
214 | case NBD_REP_ERR_BLOCK_SIZE_REQD: | |
28fb494f | 215 | error_setg(errp, "Server requires INFO_BLOCK_SIZE for option %" PRIu32 |
3736cc5b | 216 | " (%s)", reply->option, nbd_opt_lookup(reply->option)); |
b6f5d3b5 EB |
217 | break; |
218 | ||
9344e5f5 | 219 | default: |
28fb494f | 220 | error_setg(errp, "Unknown error code when asking for option %" PRIu32 |
3736cc5b | 221 | " (%s)", reply->option, nbd_opt_lookup(reply->option)); |
9344e5f5 DB |
222 | break; |
223 | } | |
224 | ||
6ff58164 | 225 | if (msg) { |
9a76bd78 | 226 | error_append_hint(errp, "server reported: %s\n", msg); |
6ff58164 AB |
227 | } |
228 | ||
229 | cleanup: | |
230 | g_free(msg); | |
2cdbf413 EB |
231 | if (result < 0) { |
232 | nbd_send_opt_abort(ioc); | |
233 | } | |
6ff58164 | 234 | return result; |
9344e5f5 DB |
235 | } |
236 | ||
091d0bf3 EB |
237 | /* nbd_receive_list: |
238 | * Process another portion of the NBD_OPT_LIST reply, populating any | |
239 | * name received into *@name. If @description is non-NULL, and the | |
240 | * server provided a description, that is also populated. The caller | |
241 | * must eventually call g_free() on success. | |
242 | * Returns 1 if name and description were set and iteration must continue, | |
243 | * 0 if iteration is complete (including if OPT_LIST unsupported), | |
244 | * -1 with @errp set if an unrecoverable error occurred. | |
245 | */ | |
246 | static int nbd_receive_list(QIOChannel *ioc, char **name, char **description, | |
75368aab | 247 | Error **errp) |
9344e5f5 | 248 | { |
091d0bf3 | 249 | int ret = -1; |
420a4e95 | 250 | NBDOptionReply reply; |
9344e5f5 DB |
251 | uint32_t len; |
252 | uint32_t namelen; | |
091d0bf3 EB |
253 | char *local_name = NULL; |
254 | char *local_desc = NULL; | |
6ff58164 | 255 | int error; |
9344e5f5 | 256 | |
c8a3a1b6 | 257 | if (nbd_receive_option_reply(ioc, NBD_OPT_LIST, &reply, errp) < 0) { |
9344e5f5 DB |
258 | return -1; |
259 | } | |
c8a3a1b6 | 260 | error = nbd_handle_reply_err(ioc, &reply, errp); |
6ff58164 AB |
261 | if (error <= 0) { |
262 | return error; | |
9344e5f5 | 263 | } |
c8a3a1b6 | 264 | len = reply.length; |
9344e5f5 | 265 | |
c8a3a1b6 | 266 | if (reply.type == NBD_REP_ACK) { |
9344e5f5 DB |
267 | if (len != 0) { |
268 | error_setg(errp, "length too long for option end"); | |
2cdbf413 | 269 | nbd_send_opt_abort(ioc); |
9344e5f5 DB |
270 | return -1; |
271 | } | |
75368aab EB |
272 | return 0; |
273 | } else if (reply.type != NBD_REP_SERVER) { | |
6c5c0351 EB |
274 | error_setg(errp, "Unexpected reply type %u (%s), expected %u (%s)", |
275 | reply.type, nbd_rep_lookup(reply.type), | |
276 | NBD_REP_SERVER, nbd_rep_lookup(NBD_REP_SERVER)); | |
75368aab EB |
277 | nbd_send_opt_abort(ioc); |
278 | return -1; | |
279 | } | |
9344e5f5 | 280 | |
75368aab EB |
281 | if (len < sizeof(namelen) || len > NBD_MAX_BUFFER_SIZE) { |
282 | error_setg(errp, "incorrect option length %" PRIu32, len); | |
283 | nbd_send_opt_abort(ioc); | |
284 | return -1; | |
285 | } | |
d1fdf257 | 286 | if (nbd_read(ioc, &namelen, sizeof(namelen), errp) < 0) { |
cb6b1a3f | 287 | error_prepend(errp, "failed to read option name length: "); |
75368aab EB |
288 | nbd_send_opt_abort(ioc); |
289 | return -1; | |
290 | } | |
291 | namelen = be32_to_cpu(namelen); | |
292 | len -= sizeof(namelen); | |
293 | if (len < namelen) { | |
294 | error_setg(errp, "incorrect option name length"); | |
295 | nbd_send_opt_abort(ioc); | |
296 | return -1; | |
297 | } | |
75368aab | 298 | |
091d0bf3 EB |
299 | local_name = g_malloc(namelen + 1); |
300 | if (nbd_read(ioc, local_name, namelen, errp) < 0) { | |
cb6b1a3f | 301 | error_prepend(errp, "failed to read export name: "); |
75368aab | 302 | nbd_send_opt_abort(ioc); |
091d0bf3 | 303 | goto out; |
75368aab | 304 | } |
091d0bf3 | 305 | local_name[namelen] = '\0'; |
75368aab | 306 | len -= namelen; |
091d0bf3 EB |
307 | if (len) { |
308 | local_desc = g_malloc(len + 1); | |
309 | if (nbd_read(ioc, local_desc, len, errp) < 0) { | |
310 | error_prepend(errp, "failed to read export description: "); | |
311 | nbd_send_opt_abort(ioc); | |
312 | goto out; | |
313 | } | |
314 | local_desc[len] = '\0'; | |
9344e5f5 | 315 | } |
091d0bf3 EB |
316 | |
317 | trace_nbd_receive_list(local_name, local_desc ?: ""); | |
318 | *name = local_name; | |
319 | local_name = NULL; | |
320 | if (description) { | |
321 | *description = local_desc; | |
322 | local_desc = NULL; | |
75368aab | 323 | } |
091d0bf3 EB |
324 | ret = 1; |
325 | ||
326 | out: | |
327 | g_free(local_name); | |
328 | g_free(local_desc); | |
329 | return ret; | |
9344e5f5 DB |
330 | } |
331 | ||
332 | ||
6dc1667d | 333 | /* Returns -1 if NBD_OPT_GO proves the export @info->name cannot be |
8ecaeae8 EB |
334 | * used, 0 if NBD_OPT_GO is unsupported (fall back to NBD_OPT_LIST and |
335 | * NBD_OPT_EXPORT_NAME in that case), and > 0 if the export is good to | |
6dc1667d EB |
336 | * go (with the rest of @info populated). */ |
337 | static int nbd_opt_go(QIOChannel *ioc, NBDExportInfo *info, Error **errp) | |
8ecaeae8 | 338 | { |
420a4e95 | 339 | NBDOptionReply reply; |
6dc1667d | 340 | uint32_t len = strlen(info->name); |
8ecaeae8 EB |
341 | uint16_t type; |
342 | int error; | |
343 | char *buf; | |
344 | ||
345 | /* The protocol requires that the server send NBD_INFO_EXPORT with | |
346 | * a non-zero flags (at least NBD_FLAG_HAS_FLAGS must be set); so | |
347 | * flags still 0 is a witness of a broken server. */ | |
348 | info->flags = 0; | |
349 | ||
6dc1667d | 350 | trace_nbd_opt_go_start(info->name); |
081dd1fe | 351 | buf = g_malloc(4 + len + 2 + 2 * info->request_sizes + 1); |
8ecaeae8 | 352 | stl_be_p(buf, len); |
6dc1667d | 353 | memcpy(buf + 4, info->name, len); |
081dd1fe EB |
354 | /* At most one request, everything else up to server */ |
355 | stw_be_p(buf + 4 + len, info->request_sizes); | |
356 | if (info->request_sizes) { | |
357 | stw_be_p(buf + 4 + len + 2, NBD_INFO_BLOCK_SIZE); | |
358 | } | |
158b9aa5 PMD |
359 | error = nbd_send_option_request(ioc, NBD_OPT_GO, |
360 | 4 + len + 2 + 2 * info->request_sizes, | |
361 | buf, errp); | |
362 | g_free(buf); | |
363 | if (error < 0) { | |
8ecaeae8 EB |
364 | return -1; |
365 | } | |
366 | ||
367 | while (1) { | |
368 | if (nbd_receive_option_reply(ioc, NBD_OPT_GO, &reply, errp) < 0) { | |
369 | return -1; | |
370 | } | |
371 | error = nbd_handle_reply_err(ioc, &reply, errp); | |
372 | if (error <= 0) { | |
373 | return error; | |
374 | } | |
375 | len = reply.length; | |
376 | ||
377 | if (reply.type == NBD_REP_ACK) { | |
378 | /* Server is done sending info and moved into transmission | |
379 | phase, but make sure it sent flags */ | |
380 | if (len) { | |
381 | error_setg(errp, "server sent invalid NBD_REP_ACK"); | |
8ecaeae8 EB |
382 | return -1; |
383 | } | |
384 | if (!info->flags) { | |
385 | error_setg(errp, "broken server omitted NBD_INFO_EXPORT"); | |
8ecaeae8 EB |
386 | return -1; |
387 | } | |
388 | trace_nbd_opt_go_success(); | |
389 | return 1; | |
390 | } | |
391 | if (reply.type != NBD_REP_INFO) { | |
6c5c0351 EB |
392 | error_setg(errp, "unexpected reply type %u (%s), expected %u (%s)", |
393 | reply.type, nbd_rep_lookup(reply.type), | |
394 | NBD_REP_INFO, nbd_rep_lookup(NBD_REP_INFO)); | |
8ecaeae8 EB |
395 | nbd_send_opt_abort(ioc); |
396 | return -1; | |
397 | } | |
398 | if (len < sizeof(type)) { | |
399 | error_setg(errp, "NBD_REP_INFO length %" PRIu32 " is too short", | |
400 | len); | |
401 | nbd_send_opt_abort(ioc); | |
402 | return -1; | |
403 | } | |
404 | if (nbd_read(ioc, &type, sizeof(type), errp) < 0) { | |
cb6b1a3f | 405 | error_prepend(errp, "failed to read info type: "); |
8ecaeae8 EB |
406 | nbd_send_opt_abort(ioc); |
407 | return -1; | |
408 | } | |
409 | len -= sizeof(type); | |
80c7c2b0 | 410 | type = be16_to_cpu(type); |
8ecaeae8 EB |
411 | switch (type) { |
412 | case NBD_INFO_EXPORT: | |
413 | if (len != sizeof(info->size) + sizeof(info->flags)) { | |
414 | error_setg(errp, "remaining export info len %" PRIu32 | |
415 | " is unexpected size", len); | |
416 | nbd_send_opt_abort(ioc); | |
417 | return -1; | |
418 | } | |
419 | if (nbd_read(ioc, &info->size, sizeof(info->size), errp) < 0) { | |
cb6b1a3f | 420 | error_prepend(errp, "failed to read info size: "); |
8ecaeae8 EB |
421 | nbd_send_opt_abort(ioc); |
422 | return -1; | |
423 | } | |
80c7c2b0 | 424 | info->size = be64_to_cpu(info->size); |
8ecaeae8 | 425 | if (nbd_read(ioc, &info->flags, sizeof(info->flags), errp) < 0) { |
cb6b1a3f | 426 | error_prepend(errp, "failed to read info flags: "); |
8ecaeae8 EB |
427 | nbd_send_opt_abort(ioc); |
428 | return -1; | |
429 | } | |
80c7c2b0 | 430 | info->flags = be16_to_cpu(info->flags); |
8ecaeae8 EB |
431 | trace_nbd_receive_negotiate_size_flags(info->size, info->flags); |
432 | break; | |
433 | ||
081dd1fe EB |
434 | case NBD_INFO_BLOCK_SIZE: |
435 | if (len != sizeof(info->min_block) * 3) { | |
436 | error_setg(errp, "remaining export info len %" PRIu32 | |
437 | " is unexpected size", len); | |
438 | nbd_send_opt_abort(ioc); | |
439 | return -1; | |
440 | } | |
441 | if (nbd_read(ioc, &info->min_block, sizeof(info->min_block), | |
442 | errp) < 0) { | |
cb6b1a3f | 443 | error_prepend(errp, "failed to read info minimum block size: "); |
081dd1fe EB |
444 | nbd_send_opt_abort(ioc); |
445 | return -1; | |
446 | } | |
80c7c2b0 | 447 | info->min_block = be32_to_cpu(info->min_block); |
081dd1fe | 448 | if (!is_power_of_2(info->min_block)) { |
e475d108 EB |
449 | error_setg(errp, "server minimum block size %" PRIu32 |
450 | " is not a power of two", info->min_block); | |
081dd1fe EB |
451 | nbd_send_opt_abort(ioc); |
452 | return -1; | |
453 | } | |
454 | if (nbd_read(ioc, &info->opt_block, sizeof(info->opt_block), | |
455 | errp) < 0) { | |
cb6b1a3f EB |
456 | error_prepend(errp, |
457 | "failed to read info preferred block size: "); | |
081dd1fe EB |
458 | nbd_send_opt_abort(ioc); |
459 | return -1; | |
460 | } | |
80c7c2b0 | 461 | info->opt_block = be32_to_cpu(info->opt_block); |
081dd1fe EB |
462 | if (!is_power_of_2(info->opt_block) || |
463 | info->opt_block < info->min_block) { | |
e475d108 EB |
464 | error_setg(errp, "server preferred block size %" PRIu32 |
465 | " is not valid", info->opt_block); | |
081dd1fe EB |
466 | nbd_send_opt_abort(ioc); |
467 | return -1; | |
468 | } | |
469 | if (nbd_read(ioc, &info->max_block, sizeof(info->max_block), | |
470 | errp) < 0) { | |
cb6b1a3f | 471 | error_prepend(errp, "failed to read info maximum block size: "); |
081dd1fe EB |
472 | nbd_send_opt_abort(ioc); |
473 | return -1; | |
474 | } | |
80c7c2b0 | 475 | info->max_block = be32_to_cpu(info->max_block); |
e475d108 EB |
476 | if (info->max_block < info->min_block) { |
477 | error_setg(errp, "server maximum block size %" PRIu32 | |
478 | " is not valid", info->max_block); | |
479 | nbd_send_opt_abort(ioc); | |
480 | return -1; | |
481 | } | |
081dd1fe EB |
482 | trace_nbd_opt_go_info_block_size(info->min_block, info->opt_block, |
483 | info->max_block); | |
484 | break; | |
485 | ||
8ecaeae8 EB |
486 | default: |
487 | trace_nbd_opt_go_info_unknown(type, nbd_info_lookup(type)); | |
488 | if (nbd_drop(ioc, len, errp) < 0) { | |
cb6b1a3f | 489 | error_prepend(errp, "Failed to read info payload: "); |
8ecaeae8 EB |
490 | nbd_send_opt_abort(ioc); |
491 | return -1; | |
492 | } | |
493 | break; | |
494 | } | |
495 | } | |
496 | } | |
497 | ||
75368aab | 498 | /* Return -1 on failure, 0 if wantname is an available export. */ |
9344e5f5 DB |
499 | static int nbd_receive_query_exports(QIOChannel *ioc, |
500 | const char *wantname, | |
501 | Error **errp) | |
502 | { | |
091d0bf3 EB |
503 | bool list_empty = true; |
504 | bool found_export = false; | |
9344e5f5 | 505 | |
9588463e | 506 | trace_nbd_receive_query_exports_start(wantname); |
c8a3a1b6 | 507 | if (nbd_send_option_request(ioc, NBD_OPT_LIST, 0, NULL, errp) < 0) { |
9344e5f5 DB |
508 | return -1; |
509 | } | |
510 | ||
9344e5f5 | 511 | while (1) { |
091d0bf3 EB |
512 | char *name; |
513 | int ret = nbd_receive_list(ioc, &name, NULL, errp); | |
9344e5f5 DB |
514 | |
515 | if (ret < 0) { | |
75368aab | 516 | /* Server gave unexpected reply */ |
9344e5f5 | 517 | return -1; |
75368aab EB |
518 | } else if (ret == 0) { |
519 | /* Done iterating. */ | |
091d0bf3 EB |
520 | if (list_empty) { |
521 | /* | |
522 | * We don't have enough context to tell a server that | |
523 | * sent an empty list apart from a server that does | |
524 | * not support the list command; but as this function | |
525 | * is just used to trigger a nicer error message | |
526 | * before trying NBD_OPT_EXPORT_NAME, assume the | |
527 | * export is available. | |
528 | */ | |
529 | return 0; | |
530 | } else if (!found_export) { | |
75368aab EB |
531 | error_setg(errp, "No export with name '%s' available", |
532 | wantname); | |
533 | nbd_send_opt_abort(ioc); | |
534 | return -1; | |
535 | } | |
9588463e | 536 | trace_nbd_receive_query_exports_success(wantname); |
75368aab | 537 | return 0; |
9344e5f5 | 538 | } |
091d0bf3 EB |
539 | list_empty = false; |
540 | if (!strcmp(name, wantname)) { | |
541 | found_export = true; | |
542 | } | |
543 | g_free(name); | |
9344e5f5 | 544 | } |
9344e5f5 DB |
545 | } |
546 | ||
d795299b VSO |
547 | /* nbd_request_simple_option: Send an option request, and parse the reply |
548 | * return 1 for successful negotiation, | |
549 | * 0 if operation is unsupported, | |
550 | * -1 with errp set for any other error | |
551 | */ | |
552 | static int nbd_request_simple_option(QIOChannel *ioc, int opt, Error **errp) | |
f95910fe | 553 | { |
420a4e95 | 554 | NBDOptionReply reply; |
d795299b | 555 | int error; |
f95910fe | 556 | |
d795299b VSO |
557 | if (nbd_send_option_request(ioc, opt, 0, NULL, errp) < 0) { |
558 | return -1; | |
f95910fe DB |
559 | } |
560 | ||
d795299b VSO |
561 | if (nbd_receive_option_reply(ioc, opt, &reply, errp) < 0) { |
562 | return -1; | |
563 | } | |
564 | error = nbd_handle_reply_err(ioc, &reply, errp); | |
565 | if (error <= 0) { | |
566 | return error; | |
f95910fe | 567 | } |
c8a3a1b6 EB |
568 | |
569 | if (reply.type != NBD_REP_ACK) { | |
d795299b | 570 | error_setg(errp, "Server answered option %d (%s) with unexpected " |
28fb494f | 571 | "reply %" PRIu32 " (%s)", opt, nbd_opt_lookup(opt), |
d795299b | 572 | reply.type, nbd_rep_lookup(reply.type)); |
2cdbf413 | 573 | nbd_send_opt_abort(ioc); |
d795299b | 574 | return -1; |
f95910fe DB |
575 | } |
576 | ||
c8a3a1b6 | 577 | if (reply.length != 0) { |
d795299b VSO |
578 | error_setg(errp, "Option %d ('%s') response length is %" PRIu32 |
579 | " (it should be zero)", opt, nbd_opt_lookup(opt), | |
c8a3a1b6 | 580 | reply.length); |
2cdbf413 | 581 | nbd_send_opt_abort(ioc); |
d795299b VSO |
582 | return -1; |
583 | } | |
584 | ||
585 | return 1; | |
586 | } | |
587 | ||
588 | static QIOChannel *nbd_receive_starttls(QIOChannel *ioc, | |
589 | QCryptoTLSCreds *tlscreds, | |
590 | const char *hostname, Error **errp) | |
591 | { | |
592 | int ret; | |
593 | QIOChannelTLS *tioc; | |
594 | struct NBDTLSHandshakeData data = { 0 }; | |
595 | ||
596 | ret = nbd_request_simple_option(ioc, NBD_OPT_STARTTLS, errp); | |
597 | if (ret <= 0) { | |
598 | if (ret == 0) { | |
599 | error_setg(errp, "Server don't support STARTTLS option"); | |
600 | nbd_send_opt_abort(ioc); | |
601 | } | |
f95910fe DB |
602 | return NULL; |
603 | } | |
604 | ||
9588463e | 605 | trace_nbd_receive_starttls_new_client(); |
f95910fe DB |
606 | tioc = qio_channel_tls_new_client(ioc, tlscreds, hostname, errp); |
607 | if (!tioc) { | |
608 | return NULL; | |
609 | } | |
0d73f725 | 610 | qio_channel_set_name(QIO_CHANNEL(tioc), "nbd-client-tls"); |
f95910fe | 611 | data.loop = g_main_loop_new(g_main_context_default(), FALSE); |
9588463e | 612 | trace_nbd_receive_starttls_tls_handshake(); |
f95910fe DB |
613 | qio_channel_tls_handshake(tioc, |
614 | nbd_tls_handshake, | |
615 | &data, | |
1939ccda | 616 | NULL, |
f95910fe DB |
617 | NULL); |
618 | ||
619 | if (!data.complete) { | |
620 | g_main_loop_run(data.loop); | |
621 | } | |
622 | g_main_loop_unref(data.loop); | |
623 | if (data.error) { | |
624 | error_propagate(errp, data.error); | |
625 | object_unref(OBJECT(tioc)); | |
626 | return NULL; | |
627 | } | |
628 | ||
629 | return QIO_CHANNEL(tioc); | |
630 | } | |
631 | ||
757b3ab9 EB |
632 | /* |
633 | * nbd_send_meta_query: | |
634 | * Send 0 or 1 set/list meta context queries. | |
635 | * Return 0 on success, -1 with errp set for any error | |
636 | */ | |
637 | static int nbd_send_meta_query(QIOChannel *ioc, uint32_t opt, | |
638 | const char *export, const char *query, | |
639 | Error **errp) | |
640 | { | |
641 | int ret; | |
642 | uint32_t export_len = strlen(export); | |
643 | uint32_t queries = !!query; | |
644 | uint32_t query_len = 0; | |
645 | uint32_t data_len; | |
646 | char *data; | |
647 | char *p; | |
648 | ||
649 | data_len = sizeof(export_len) + export_len + sizeof(queries); | |
650 | if (query) { | |
651 | query_len = strlen(query); | |
652 | data_len += sizeof(query_len) + query_len; | |
653 | } else { | |
654 | assert(opt == NBD_OPT_LIST_META_CONTEXT); | |
655 | } | |
656 | p = data = g_malloc(data_len); | |
657 | ||
658 | trace_nbd_opt_meta_request(nbd_opt_lookup(opt), query ?: "(all)", export); | |
659 | stl_be_p(p, export_len); | |
660 | memcpy(p += sizeof(export_len), export, export_len); | |
661 | stl_be_p(p += export_len, queries); | |
662 | if (query) { | |
663 | stl_be_p(p += sizeof(queries), query_len); | |
664 | memcpy(p += sizeof(query_len), query, query_len); | |
665 | } | |
666 | ||
667 | ret = nbd_send_option_request(ioc, opt, data_len, data, errp); | |
668 | g_free(data); | |
669 | return ret; | |
670 | } | |
671 | ||
0182c1ae EB |
672 | /* |
673 | * nbd_receive_one_meta_context: | |
674 | * Called in a loop to receive and trace one set/list meta context reply. | |
675 | * Pass non-NULL @name or @id to collect results back to the caller, which | |
676 | * must eventually call g_free(). | |
677 | * return 1 if name is set and iteration must continue, | |
678 | * 0 if iteration is complete (including if option is unsupported), | |
679 | * -1 with errp set for any error | |
680 | */ | |
681 | static int nbd_receive_one_meta_context(QIOChannel *ioc, | |
682 | uint32_t opt, | |
683 | char **name, | |
684 | uint32_t *id, | |
685 | Error **errp) | |
686 | { | |
687 | int ret; | |
688 | NBDOptionReply reply; | |
689 | char *local_name = NULL; | |
690 | uint32_t local_id; | |
691 | ||
692 | if (nbd_receive_option_reply(ioc, opt, &reply, errp) < 0) { | |
693 | return -1; | |
694 | } | |
695 | ||
696 | ret = nbd_handle_reply_err(ioc, &reply, errp); | |
697 | if (ret <= 0) { | |
698 | return ret; | |
699 | } | |
700 | ||
701 | if (reply.type == NBD_REP_ACK) { | |
702 | if (reply.length != 0) { | |
703 | error_setg(errp, "Unexpected length to ACK response"); | |
704 | nbd_send_opt_abort(ioc); | |
705 | return -1; | |
706 | } | |
707 | return 0; | |
708 | } else if (reply.type != NBD_REP_META_CONTEXT) { | |
709 | error_setg(errp, "Unexpected reply type %u (%s), expected %u (%s)", | |
710 | reply.type, nbd_rep_lookup(reply.type), | |
711 | NBD_REP_META_CONTEXT, nbd_rep_lookup(NBD_REP_META_CONTEXT)); | |
712 | nbd_send_opt_abort(ioc); | |
713 | return -1; | |
714 | } | |
715 | ||
716 | if (reply.length <= sizeof(local_id) || | |
717 | reply.length > NBD_MAX_BUFFER_SIZE) { | |
718 | error_setg(errp, "Failed to negotiate meta context, server " | |
719 | "answered with unexpected length %" PRIu32, | |
720 | reply.length); | |
721 | nbd_send_opt_abort(ioc); | |
722 | return -1; | |
723 | } | |
724 | ||
725 | if (nbd_read(ioc, &local_id, sizeof(local_id), errp) < 0) { | |
726 | return -1; | |
727 | } | |
728 | local_id = be32_to_cpu(local_id); | |
729 | ||
730 | reply.length -= sizeof(local_id); | |
731 | local_name = g_malloc(reply.length + 1); | |
732 | if (nbd_read(ioc, local_name, reply.length, errp) < 0) { | |
733 | g_free(local_name); | |
734 | return -1; | |
735 | } | |
736 | local_name[reply.length] = '\0'; | |
737 | trace_nbd_opt_meta_reply(nbd_opt_lookup(opt), local_name, local_id); | |
738 | ||
739 | if (name) { | |
740 | *name = local_name; | |
741 | } else { | |
742 | g_free(local_name); | |
743 | } | |
744 | if (id) { | |
745 | *id = local_id; | |
746 | } | |
747 | return 1; | |
748 | } | |
749 | ||
750 | /* | |
751 | * nbd_negotiate_simple_meta_context: | |
2df94eb5 EB |
752 | * Request the server to set the meta context for export @info->name |
753 | * using @info->x_dirty_bitmap with a fallback to "base:allocation", | |
754 | * setting @info->context_id to the resulting id. Fail if the server | |
755 | * responds with more than one context or with a context different | |
756 | * than the query. | |
757 | * return 1 for successful negotiation, | |
78a33ab5 VSO |
758 | * 0 if operation is unsupported, |
759 | * -1 with errp set for any other error | |
760 | */ | |
761 | static int nbd_negotiate_simple_meta_context(QIOChannel *ioc, | |
2df94eb5 | 762 | NBDExportInfo *info, |
78a33ab5 VSO |
763 | Error **errp) |
764 | { | |
2df94eb5 EB |
765 | /* |
766 | * TODO: Removing the x_dirty_bitmap hack will mean refactoring | |
767 | * this function to request and store ids for multiple contexts | |
768 | * (both base:allocation and a dirty bitmap), at which point this | |
769 | * function should lose the term _simple. | |
770 | */ | |
78a33ab5 | 771 | int ret; |
2df94eb5 | 772 | const char *context = info->x_dirty_bitmap ?: "base:allocation"; |
89aa0d87 | 773 | bool received = false; |
0182c1ae | 774 | char *name = NULL; |
78a33ab5 | 775 | |
757b3ab9 EB |
776 | if (nbd_send_meta_query(ioc, NBD_OPT_SET_META_CONTEXT, |
777 | info->name, context, errp) < 0) { | |
778 | return -1; | |
78a33ab5 VSO |
779 | } |
780 | ||
0182c1ae EB |
781 | ret = nbd_receive_one_meta_context(ioc, NBD_OPT_SET_META_CONTEXT, |
782 | &name, &info->context_id, errp); | |
783 | if (ret < 0) { | |
78a33ab5 VSO |
784 | return -1; |
785 | } | |
0182c1ae | 786 | if (ret == 1) { |
78a33ab5 VSO |
787 | if (strcmp(context, name)) { |
788 | error_setg(errp, "Failed to negotiate meta context '%s', server " | |
789 | "answered with different context '%s'", context, | |
790 | name); | |
791 | g_free(name); | |
260e34db | 792 | nbd_send_opt_abort(ioc); |
78a33ab5 VSO |
793 | return -1; |
794 | } | |
795 | g_free(name); | |
78a33ab5 VSO |
796 | received = true; |
797 | ||
0182c1ae EB |
798 | ret = nbd_receive_one_meta_context(ioc, NBD_OPT_SET_META_CONTEXT, |
799 | NULL, NULL, errp); | |
800 | if (ret < 0) { | |
78a33ab5 VSO |
801 | return -1; |
802 | } | |
78a33ab5 | 803 | } |
0182c1ae EB |
804 | if (ret != 0) { |
805 | error_setg(errp, "Server answered with more than one context"); | |
260e34db EB |
806 | nbd_send_opt_abort(ioc); |
807 | return -1; | |
808 | } | |
2df94eb5 | 809 | return received; |
78a33ab5 | 810 | } |
f95910fe | 811 | |
6dc1667d EB |
812 | int nbd_receive_negotiate(QIOChannel *ioc, QCryptoTLSCreds *tlscreds, |
813 | const char *hostname, QIOChannel **outioc, | |
814 | NBDExportInfo *info, Error **errp) | |
798bfe00 | 815 | { |
004a89fc | 816 | uint64_t magic; |
c203c59a | 817 | bool zeroes = true; |
f140e300 | 818 | bool structured_reply = info->structured_reply; |
78a33ab5 | 819 | bool base_allocation = info->base_allocation; |
798bfe00 | 820 | |
9588463e | 821 | trace_nbd_receive_negotiate(tlscreds, hostname ? hostname : "<null>"); |
798bfe00 | 822 | |
6dc1667d EB |
823 | assert(info->name); |
824 | trace_nbd_receive_negotiate_name(info->name); | |
f140e300 | 825 | info->structured_reply = false; |
78a33ab5 | 826 | info->base_allocation = false; |
798bfe00 | 827 | |
f95910fe DB |
828 | if (outioc) { |
829 | *outioc = NULL; | |
830 | } | |
831 | if (tlscreds && !outioc) { | |
832 | error_setg(errp, "Output I/O channel required for TLS"); | |
2b8d0954 | 833 | return -EINVAL; |
f95910fe DB |
834 | } |
835 | ||
ef2e35fc EB |
836 | if (nbd_read(ioc, &magic, sizeof(magic), errp) < 0) { |
837 | error_prepend(errp, "Failed to read initial magic: "); | |
2b8d0954 | 838 | return -EINVAL; |
798bfe00 | 839 | } |
ef2e35fc | 840 | magic = be64_to_cpu(magic); |
9588463e | 841 | trace_nbd_receive_negotiate_magic(magic); |
798bfe00 | 842 | |
ef2e35fc EB |
843 | if (magic != NBD_INIT_MAGIC) { |
844 | error_setg(errp, "Bad initial magic received: 0x%" PRIx64, magic); | |
2b8d0954 | 845 | return -EINVAL; |
798bfe00 FZ |
846 | } |
847 | ||
d1fdf257 | 848 | if (nbd_read(ioc, &magic, sizeof(magic), errp) < 0) { |
ef2e35fc | 849 | error_prepend(errp, "Failed to read server magic: "); |
2b8d0954 | 850 | return -EINVAL; |
798bfe00 FZ |
851 | } |
852 | magic = be64_to_cpu(magic); | |
9588463e | 853 | trace_nbd_receive_negotiate_magic(magic); |
798bfe00 | 854 | |
f72d705f | 855 | if (magic == NBD_OPTS_MAGIC) { |
e2a9d9a3 | 856 | uint32_t clientflags = 0; |
e2a9d9a3 | 857 | uint16_t globalflags; |
9344e5f5 | 858 | bool fixedNewStyle = false; |
798bfe00 | 859 | |
d1fdf257 | 860 | if (nbd_read(ioc, &globalflags, sizeof(globalflags), errp) < 0) { |
cb6b1a3f | 861 | error_prepend(errp, "Failed to read server flags: "); |
2b8d0954 | 862 | return -EINVAL; |
798bfe00 | 863 | } |
9344e5f5 | 864 | globalflags = be16_to_cpu(globalflags); |
9588463e | 865 | trace_nbd_receive_negotiate_server_flags(globalflags); |
e2a9d9a3 | 866 | if (globalflags & NBD_FLAG_FIXED_NEWSTYLE) { |
9344e5f5 | 867 | fixedNewStyle = true; |
e2a9d9a3 DB |
868 | clientflags |= NBD_FLAG_C_FIXED_NEWSTYLE; |
869 | } | |
c203c59a EB |
870 | if (globalflags & NBD_FLAG_NO_ZEROES) { |
871 | zeroes = false; | |
c203c59a EB |
872 | clientflags |= NBD_FLAG_C_NO_ZEROES; |
873 | } | |
e2a9d9a3 | 874 | /* client requested flags */ |
9344e5f5 | 875 | clientflags = cpu_to_be32(clientflags); |
d1fdf257 | 876 | if (nbd_write(ioc, &clientflags, sizeof(clientflags), errp) < 0) { |
cb6b1a3f | 877 | error_prepend(errp, "Failed to send clientflags field: "); |
2b8d0954 | 878 | return -EINVAL; |
798bfe00 | 879 | } |
f95910fe DB |
880 | if (tlscreds) { |
881 | if (fixedNewStyle) { | |
882 | *outioc = nbd_receive_starttls(ioc, tlscreds, hostname, errp); | |
883 | if (!*outioc) { | |
2b8d0954 | 884 | return -EINVAL; |
f95910fe DB |
885 | } |
886 | ioc = *outioc; | |
887 | } else { | |
888 | error_setg(errp, "Server does not support STARTTLS"); | |
2b8d0954 | 889 | return -EINVAL; |
f95910fe DB |
890 | } |
891 | } | |
9344e5f5 | 892 | if (fixedNewStyle) { |
8ecaeae8 EB |
893 | int result; |
894 | ||
f140e300 VSO |
895 | if (structured_reply) { |
896 | result = nbd_request_simple_option(ioc, | |
897 | NBD_OPT_STRUCTURED_REPLY, | |
898 | errp); | |
899 | if (result < 0) { | |
2b8d0954 | 900 | return -EINVAL; |
f140e300 VSO |
901 | } |
902 | info->structured_reply = result == 1; | |
903 | } | |
904 | ||
78a33ab5 | 905 | if (info->structured_reply && base_allocation) { |
2df94eb5 | 906 | result = nbd_negotiate_simple_meta_context(ioc, info, errp); |
78a33ab5 | 907 | if (result < 0) { |
2b8d0954 | 908 | return -EINVAL; |
78a33ab5 VSO |
909 | } |
910 | info->base_allocation = result == 1; | |
911 | } | |
912 | ||
8ecaeae8 EB |
913 | /* Try NBD_OPT_GO first - if it works, we are done (it |
914 | * also gives us a good message if the server requires | |
915 | * TLS). If it is not available, fall back to | |
916 | * NBD_OPT_LIST for nicer error messages about a missing | |
917 | * export, then use NBD_OPT_EXPORT_NAME. */ | |
6dc1667d | 918 | result = nbd_opt_go(ioc, info, errp); |
8ecaeae8 | 919 | if (result < 0) { |
2b8d0954 | 920 | return -EINVAL; |
8ecaeae8 EB |
921 | } |
922 | if (result > 0) { | |
923 | return 0; | |
924 | } | |
9344e5f5 DB |
925 | /* Check our desired export is present in the |
926 | * server export list. Since NBD_OPT_EXPORT_NAME | |
927 | * cannot return an error message, running this | |
8ecaeae8 EB |
928 | * query gives us better error reporting if the |
929 | * export name is not available. | |
9344e5f5 | 930 | */ |
6dc1667d | 931 | if (nbd_receive_query_exports(ioc, info->name, errp) < 0) { |
2b8d0954 | 932 | return -EINVAL; |
9344e5f5 DB |
933 | } |
934 | } | |
c8a3a1b6 | 935 | /* write the export name request */ |
6dc1667d | 936 | if (nbd_send_option_request(ioc, NBD_OPT_EXPORT_NAME, -1, info->name, |
c8a3a1b6 | 937 | errp) < 0) { |
2b8d0954 | 938 | return -EINVAL; |
798bfe00 | 939 | } |
f72d705f | 940 | |
c8a3a1b6 | 941 | /* Read the response */ |
004a89fc | 942 | if (nbd_read(ioc, &info->size, sizeof(info->size), errp) < 0) { |
cb6b1a3f | 943 | error_prepend(errp, "Failed to read export length: "); |
2b8d0954 | 944 | return -EINVAL; |
798bfe00 | 945 | } |
80c7c2b0 | 946 | info->size = be64_to_cpu(info->size); |
798bfe00 | 947 | |
004a89fc | 948 | if (nbd_read(ioc, &info->flags, sizeof(info->flags), errp) < 0) { |
cb6b1a3f | 949 | error_prepend(errp, "Failed to read export flags: "); |
2b8d0954 | 950 | return -EINVAL; |
f72d705f | 951 | } |
80c7c2b0 | 952 | info->flags = be16_to_cpu(info->flags); |
f72d705f | 953 | } else if (magic == NBD_CLIENT_MAGIC) { |
7423f417 EB |
954 | uint32_t oldflags; |
955 | ||
6dc1667d EB |
956 | if (*info->name) { |
957 | error_setg(errp, "Server does not support non-empty export names"); | |
2b8d0954 | 958 | return -EINVAL; |
f72d705f | 959 | } |
f95910fe DB |
960 | if (tlscreds) { |
961 | error_setg(errp, "Server does not support STARTTLS"); | |
2b8d0954 | 962 | return -EINVAL; |
f95910fe | 963 | } |
f72d705f | 964 | |
004a89fc | 965 | if (nbd_read(ioc, &info->size, sizeof(info->size), errp) < 0) { |
cb6b1a3f | 966 | error_prepend(errp, "Failed to read export length: "); |
2b8d0954 | 967 | return -EINVAL; |
f72d705f | 968 | } |
80c7c2b0 | 969 | info->size = be64_to_cpu(info->size); |
798bfe00 | 970 | |
d1fdf257 | 971 | if (nbd_read(ioc, &oldflags, sizeof(oldflags), errp) < 0) { |
cb6b1a3f | 972 | error_prepend(errp, "Failed to read export flags: "); |
2b8d0954 | 973 | return -EINVAL; |
798bfe00 | 974 | } |
80c7c2b0 | 975 | oldflags = be32_to_cpu(oldflags); |
7423f417 EB |
976 | if (oldflags & ~0xffff) { |
977 | error_setg(errp, "Unexpected export flags %0x" PRIx32, oldflags); | |
2b8d0954 | 978 | return -EINVAL; |
7423f417 | 979 | } |
004a89fc | 980 | info->flags = oldflags; |
798bfe00 | 981 | } else { |
ef2e35fc | 982 | error_setg(errp, "Bad server magic received: 0x%" PRIx64, magic); |
2b8d0954 | 983 | return -EINVAL; |
798bfe00 | 984 | } |
f72d705f | 985 | |
004a89fc | 986 | trace_nbd_receive_negotiate_size_flags(info->size, info->flags); |
d1fdf257 | 987 | if (zeroes && nbd_drop(ioc, 124, errp) < 0) { |
cb6b1a3f | 988 | error_prepend(errp, "Failed to read reserved block: "); |
2b8d0954 | 989 | return -EINVAL; |
798bfe00 | 990 | } |
2b8d0954 | 991 | return 0; |
798bfe00 FZ |
992 | } |
993 | ||
994 | #ifdef __linux__ | |
004a89fc | 995 | int nbd_init(int fd, QIOChannelSocket *sioc, NBDExportInfo *info, |
be41c100 | 996 | Error **errp) |
798bfe00 | 997 | { |
081dd1fe EB |
998 | unsigned long sector_size = MAX(BDRV_SECTOR_SIZE, info->min_block); |
999 | unsigned long sectors = info->size / sector_size; | |
1000 | ||
1001 | /* FIXME: Once the kernel module is patched to honor block sizes, | |
1002 | * and to advertise that fact to user space, we should update the | |
1003 | * hand-off to the kernel to use any block sizes we learned. */ | |
1004 | assert(!info->request_sizes); | |
1005 | if (info->size / sector_size != sectors) { | |
004a89fc EB |
1006 | error_setg(errp, "Export size %" PRIu64 " too large for 32-bit kernel", |
1007 | info->size); | |
f57e2416 EB |
1008 | return -E2BIG; |
1009 | } | |
1010 | ||
9588463e | 1011 | trace_nbd_init_set_socket(); |
798bfe00 | 1012 | |
f57e2416 | 1013 | if (ioctl(fd, NBD_SET_SOCK, (unsigned long) sioc->fd) < 0) { |
798bfe00 | 1014 | int serrno = errno; |
be41c100 | 1015 | error_setg(errp, "Failed to set NBD socket"); |
798bfe00 FZ |
1016 | return -serrno; |
1017 | } | |
1018 | ||
081dd1fe | 1019 | trace_nbd_init_set_block_size(sector_size); |
798bfe00 | 1020 | |
081dd1fe | 1021 | if (ioctl(fd, NBD_SET_BLKSIZE, sector_size) < 0) { |
798bfe00 | 1022 | int serrno = errno; |
be41c100 | 1023 | error_setg(errp, "Failed setting NBD block size"); |
798bfe00 FZ |
1024 | return -serrno; |
1025 | } | |
1026 | ||
9588463e | 1027 | trace_nbd_init_set_size(sectors); |
081dd1fe EB |
1028 | if (info->size % sector_size) { |
1029 | trace_nbd_init_trailing_bytes(info->size % sector_size); | |
f57e2416 | 1030 | } |
798bfe00 | 1031 | |
f57e2416 | 1032 | if (ioctl(fd, NBD_SET_SIZE_BLOCKS, sectors) < 0) { |
798bfe00 | 1033 | int serrno = errno; |
be41c100 | 1034 | error_setg(errp, "Failed setting size (in blocks)"); |
798bfe00 FZ |
1035 | return -serrno; |
1036 | } | |
1037 | ||
004a89fc | 1038 | if (ioctl(fd, NBD_SET_FLAGS, (unsigned long) info->flags) < 0) { |
798bfe00 | 1039 | if (errno == ENOTTY) { |
004a89fc | 1040 | int read_only = (info->flags & NBD_FLAG_READ_ONLY) != 0; |
9588463e | 1041 | trace_nbd_init_set_readonly(); |
798bfe00 FZ |
1042 | |
1043 | if (ioctl(fd, BLKROSET, (unsigned long) &read_only) < 0) { | |
1044 | int serrno = errno; | |
be41c100 | 1045 | error_setg(errp, "Failed setting read-only attribute"); |
798bfe00 FZ |
1046 | return -serrno; |
1047 | } | |
1048 | } else { | |
1049 | int serrno = errno; | |
be41c100 | 1050 | error_setg(errp, "Failed setting flags"); |
798bfe00 FZ |
1051 | return -serrno; |
1052 | } | |
1053 | } | |
1054 | ||
9588463e | 1055 | trace_nbd_init_finish(); |
798bfe00 FZ |
1056 | |
1057 | return 0; | |
1058 | } | |
1059 | ||
1060 | int nbd_client(int fd) | |
1061 | { | |
1062 | int ret; | |
1063 | int serrno; | |
1064 | ||
9588463e | 1065 | trace_nbd_client_loop(); |
798bfe00 FZ |
1066 | |
1067 | ret = ioctl(fd, NBD_DO_IT); | |
1068 | if (ret < 0 && errno == EPIPE) { | |
1069 | /* NBD_DO_IT normally returns EPIPE when someone has disconnected | |
1070 | * the socket via NBD_DISCONNECT. We do not want to return 1 in | |
1071 | * that case. | |
1072 | */ | |
1073 | ret = 0; | |
1074 | } | |
1075 | serrno = errno; | |
1076 | ||
9588463e | 1077 | trace_nbd_client_loop_ret(ret, strerror(serrno)); |
798bfe00 | 1078 | |
9588463e | 1079 | trace_nbd_client_clear_queue(); |
798bfe00 FZ |
1080 | ioctl(fd, NBD_CLEAR_QUE); |
1081 | ||
9588463e | 1082 | trace_nbd_client_clear_socket(); |
798bfe00 FZ |
1083 | ioctl(fd, NBD_CLEAR_SOCK); |
1084 | ||
1085 | errno = serrno; | |
1086 | return ret; | |
1087 | } | |
98494e3b EB |
1088 | |
1089 | int nbd_disconnect(int fd) | |
1090 | { | |
1091 | ioctl(fd, NBD_CLEAR_QUE); | |
1092 | ioctl(fd, NBD_DISCONNECT); | |
1093 | ioctl(fd, NBD_CLEAR_SOCK); | |
1094 | return 0; | |
1095 | } | |
1096 | ||
3c1fa35d | 1097 | #endif /* __linux__ */ |
798bfe00 | 1098 | |
490dc5ed | 1099 | int nbd_send_request(QIOChannel *ioc, NBDRequest *request) |
798bfe00 FZ |
1100 | { |
1101 | uint8_t buf[NBD_REQUEST_SIZE]; | |
798bfe00 | 1102 | |
9588463e | 1103 | trace_nbd_send_request(request->from, request->len, request->handle, |
48000eb3 EB |
1104 | request->flags, request->type, |
1105 | nbd_cmd_lookup(request->type)); | |
7548fe31 | 1106 | |
f6be6720 | 1107 | stl_be_p(buf, NBD_REQUEST_MAGIC); |
b626b51a EB |
1108 | stw_be_p(buf + 4, request->flags); |
1109 | stw_be_p(buf + 6, request->type); | |
f6be6720 PM |
1110 | stq_be_p(buf + 8, request->handle); |
1111 | stq_be_p(buf + 16, request->from); | |
1112 | stl_be_p(buf + 24, request->len); | |
798bfe00 | 1113 | |
d1fdf257 | 1114 | return nbd_write(ioc, buf, sizeof(buf), NULL); |
798bfe00 FZ |
1115 | } |
1116 | ||
d2febedb VSO |
1117 | /* nbd_receive_simple_reply |
1118 | * Read simple reply except magic field (which should be already read). | |
1119 | * Payload is not read (payload is possible for CMD_READ, but here we even | |
1120 | * don't know whether it take place or not). | |
1121 | */ | |
1122 | static int nbd_receive_simple_reply(QIOChannel *ioc, NBDSimpleReply *reply, | |
1123 | Error **errp) | |
1124 | { | |
1125 | int ret; | |
1126 | ||
1127 | assert(reply->magic == NBD_SIMPLE_REPLY_MAGIC); | |
1128 | ||
1129 | ret = nbd_read(ioc, (uint8_t *)reply + sizeof(reply->magic), | |
1130 | sizeof(*reply) - sizeof(reply->magic), errp); | |
1131 | if (ret < 0) { | |
1132 | return ret; | |
1133 | } | |
1134 | ||
80c7c2b0 PM |
1135 | reply->error = be32_to_cpu(reply->error); |
1136 | reply->handle = be64_to_cpu(reply->handle); | |
d2febedb VSO |
1137 | |
1138 | return 0; | |
1139 | } | |
1140 | ||
1141 | /* nbd_receive_structured_reply_chunk | |
1142 | * Read structured reply chunk except magic field (which should be already | |
1143 | * read). | |
1144 | * Payload is not read. | |
1145 | */ | |
1146 | static int nbd_receive_structured_reply_chunk(QIOChannel *ioc, | |
1147 | NBDStructuredReplyChunk *chunk, | |
1148 | Error **errp) | |
1149 | { | |
1150 | int ret; | |
1151 | ||
1152 | assert(chunk->magic == NBD_STRUCTURED_REPLY_MAGIC); | |
1153 | ||
1154 | ret = nbd_read(ioc, (uint8_t *)chunk + sizeof(chunk->magic), | |
1155 | sizeof(*chunk) - sizeof(chunk->magic), errp); | |
1156 | if (ret < 0) { | |
1157 | return ret; | |
1158 | } | |
1159 | ||
80c7c2b0 PM |
1160 | chunk->flags = be16_to_cpu(chunk->flags); |
1161 | chunk->type = be16_to_cpu(chunk->type); | |
1162 | chunk->handle = be64_to_cpu(chunk->handle); | |
1163 | chunk->length = be32_to_cpu(chunk->length); | |
d2febedb VSO |
1164 | |
1165 | return 0; | |
1166 | } | |
1167 | ||
ba845644 VSO |
1168 | /* nbd_receive_reply |
1169 | * Returns 1 on success | |
1170 | * 0 on eof, when no data was read (errp is not set) | |
1171 | * negative errno on failure (errp is set) | |
1172 | */ | |
1173 | int nbd_receive_reply(QIOChannel *ioc, NBDReply *reply, Error **errp) | |
798bfe00 | 1174 | { |
ba845644 | 1175 | int ret; |
079d3266 | 1176 | const char *type; |
798bfe00 | 1177 | |
d2febedb | 1178 | ret = nbd_read_eof(ioc, &reply->magic, sizeof(reply->magic), errp); |
ff82911c | 1179 | if (ret <= 0) { |
798bfe00 FZ |
1180 | return ret; |
1181 | } | |
1182 | ||
80c7c2b0 | 1183 | reply->magic = be32_to_cpu(reply->magic); |
798bfe00 | 1184 | |
d2febedb VSO |
1185 | switch (reply->magic) { |
1186 | case NBD_SIMPLE_REPLY_MAGIC: | |
1187 | ret = nbd_receive_simple_reply(ioc, &reply->simple, errp); | |
1188 | if (ret < 0) { | |
1189 | break; | |
1190 | } | |
d2febedb VSO |
1191 | trace_nbd_receive_simple_reply(reply->simple.error, |
1192 | nbd_err_lookup(reply->simple.error), | |
1193 | reply->handle); | |
d2febedb VSO |
1194 | break; |
1195 | case NBD_STRUCTURED_REPLY_MAGIC: | |
1196 | ret = nbd_receive_structured_reply_chunk(ioc, &reply->structured, errp); | |
1197 | if (ret < 0) { | |
1198 | break; | |
1199 | } | |
079d3266 | 1200 | type = nbd_reply_type_lookup(reply->structured.type); |
d2febedb | 1201 | trace_nbd_receive_structured_reply_chunk(reply->structured.flags, |
079d3266 | 1202 | reply->structured.type, type, |
d2febedb VSO |
1203 | reply->structured.handle, |
1204 | reply->structured.length); | |
1205 | break; | |
1206 | default: | |
1207 | error_setg(errp, "invalid magic (got 0x%" PRIx32 ")", reply->magic); | |
b6f5d3b5 EB |
1208 | return -EINVAL; |
1209 | } | |
d2febedb VSO |
1210 | if (ret < 0) { |
1211 | return ret; | |
798bfe00 | 1212 | } |
ba845644 VSO |
1213 | |
1214 | return 1; | |
798bfe00 FZ |
1215 | } |
1216 |