xref: /qemu/block/blkdebug.c (revision efe25c260cd69dcfc948e1622bedbdec953569a8)
1  /*
2   * Block protocol for I/O error injection
3   *
4   * Copyright (C) 2016-2017 Red Hat, Inc.
5   * Copyright (c) 2010 Kevin Wolf <kwolf@redhat.com>
6   *
7   * Permission is hereby granted, free of charge, to any person obtaining a copy
8   * of this software and associated documentation files (the "Software"), to deal
9   * in the Software without restriction, including without limitation the rights
10   * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
11   * copies of the Software, and to permit persons to whom the Software is
12   * furnished to do so, subject to the following conditions:
13   *
14   * The above copyright notice and this permission notice shall be included in
15   * all copies or substantial portions of the Software.
16   *
17   * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18   * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19   * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20   * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21   * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22   * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
23   * THE SOFTWARE.
24   */
25  
26  #include "qemu/osdep.h"
27  #include "qapi/error.h"
28  #include "qemu/cutils.h"
29  #include "qemu/config-file.h"
30  #include "block/block-io.h"
31  #include "block/block_int.h"
32  #include "block/qdict.h"
33  #include "qemu/module.h"
34  #include "qemu/option.h"
35  #include "qapi/qapi-visit-block-core.h"
36  #include "qobject/qdict.h"
37  #include "qobject/qlist.h"
38  #include "qobject/qstring.h"
39  #include "qapi/qobject-input-visitor.h"
40  #include "system/qtest.h"
41  
42  /* All APIs are thread-safe */
43  
44  typedef struct BDRVBlkdebugState {
45      /* IN: initialized in blkdebug_open() and never changed */
46      uint64_t align;
47      uint64_t max_transfer;
48      uint64_t opt_write_zero;
49      uint64_t max_write_zero;
50      uint64_t opt_discard;
51      uint64_t max_discard;
52      char *config_file; /* For blkdebug_refresh_filename() */
53      /* initialized in blkdebug_parse_perms() */
54      uint64_t take_child_perms;
55      uint64_t unshare_child_perms;
56  
57      /* State. Protected by lock */
58      int state;
59      QLIST_HEAD(, BlkdebugRule) rules[BLKDBG__MAX];
60      QSIMPLEQ_HEAD(, BlkdebugRule) active_rules;
61      QLIST_HEAD(, BlkdebugSuspendedReq) suspended_reqs;
62      QemuMutex lock;
63  } BDRVBlkdebugState;
64  
65  typedef struct BlkdebugAIOCB {
66      BlockAIOCB common;
67      int ret;
68  } BlkdebugAIOCB;
69  
70  typedef struct BlkdebugSuspendedReq {
71      /* IN: initialized in suspend_request() */
72      Coroutine *co;
73      char *tag;
74  
75      /* List entry protected BDRVBlkdebugState's lock */
76      QLIST_ENTRY(BlkdebugSuspendedReq) next;
77  } BlkdebugSuspendedReq;
78  
79  enum {
80      ACTION_INJECT_ERROR,
81      ACTION_SET_STATE,
82      ACTION_SUSPEND,
83      ACTION__MAX,
84  };
85  
86  typedef struct BlkdebugRule {
87      /* IN: initialized in add_rule() or blkdebug_debug_breakpoint() */
88      BlkdebugEvent event;
89      int action;
90      int state;
91      union {
92          struct {
93              uint64_t iotype_mask;
94              int error;
95              int immediately;
96              int once;
97              int64_t offset;
98          } inject;
99          struct {
100              int new_state;
101          } set_state;
102          struct {
103              char *tag;
104          } suspend;
105      } options;
106  
107      /* List entries protected BDRVBlkdebugState's lock */
108      QLIST_ENTRY(BlkdebugRule) next;
109      QSIMPLEQ_ENTRY(BlkdebugRule) active_next;
110  } BlkdebugRule;
111  
112  QEMU_BUILD_BUG_MSG(BLKDEBUG_IO_TYPE__MAX > 64,
113                     "BlkdebugIOType mask does not fit into an uint64_t");
114  
115  static QemuOptsList inject_error_opts = {
116      .name = "inject-error",
117      .head = QTAILQ_HEAD_INITIALIZER(inject_error_opts.head),
118      .desc = {
119          {
120              .name = "event",
121              .type = QEMU_OPT_STRING,
122          },
123          {
124              .name = "state",
125              .type = QEMU_OPT_NUMBER,
126          },
127          {
128              .name = "iotype",
129              .type = QEMU_OPT_STRING,
130          },
131          {
132              .name = "errno",
133              .type = QEMU_OPT_NUMBER,
134          },
135          {
136              .name = "sector",
137              .type = QEMU_OPT_NUMBER,
138          },
139          {
140              .name = "once",
141              .type = QEMU_OPT_BOOL,
142          },
143          {
144              .name = "immediately",
145              .type = QEMU_OPT_BOOL,
146          },
147          { /* end of list */ }
148      },
149  };
150  
151  static QemuOptsList set_state_opts = {
152      .name = "set-state",
153      .head = QTAILQ_HEAD_INITIALIZER(set_state_opts.head),
154      .desc = {
155          {
156              .name = "event",
157              .type = QEMU_OPT_STRING,
158          },
159          {
160              .name = "state",
161              .type = QEMU_OPT_NUMBER,
162          },
163          {
164              .name = "new_state",
165              .type = QEMU_OPT_NUMBER,
166          },
167          { /* end of list */ }
168      },
169  };
170  
171  static QemuOptsList *config_groups[] = {
172      &inject_error_opts,
173      &set_state_opts,
174      NULL
175  };
176  
177  struct add_rule_data {
178      BDRVBlkdebugState *s;
179      int action;
180  };
181  
182  static int add_rule(void *opaque, QemuOpts *opts, Error **errp)
183  {
184      struct add_rule_data *d = opaque;
185      BDRVBlkdebugState *s = d->s;
186      const char *event_name;
187      int event;
188      struct BlkdebugRule *rule;
189      int64_t sector;
190      BlkdebugIOType iotype;
191      Error *local_error = NULL;
192  
193      /* Find the right event for the rule */
194      event_name = qemu_opt_get(opts, "event");
195      if (!event_name) {
196          error_setg(errp, "Missing event name for rule");
197          return -1;
198      }
199      event = qapi_enum_parse(&BlkdebugEvent_lookup, event_name, -1, errp);
200      if (event < 0) {
201          return -1;
202      }
203  
204      /* Set attributes common for all actions */
205      rule = g_malloc0(sizeof(*rule));
206      *rule = (struct BlkdebugRule) {
207          .event  = event,
208          .action = d->action,
209          .state  = qemu_opt_get_number(opts, "state", 0),
210      };
211  
212      /* Parse action-specific options */
213      switch (d->action) {
214      case ACTION_INJECT_ERROR:
215          rule->options.inject.error = qemu_opt_get_number(opts, "errno", EIO);
216          rule->options.inject.once  = qemu_opt_get_bool(opts, "once", 0);
217          rule->options.inject.immediately =
218              qemu_opt_get_bool(opts, "immediately", 0);
219          sector = qemu_opt_get_number(opts, "sector", -1);
220          rule->options.inject.offset =
221              sector == -1 ? -1 : sector * BDRV_SECTOR_SIZE;
222  
223          iotype = qapi_enum_parse(&BlkdebugIOType_lookup,
224                                   qemu_opt_get(opts, "iotype"),
225                                   BLKDEBUG_IO_TYPE__MAX, &local_error);
226          if (local_error) {
227              error_propagate(errp, local_error);
228              g_free(rule);
229              return -1;
230          }
231          if (iotype != BLKDEBUG_IO_TYPE__MAX) {
232              rule->options.inject.iotype_mask = (1ull << iotype);
233          } else {
234              /* Apply the default */
235              rule->options.inject.iotype_mask =
236                  (1ull << BLKDEBUG_IO_TYPE_READ)
237                  | (1ull << BLKDEBUG_IO_TYPE_WRITE)
238                  | (1ull << BLKDEBUG_IO_TYPE_WRITE_ZEROES)
239                  | (1ull << BLKDEBUG_IO_TYPE_DISCARD)
240                  | (1ull << BLKDEBUG_IO_TYPE_FLUSH);
241          }
242  
243          break;
244  
245      case ACTION_SET_STATE:
246          rule->options.set_state.new_state =
247              qemu_opt_get_number(opts, "new_state", 0);
248          break;
249  
250      case ACTION_SUSPEND:
251          rule->options.suspend.tag =
252              g_strdup(qemu_opt_get(opts, "tag"));
253          break;
254      };
255  
256      /* Add the rule */
257      qemu_mutex_lock(&s->lock);
258      QLIST_INSERT_HEAD(&s->rules[event], rule, next);
259      qemu_mutex_unlock(&s->lock);
260  
261      return 0;
262  }
263  
264  /* Called with lock held or from .bdrv_close */
265  static void remove_rule(BlkdebugRule *rule)
266  {
267      switch (rule->action) {
268      case ACTION_INJECT_ERROR:
269      case ACTION_SET_STATE:
270          break;
271      case ACTION_SUSPEND:
272          g_free(rule->options.suspend.tag);
273          break;
274      }
275  
276      QLIST_REMOVE(rule, next);
277      g_free(rule);
278  }
279  
280  static int read_config(BDRVBlkdebugState *s, const char *filename,
281                         QDict *options, Error **errp)
282  {
283      FILE *f = NULL;
284      int ret;
285      struct add_rule_data d;
286      Error *local_err = NULL;
287  
288      if (filename) {
289          f = fopen(filename, "r");
290          if (f == NULL) {
291              error_setg_errno(errp, errno, "Could not read blkdebug config file");
292              return -errno;
293          }
294  
295          ret = qemu_config_parse(f, config_groups, filename, errp);
296          if (ret < 0) {
297              goto fail;
298          }
299      }
300  
301      if (!qemu_config_parse_qdict(options, config_groups, errp)) {
302          ret = -EINVAL;
303          goto fail;
304      }
305  
306      d.s = s;
307      d.action = ACTION_INJECT_ERROR;
308      qemu_opts_foreach(&inject_error_opts, add_rule, &d, &local_err);
309      if (local_err) {
310          error_propagate(errp, local_err);
311          ret = -EINVAL;
312          goto fail;
313      }
314  
315      d.action = ACTION_SET_STATE;
316      qemu_opts_foreach(&set_state_opts, add_rule, &d, &local_err);
317      if (local_err) {
318          error_propagate(errp, local_err);
319          ret = -EINVAL;
320          goto fail;
321      }
322  
323      ret = 0;
324  fail:
325      qemu_opts_reset(&inject_error_opts);
326      qemu_opts_reset(&set_state_opts);
327      if (f) {
328          fclose(f);
329      }
330      return ret;
331  }
332  
333  /* Valid blkdebug filenames look like blkdebug:path/to/config:path/to/image */
334  static void blkdebug_parse_filename(const char *filename, QDict *options,
335                                      Error **errp)
336  {
337      const char *c;
338  
339      /* Parse the blkdebug: prefix */
340      if (!strstart(filename, "blkdebug:", &filename)) {
341          /* There was no prefix; therefore, all options have to be already
342             present in the QDict (except for the filename) */
343          qdict_put_str(options, "x-image", filename);
344          return;
345      }
346  
347      /* Parse config file path */
348      c = strchr(filename, ':');
349      if (c == NULL) {
350          error_setg(errp, "blkdebug requires both config file and image path");
351          return;
352      }
353  
354      if (c != filename) {
355          QString *config_path;
356          config_path = qstring_from_substr(filename, 0, c - filename);
357          qdict_put(options, "config", config_path);
358      }
359  
360      /* TODO Allow multi-level nesting and set file.filename here */
361      filename = c + 1;
362      qdict_put_str(options, "x-image", filename);
363  }
364  
365  static int blkdebug_parse_perm_list(uint64_t *dest, QDict *options,
366                                      const char *prefix, Error **errp)
367  {
368      int ret = 0;
369      QDict *subqdict = NULL;
370      QObject *crumpled_subqdict = NULL;
371      Visitor *v = NULL;
372      BlockPermissionList *perm_list = NULL, *element;
373  
374      *dest = 0;
375  
376      qdict_extract_subqdict(options, &subqdict, prefix);
377      if (!qdict_size(subqdict)) {
378          goto out;
379      }
380  
381      crumpled_subqdict = qdict_crumple(subqdict, errp);
382      if (!crumpled_subqdict) {
383          ret = -EINVAL;
384          goto out;
385      }
386  
387      v = qobject_input_visitor_new(crumpled_subqdict);
388      if (!visit_type_BlockPermissionList(v, NULL, &perm_list, errp)) {
389          ret = -EINVAL;
390          goto out;
391      }
392  
393      for (element = perm_list; element; element = element->next) {
394          *dest |= bdrv_qapi_perm_to_blk_perm(element->value);
395      }
396  
397  out:
398      qapi_free_BlockPermissionList(perm_list);
399      visit_free(v);
400      qobject_unref(subqdict);
401      qobject_unref(crumpled_subqdict);
402      return ret;
403  }
404  
405  static int blkdebug_parse_perms(BDRVBlkdebugState *s, QDict *options,
406                                  Error **errp)
407  {
408      int ret;
409  
410      ret = blkdebug_parse_perm_list(&s->take_child_perms, options,
411                                     "take-child-perms.", errp);
412      if (ret < 0) {
413          return ret;
414      }
415  
416      ret = blkdebug_parse_perm_list(&s->unshare_child_perms, options,
417                                     "unshare-child-perms.", errp);
418      if (ret < 0) {
419          return ret;
420      }
421  
422      return 0;
423  }
424  
425  static QemuOptsList runtime_opts = {
426      .name = "blkdebug",
427      .head = QTAILQ_HEAD_INITIALIZER(runtime_opts.head),
428      .desc = {
429          {
430              .name = "config",
431              .type = QEMU_OPT_STRING,
432              .help = "Path to the configuration file",
433          },
434          {
435              .name = "x-image",
436              .type = QEMU_OPT_STRING,
437              .help = "[internal use only, will be removed]",
438          },
439          {
440              .name = "align",
441              .type = QEMU_OPT_SIZE,
442              .help = "Required alignment in bytes",
443          },
444          {
445              .name = "max-transfer",
446              .type = QEMU_OPT_SIZE,
447              .help = "Maximum transfer size in bytes",
448          },
449          {
450              .name = "opt-write-zero",
451              .type = QEMU_OPT_SIZE,
452              .help = "Optimum write zero alignment in bytes",
453          },
454          {
455              .name = "max-write-zero",
456              .type = QEMU_OPT_SIZE,
457              .help = "Maximum write zero size in bytes",
458          },
459          {
460              .name = "opt-discard",
461              .type = QEMU_OPT_SIZE,
462              .help = "Optimum discard alignment in bytes",
463          },
464          {
465              .name = "max-discard",
466              .type = QEMU_OPT_SIZE,
467              .help = "Maximum discard size in bytes",
468          },
469          { /* end of list */ }
470      },
471  };
472  
473  static int blkdebug_open(BlockDriverState *bs, QDict *options, int flags,
474                           Error **errp)
475  {
476      BDRVBlkdebugState *s = bs->opaque;
477      QemuOpts *opts;
478      int ret;
479      uint64_t align;
480  
481      qemu_mutex_init(&s->lock);
482      opts = qemu_opts_create(&runtime_opts, NULL, 0, &error_abort);
483      if (!qemu_opts_absorb_qdict(opts, options, errp)) {
484          ret = -EINVAL;
485          goto out;
486      }
487  
488      /* Read rules from config file or command line options */
489      s->config_file = g_strdup(qemu_opt_get(opts, "config"));
490      ret = read_config(s, s->config_file, options, errp);
491      if (ret) {
492          goto out;
493      }
494  
495      /* Set initial state */
496      s->state = 1;
497  
498      /* Parse permissions modifiers before opening the image file */
499      ret = blkdebug_parse_perms(s, options, errp);
500      if (ret < 0) {
501          goto out;
502      }
503  
504      /* Open the image file */
505      ret = bdrv_open_file_child(qemu_opt_get(opts, "x-image"), options, "image",
506                                 bs, errp);
507      if (ret < 0) {
508          goto out;
509      }
510  
511      bdrv_graph_rdlock_main_loop();
512  
513      bs->supported_write_flags = BDRV_REQ_WRITE_UNCHANGED |
514          (BDRV_REQ_FUA & bs->file->bs->supported_write_flags);
515      bs->supported_zero_flags = BDRV_REQ_WRITE_UNCHANGED |
516          ((BDRV_REQ_FUA | BDRV_REQ_MAY_UNMAP | BDRV_REQ_NO_FALLBACK) &
517              bs->file->bs->supported_zero_flags);
518      ret = -EINVAL;
519  
520      /* Set alignment overrides */
521      s->align = qemu_opt_get_size(opts, "align", 0);
522      if (s->align && (s->align >= INT_MAX || !is_power_of_2(s->align))) {
523          error_setg(errp, "Cannot meet constraints with align %" PRIu64,
524                     s->align);
525          goto out_rdlock;
526      }
527      align = MAX(s->align, bs->file->bs->bl.request_alignment);
528  
529      s->max_transfer = qemu_opt_get_size(opts, "max-transfer", 0);
530      if (s->max_transfer &&
531          (s->max_transfer >= INT_MAX ||
532           !QEMU_IS_ALIGNED(s->max_transfer, align))) {
533          error_setg(errp, "Cannot meet constraints with max-transfer %" PRIu64,
534                     s->max_transfer);
535          goto out_rdlock;
536      }
537  
538      s->opt_write_zero = qemu_opt_get_size(opts, "opt-write-zero", 0);
539      if (s->opt_write_zero &&
540          (s->opt_write_zero >= INT_MAX ||
541           !QEMU_IS_ALIGNED(s->opt_write_zero, align))) {
542          error_setg(errp, "Cannot meet constraints with opt-write-zero %" PRIu64,
543                     s->opt_write_zero);
544          goto out_rdlock;
545      }
546  
547      s->max_write_zero = qemu_opt_get_size(opts, "max-write-zero", 0);
548      if (s->max_write_zero &&
549          (s->max_write_zero >= INT_MAX ||
550           !QEMU_IS_ALIGNED(s->max_write_zero,
551                            MAX(s->opt_write_zero, align)))) {
552          error_setg(errp, "Cannot meet constraints with max-write-zero %" PRIu64,
553                     s->max_write_zero);
554          goto out_rdlock;
555      }
556  
557      s->opt_discard = qemu_opt_get_size(opts, "opt-discard", 0);
558      if (s->opt_discard &&
559          (s->opt_discard >= INT_MAX ||
560           !QEMU_IS_ALIGNED(s->opt_discard, align))) {
561          error_setg(errp, "Cannot meet constraints with opt-discard %" PRIu64,
562                     s->opt_discard);
563          goto out_rdlock;
564      }
565  
566      s->max_discard = qemu_opt_get_size(opts, "max-discard", 0);
567      if (s->max_discard &&
568          (s->max_discard >= INT_MAX ||
569           !QEMU_IS_ALIGNED(s->max_discard,
570                            MAX(s->opt_discard, align)))) {
571          error_setg(errp, "Cannot meet constraints with max-discard %" PRIu64,
572                     s->max_discard);
573          goto out_rdlock;
574      }
575  
576      bdrv_debug_event(bs, BLKDBG_NONE);
577  
578      ret = 0;
579  out_rdlock:
580      bdrv_graph_rdunlock_main_loop();
581  out:
582      if (ret < 0) {
583          qemu_mutex_destroy(&s->lock);
584          g_free(s->config_file);
585      }
586      qemu_opts_del(opts);
587      return ret;
588  }
589  
590  static int coroutine_fn rule_check(BlockDriverState *bs, uint64_t offset,
591                                     uint64_t bytes, BlkdebugIOType iotype)
592  {
593      BDRVBlkdebugState *s = bs->opaque;
594      BlkdebugRule *rule = NULL;
595      int error;
596      bool immediately;
597  
598      qemu_mutex_lock(&s->lock);
599      QSIMPLEQ_FOREACH(rule, &s->active_rules, active_next) {
600          uint64_t inject_offset = rule->options.inject.offset;
601  
602          if ((inject_offset == -1 ||
603               (bytes && inject_offset >= offset &&
604                inject_offset < offset + bytes)) &&
605              (rule->options.inject.iotype_mask & (1ull << iotype)))
606          {
607              break;
608          }
609      }
610  
611      if (!rule || !rule->options.inject.error) {
612          qemu_mutex_unlock(&s->lock);
613          return 0;
614      }
615  
616      immediately = rule->options.inject.immediately;
617      error = rule->options.inject.error;
618  
619      if (rule->options.inject.once) {
620          QSIMPLEQ_REMOVE(&s->active_rules, rule, BlkdebugRule, active_next);
621          remove_rule(rule);
622      }
623  
624      qemu_mutex_unlock(&s->lock);
625      if (!immediately) {
626          aio_co_schedule(qemu_get_current_aio_context(), qemu_coroutine_self());
627          qemu_coroutine_yield();
628      }
629  
630      return -error;
631  }
632  
633  static int coroutine_fn GRAPH_RDLOCK
634  blkdebug_co_preadv(BlockDriverState *bs, int64_t offset, int64_t bytes,
635                     QEMUIOVector *qiov, BdrvRequestFlags flags)
636  {
637      int err;
638  
639      /* Sanity check block layer guarantees */
640      assert(QEMU_IS_ALIGNED(offset, bs->bl.request_alignment));
641      assert(QEMU_IS_ALIGNED(bytes, bs->bl.request_alignment));
642      if (bs->bl.max_transfer) {
643          assert(bytes <= bs->bl.max_transfer);
644      }
645  
646      err = rule_check(bs, offset, bytes, BLKDEBUG_IO_TYPE_READ);
647      if (err) {
648          return err;
649      }
650  
651      return bdrv_co_preadv(bs->file, offset, bytes, qiov, flags);
652  }
653  
654  static int coroutine_fn GRAPH_RDLOCK
655  blkdebug_co_pwritev(BlockDriverState *bs, int64_t offset, int64_t bytes,
656                      QEMUIOVector *qiov, BdrvRequestFlags flags)
657  {
658      int err;
659  
660      /* Sanity check block layer guarantees */
661      assert(QEMU_IS_ALIGNED(offset, bs->bl.request_alignment));
662      assert(QEMU_IS_ALIGNED(bytes, bs->bl.request_alignment));
663      if (bs->bl.max_transfer) {
664          assert(bytes <= bs->bl.max_transfer);
665      }
666  
667      err = rule_check(bs, offset, bytes, BLKDEBUG_IO_TYPE_WRITE);
668      if (err) {
669          return err;
670      }
671  
672      return bdrv_co_pwritev(bs->file, offset, bytes, qiov, flags);
673  }
674  
675  static int GRAPH_RDLOCK coroutine_fn blkdebug_co_flush(BlockDriverState *bs)
676  {
677      int err = rule_check(bs, 0, 0, BLKDEBUG_IO_TYPE_FLUSH);
678  
679      if (err) {
680          return err;
681      }
682  
683      return bdrv_co_flush(bs->file->bs);
684  }
685  
686  static int coroutine_fn GRAPH_RDLOCK
687  blkdebug_co_pwrite_zeroes(BlockDriverState *bs, int64_t offset, int64_t bytes,
688                            BdrvRequestFlags flags)
689  {
690      uint32_t align = MAX(bs->bl.request_alignment,
691                           bs->bl.pwrite_zeroes_alignment);
692      int err;
693  
694      /* Only pass through requests that are larger than requested
695       * preferred alignment (so that we test the fallback to writes on
696       * unaligned portions), and check that the block layer never hands
697       * us anything unaligned that crosses an alignment boundary.  */
698      if (bytes < align) {
699          assert(QEMU_IS_ALIGNED(offset, align) ||
700                 QEMU_IS_ALIGNED(offset + bytes, align) ||
701                 DIV_ROUND_UP(offset, align) ==
702                 DIV_ROUND_UP(offset + bytes, align));
703          return -ENOTSUP;
704      }
705      assert(QEMU_IS_ALIGNED(offset, align));
706      assert(QEMU_IS_ALIGNED(bytes, align));
707      if (bs->bl.max_pwrite_zeroes) {
708          assert(bytes <= bs->bl.max_pwrite_zeroes);
709      }
710  
711      err = rule_check(bs, offset, bytes, BLKDEBUG_IO_TYPE_WRITE_ZEROES);
712      if (err) {
713          return err;
714      }
715  
716      return bdrv_co_pwrite_zeroes(bs->file, offset, bytes, flags);
717  }
718  
719  static int coroutine_fn GRAPH_RDLOCK
720  blkdebug_co_pdiscard(BlockDriverState *bs, int64_t offset, int64_t bytes)
721  {
722      uint32_t align = bs->bl.pdiscard_alignment;
723      int err;
724  
725      /* Only pass through requests that are larger than requested
726       * minimum alignment, and ensure that unaligned requests do not
727       * cross optimum discard boundaries. */
728      if (bytes < bs->bl.request_alignment) {
729          assert(QEMU_IS_ALIGNED(offset, align) ||
730                 QEMU_IS_ALIGNED(offset + bytes, align) ||
731                 DIV_ROUND_UP(offset, align) ==
732                 DIV_ROUND_UP(offset + bytes, align));
733          return -ENOTSUP;
734      }
735      assert(QEMU_IS_ALIGNED(offset, bs->bl.request_alignment));
736      assert(QEMU_IS_ALIGNED(bytes, bs->bl.request_alignment));
737      if (align && bytes >= align) {
738          assert(QEMU_IS_ALIGNED(offset, align));
739          assert(QEMU_IS_ALIGNED(bytes, align));
740      }
741      if (bs->bl.max_pdiscard) {
742          assert(bytes <= bs->bl.max_pdiscard);
743      }
744  
745      err = rule_check(bs, offset, bytes, BLKDEBUG_IO_TYPE_DISCARD);
746      if (err) {
747          return err;
748      }
749  
750      return bdrv_co_pdiscard(bs->file, offset, bytes);
751  }
752  
753  static int coroutine_fn GRAPH_RDLOCK
754  blkdebug_co_block_status(BlockDriverState *bs, bool want_zero, int64_t offset,
755                           int64_t bytes, int64_t *pnum, int64_t *map,
756                           BlockDriverState **file)
757  {
758      int err;
759  
760      assert(QEMU_IS_ALIGNED(offset | bytes, bs->bl.request_alignment));
761  
762      err = rule_check(bs, offset, bytes, BLKDEBUG_IO_TYPE_BLOCK_STATUS);
763      if (err) {
764          return err;
765      }
766  
767      assert(bs->file && bs->file->bs);
768      *pnum = bytes;
769      *map = offset;
770      *file = bs->file->bs;
771      return BDRV_BLOCK_RAW | BDRV_BLOCK_OFFSET_VALID;
772  }
773  
774  static void blkdebug_close(BlockDriverState *bs)
775  {
776      BDRVBlkdebugState *s = bs->opaque;
777      BlkdebugRule *rule, *next;
778      int i;
779  
780      for (i = 0; i < BLKDBG__MAX; i++) {
781          QLIST_FOREACH_SAFE(rule, &s->rules[i], next, next) {
782              remove_rule(rule);
783          }
784      }
785  
786      g_free(s->config_file);
787      qemu_mutex_destroy(&s->lock);
788  }
789  
790  /* Called with lock held.  */
791  static void suspend_request(BlockDriverState *bs, BlkdebugRule *rule)
792  {
793      BDRVBlkdebugState *s = bs->opaque;
794      BlkdebugSuspendedReq *r;
795  
796      r = g_new(BlkdebugSuspendedReq, 1);
797  
798      r->co         = qemu_coroutine_self();
799      r->tag        = g_strdup(rule->options.suspend.tag);
800  
801      remove_rule(rule);
802      QLIST_INSERT_HEAD(&s->suspended_reqs, r, next);
803  
804      if (!qtest_enabled()) {
805          printf("blkdebug: Suspended request '%s'\n", r->tag);
806      }
807  }
808  
809  /* Called with lock held.  */
810  static void process_rule(BlockDriverState *bs, struct BlkdebugRule *rule,
811                           int *action_count, int *new_state)
812  {
813      BDRVBlkdebugState *s = bs->opaque;
814  
815      /* Only process rules for the current state */
816      if (rule->state && rule->state != s->state) {
817          return;
818      }
819  
820      /* Take the action */
821      action_count[rule->action]++;
822      switch (rule->action) {
823      case ACTION_INJECT_ERROR:
824          if (action_count[ACTION_INJECT_ERROR] == 1) {
825              QSIMPLEQ_INIT(&s->active_rules);
826          }
827          QSIMPLEQ_INSERT_HEAD(&s->active_rules, rule, active_next);
828          break;
829  
830      case ACTION_SET_STATE:
831          *new_state = rule->options.set_state.new_state;
832          break;
833  
834      case ACTION_SUSPEND:
835          suspend_request(bs, rule);
836          break;
837      }
838  }
839  
840  static void coroutine_fn
841  blkdebug_co_debug_event(BlockDriverState *bs, BlkdebugEvent event)
842  {
843      BDRVBlkdebugState *s = bs->opaque;
844      struct BlkdebugRule *rule, *next;
845      int new_state;
846      int actions_count[ACTION__MAX] = { 0 };
847  
848      assert((int)event >= 0 && event < BLKDBG__MAX);
849  
850      WITH_QEMU_LOCK_GUARD(&s->lock) {
851          new_state = s->state;
852          QLIST_FOREACH_SAFE(rule, &s->rules[event], next, next) {
853              process_rule(bs, rule, actions_count, &new_state);
854          }
855          s->state = new_state;
856      }
857  
858      while (actions_count[ACTION_SUSPEND] > 0) {
859          qemu_coroutine_yield();
860          actions_count[ACTION_SUSPEND]--;
861      }
862  }
863  
864  static int blkdebug_debug_breakpoint(BlockDriverState *bs, const char *event,
865                                       const char *tag)
866  {
867      BDRVBlkdebugState *s = bs->opaque;
868      struct BlkdebugRule *rule;
869      int blkdebug_event;
870  
871      blkdebug_event = qapi_enum_parse(&BlkdebugEvent_lookup, event, -1, NULL);
872      if (blkdebug_event < 0) {
873          return -ENOENT;
874      }
875  
876      rule = g_malloc(sizeof(*rule));
877      *rule = (struct BlkdebugRule) {
878          .event  = blkdebug_event,
879          .action = ACTION_SUSPEND,
880          .state  = 0,
881          .options.suspend.tag = g_strdup(tag),
882      };
883  
884      qemu_mutex_lock(&s->lock);
885      QLIST_INSERT_HEAD(&s->rules[blkdebug_event], rule, next);
886      qemu_mutex_unlock(&s->lock);
887  
888      return 0;
889  }
890  
891  /* Called with lock held. May temporarily release lock. */
892  static int resume_req_by_tag(BDRVBlkdebugState *s, const char *tag, bool all)
893  {
894      BlkdebugSuspendedReq *r;
895  
896  retry:
897      /*
898       * No need for _SAFE, since a different coroutine can remove another node
899       * (not the current one) in this list, and when the current one is removed
900       * the iteration starts back from beginning anyways.
901       */
902      QLIST_FOREACH(r, &s->suspended_reqs, next) {
903          if (!strcmp(r->tag, tag)) {
904              Coroutine *co = r->co;
905  
906              if (!qtest_enabled()) {
907                  printf("blkdebug: Resuming request '%s'\n", r->tag);
908              }
909  
910              QLIST_REMOVE(r, next);
911              g_free(r->tag);
912              g_free(r);
913  
914              qemu_mutex_unlock(&s->lock);
915              qemu_coroutine_enter(co);
916              qemu_mutex_lock(&s->lock);
917  
918              if (all) {
919                  goto retry;
920              }
921              return 0;
922          }
923      }
924      return -ENOENT;
925  }
926  
927  static int blkdebug_debug_resume(BlockDriverState *bs, const char *tag)
928  {
929      BDRVBlkdebugState *s = bs->opaque;
930      QEMU_LOCK_GUARD(&s->lock);
931      return resume_req_by_tag(s, tag, false);
932  }
933  
934  static int blkdebug_debug_remove_breakpoint(BlockDriverState *bs,
935                                              const char *tag)
936  {
937      BDRVBlkdebugState *s = bs->opaque;
938      BlkdebugRule *rule, *next;
939      int i, ret = -ENOENT;
940  
941      QEMU_LOCK_GUARD(&s->lock);
942      for (i = 0; i < BLKDBG__MAX; i++) {
943          QLIST_FOREACH_SAFE(rule, &s->rules[i], next, next) {
944              if (rule->action == ACTION_SUSPEND &&
945                  !strcmp(rule->options.suspend.tag, tag)) {
946                  remove_rule(rule);
947                  ret = 0;
948              }
949          }
950      }
951      if (resume_req_by_tag(s, tag, true) == 0) {
952          ret = 0;
953      }
954      return ret;
955  }
956  
957  static bool blkdebug_debug_is_suspended(BlockDriverState *bs, const char *tag)
958  {
959      BDRVBlkdebugState *s = bs->opaque;
960      BlkdebugSuspendedReq *r;
961  
962      QEMU_LOCK_GUARD(&s->lock);
963      QLIST_FOREACH(r, &s->suspended_reqs, next) {
964          if (!strcmp(r->tag, tag)) {
965              return true;
966          }
967      }
968      return false;
969  }
970  
971  static int64_t coroutine_fn GRAPH_RDLOCK
972  blkdebug_co_getlength(BlockDriverState *bs)
973  {
974      return bdrv_co_getlength(bs->file->bs);
975  }
976  
977  static void GRAPH_RDLOCK blkdebug_refresh_filename(BlockDriverState *bs)
978  {
979      BDRVBlkdebugState *s = bs->opaque;
980      const QDictEntry *e;
981      int ret;
982  
983      if (!bs->file->bs->exact_filename[0]) {
984          return;
985      }
986  
987      for (e = qdict_first(bs->full_open_options); e;
988           e = qdict_next(bs->full_open_options, e))
989      {
990          /* Real child options are under "image", but "x-image" may
991           * contain a filename */
992          if (strcmp(qdict_entry_key(e), "config") &&
993              strcmp(qdict_entry_key(e), "image") &&
994              strcmp(qdict_entry_key(e), "x-image") &&
995              strcmp(qdict_entry_key(e), "driver"))
996          {
997              return;
998          }
999      }
1000  
1001      ret = snprintf(bs->exact_filename, sizeof(bs->exact_filename),
1002                     "blkdebug:%s:%s",
1003                     s->config_file ?: "", bs->file->bs->exact_filename);
1004      if (ret >= sizeof(bs->exact_filename)) {
1005          /* An overflow makes the filename unusable, so do not report any */
1006          bs->exact_filename[0] = 0;
1007      }
1008  }
1009  
1010  static void blkdebug_refresh_limits(BlockDriverState *bs, Error **errp)
1011  {
1012      BDRVBlkdebugState *s = bs->opaque;
1013  
1014      if (s->align) {
1015          bs->bl.request_alignment = s->align;
1016      }
1017      if (s->max_transfer) {
1018          bs->bl.max_transfer = s->max_transfer;
1019      }
1020      if (s->opt_write_zero) {
1021          bs->bl.pwrite_zeroes_alignment = s->opt_write_zero;
1022      }
1023      if (s->max_write_zero) {
1024          bs->bl.max_pwrite_zeroes = s->max_write_zero;
1025      }
1026      if (s->opt_discard) {
1027          bs->bl.pdiscard_alignment = s->opt_discard;
1028      }
1029      if (s->max_discard) {
1030          bs->bl.max_pdiscard = s->max_discard;
1031      }
1032  }
1033  
1034  static int blkdebug_reopen_prepare(BDRVReopenState *reopen_state,
1035                                     BlockReopenQueue *queue, Error **errp)
1036  {
1037      return 0;
1038  }
1039  
1040  static void blkdebug_child_perm(BlockDriverState *bs, BdrvChild *c,
1041                                  BdrvChildRole role,
1042                                  BlockReopenQueue *reopen_queue,
1043                                  uint64_t perm, uint64_t shared,
1044                                  uint64_t *nperm, uint64_t *nshared)
1045  {
1046      BDRVBlkdebugState *s = bs->opaque;
1047  
1048      bdrv_default_perms(bs, c, role, reopen_queue,
1049                         perm, shared, nperm, nshared);
1050  
1051      *nperm |= s->take_child_perms;
1052      *nshared &= ~s->unshare_child_perms;
1053  }
1054  
1055  static const char *const blkdebug_strong_runtime_opts[] = {
1056      "config",
1057      "inject-error.",
1058      "set-state.",
1059      "align",
1060      "max-transfer",
1061      "opt-write-zero",
1062      "max-write-zero",
1063      "opt-discard",
1064      "max-discard",
1065  
1066      NULL
1067  };
1068  
1069  static BlockDriver bdrv_blkdebug = {
1070      .format_name            = "blkdebug",
1071      .protocol_name          = "blkdebug",
1072      .instance_size          = sizeof(BDRVBlkdebugState),
1073      .is_filter              = true,
1074  
1075      .bdrv_parse_filename    = blkdebug_parse_filename,
1076      .bdrv_open              = blkdebug_open,
1077      .bdrv_close             = blkdebug_close,
1078      .bdrv_reopen_prepare    = blkdebug_reopen_prepare,
1079      .bdrv_child_perm        = blkdebug_child_perm,
1080  
1081      .bdrv_co_getlength      = blkdebug_co_getlength,
1082      .bdrv_refresh_filename  = blkdebug_refresh_filename,
1083      .bdrv_refresh_limits    = blkdebug_refresh_limits,
1084  
1085      .bdrv_co_preadv         = blkdebug_co_preadv,
1086      .bdrv_co_pwritev        = blkdebug_co_pwritev,
1087      .bdrv_co_flush_to_disk  = blkdebug_co_flush,
1088      .bdrv_co_pwrite_zeroes  = blkdebug_co_pwrite_zeroes,
1089      .bdrv_co_pdiscard       = blkdebug_co_pdiscard,
1090      .bdrv_co_block_status   = blkdebug_co_block_status,
1091  
1092      .bdrv_co_debug_event        = blkdebug_co_debug_event,
1093      .bdrv_debug_breakpoint      = blkdebug_debug_breakpoint,
1094      .bdrv_debug_remove_breakpoint
1095                                  = blkdebug_debug_remove_breakpoint,
1096      .bdrv_debug_resume          = blkdebug_debug_resume,
1097      .bdrv_debug_is_suspended    = blkdebug_debug_is_suspended,
1098  
1099      .strong_runtime_opts        = blkdebug_strong_runtime_opts,
1100  };
1101  
1102  static void bdrv_blkdebug_init(void)
1103  {
1104      bdrv_register(&bdrv_blkdebug);
1105  }
1106  
1107  block_init(bdrv_blkdebug_init);
1108