linux/block/blk-integrity.c
<<
>>
Prefs
   1/*
   2 * blk-integrity.c - Block layer data integrity extensions
   3 *
   4 * Copyright (C) 2007, 2008 Oracle Corporation
   5 * Written by: Martin K. Petersen <martin.petersen@oracle.com>
   6 *
   7 * This program is free software; you can redistribute it and/or
   8 * modify it under the terms of the GNU General Public License version
   9 * 2 as published by the Free Software Foundation.
  10 *
  11 * This program is distributed in the hope that it will be useful, but
  12 * WITHOUT ANY WARRANTY; without even the implied warranty of
  13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  14 * General Public License for more details.
  15 *
  16 * You should have received a copy of the GNU General Public License
  17 * along with this program; see the file COPYING.  If not, write to
  18 * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139,
  19 * USA.
  20 *
  21 */
  22
  23#include <linux/blkdev.h>
  24#include <linux/mempool.h>
  25#include <linux/bio.h>
  26#include <linux/scatterlist.h>
  27#include <linux/export.h>
  28#include <linux/slab.h>
  29
  30#include "blk.h"
  31
  32static struct kmem_cache *integrity_cachep;
  33
  34static const char *bi_unsupported_name = "unsupported";
  35
  36/**
  37 * blk_rq_count_integrity_sg - Count number of integrity scatterlist elements
  38 * @q:          request queue
  39 * @bio:        bio with integrity metadata attached
  40 *
  41 * Description: Returns the number of elements required in a
  42 * scatterlist corresponding to the integrity metadata in a bio.
  43 */
  44int blk_rq_count_integrity_sg(struct request_queue *q, struct bio *bio)
  45{
  46        struct bio_vec *iv, *ivprv = NULL;
  47        unsigned int segments = 0;
  48        unsigned int seg_size = 0;
  49        unsigned int i = 0;
  50
  51        bio_for_each_integrity_vec(iv, bio, i) {
  52
  53                if (ivprv) {
  54                        if (!BIOVEC_PHYS_MERGEABLE(ivprv, iv))
  55                                goto new_segment;
  56
  57                        if (!BIOVEC_SEG_BOUNDARY(q, ivprv, iv))
  58                                goto new_segment;
  59
  60                        if (seg_size + iv->bv_len > queue_max_segment_size(q))
  61                                goto new_segment;
  62
  63                        seg_size += iv->bv_len;
  64                } else {
  65new_segment:
  66                        segments++;
  67                        seg_size = iv->bv_len;
  68                }
  69
  70                ivprv = iv;
  71        }
  72
  73        return segments;
  74}
  75EXPORT_SYMBOL(blk_rq_count_integrity_sg);
  76
  77/**
  78 * blk_rq_map_integrity_sg - Map integrity metadata into a scatterlist
  79 * @q:          request queue
  80 * @bio:        bio with integrity metadata attached
  81 * @sglist:     target scatterlist
  82 *
  83 * Description: Map the integrity vectors in request into a
  84 * scatterlist.  The scatterlist must be big enough to hold all
  85 * elements.  I.e. sized using blk_rq_count_integrity_sg().
  86 */
  87int blk_rq_map_integrity_sg(struct request_queue *q, struct bio *bio,
  88                            struct scatterlist *sglist)
  89{
  90        struct bio_vec *iv, *ivprv = NULL;
  91        struct scatterlist *sg = NULL;
  92        unsigned int segments = 0;
  93        unsigned int i = 0;
  94
  95        bio_for_each_integrity_vec(iv, bio, i) {
  96
  97                if (ivprv) {
  98                        if (!BIOVEC_PHYS_MERGEABLE(ivprv, iv))
  99                                goto new_segment;
 100
 101                        if (!BIOVEC_SEG_BOUNDARY(q, ivprv, iv))
 102                                goto new_segment;
 103
 104                        if (sg->length + iv->bv_len > queue_max_segment_size(q))
 105                                goto new_segment;
 106
 107                        sg->length += iv->bv_len;
 108                } else {
 109new_segment:
 110                        if (!sg)
 111                                sg = sglist;
 112                        else {
 113                                sg_unmark_end(sg);
 114                                sg = sg_next(sg);
 115                        }
 116
 117                        sg_set_page(sg, iv->bv_page, iv->bv_len, iv->bv_offset);
 118                        segments++;
 119                }
 120
 121                ivprv = iv;
 122        }
 123
 124        if (sg)
 125                sg_mark_end(sg);
 126
 127        return segments;
 128}
 129EXPORT_SYMBOL(blk_rq_map_integrity_sg);
 130
 131/**
 132 * blk_integrity_compare - Compare integrity profile of two disks
 133 * @gd1:        Disk to compare
 134 * @gd2:        Disk to compare
 135 *
 136 * Description: Meta-devices like DM and MD need to verify that all
 137 * sub-devices use the same integrity format before advertising to
 138 * upper layers that they can send/receive integrity metadata.  This
 139 * function can be used to check whether two gendisk devices have
 140 * compatible integrity formats.
 141 */
 142int blk_integrity_compare(struct gendisk *gd1, struct gendisk *gd2)
 143{
 144        struct blk_integrity *b1 = gd1->integrity;
 145        struct blk_integrity *b2 = gd2->integrity;
 146
 147        if (!b1 && !b2)
 148                return 0;
 149
 150        if (!b1 || !b2)
 151                return -1;
 152
 153        if (b1->sector_size != b2->sector_size) {
 154                printk(KERN_ERR "%s: %s/%s sector sz %u != %u\n", __func__,
 155                       gd1->disk_name, gd2->disk_name,
 156                       b1->sector_size, b2->sector_size);
 157                return -1;
 158        }
 159
 160        if (b1->tuple_size != b2->tuple_size) {
 161                printk(KERN_ERR "%s: %s/%s tuple sz %u != %u\n", __func__,
 162                       gd1->disk_name, gd2->disk_name,
 163                       b1->tuple_size, b2->tuple_size);
 164                return -1;
 165        }
 166
 167        if (b1->tag_size && b2->tag_size && (b1->tag_size != b2->tag_size)) {
 168                printk(KERN_ERR "%s: %s/%s tag sz %u != %u\n", __func__,
 169                       gd1->disk_name, gd2->disk_name,
 170                       b1->tag_size, b2->tag_size);
 171                return -1;
 172        }
 173
 174        if (strcmp(b1->name, b2->name)) {
 175                printk(KERN_ERR "%s: %s/%s type %s != %s\n", __func__,
 176                       gd1->disk_name, gd2->disk_name,
 177                       b1->name, b2->name);
 178                return -1;
 179        }
 180
 181        return 0;
 182}
 183EXPORT_SYMBOL(blk_integrity_compare);
 184
 185int blk_integrity_merge_rq(struct request_queue *q, struct request *req,
 186                           struct request *next)
 187{
 188        if (blk_integrity_rq(req) != blk_integrity_rq(next))
 189                return -1;
 190
 191        if (req->nr_integrity_segments + next->nr_integrity_segments >
 192            q->limits.max_integrity_segments)
 193                return -1;
 194
 195        return 0;
 196}
 197EXPORT_SYMBOL(blk_integrity_merge_rq);
 198
 199int blk_integrity_merge_bio(struct request_queue *q, struct request *req,
 200                            struct bio *bio)
 201{
 202        int nr_integrity_segs;
 203        struct bio *next = bio->bi_next;
 204
 205        bio->bi_next = NULL;
 206        nr_integrity_segs = blk_rq_count_integrity_sg(q, bio);
 207        bio->bi_next = next;
 208
 209        if (req->nr_integrity_segments + nr_integrity_segs >
 210            q->limits.max_integrity_segments)
 211                return -1;
 212
 213        req->nr_integrity_segments += nr_integrity_segs;
 214
 215        return 0;
 216}
 217EXPORT_SYMBOL(blk_integrity_merge_bio);
 218
 219struct integrity_sysfs_entry {
 220        struct attribute attr;
 221        ssize_t (*show)(struct blk_integrity *, char *);
 222        ssize_t (*store)(struct blk_integrity *, const char *, size_t);
 223};
 224
 225static ssize_t integrity_attr_show(struct kobject *kobj, struct attribute *attr,
 226                                   char *page)
 227{
 228        struct blk_integrity *bi =
 229                container_of(kobj, struct blk_integrity, kobj);
 230        struct integrity_sysfs_entry *entry =
 231                container_of(attr, struct integrity_sysfs_entry, attr);
 232
 233        return entry->show(bi, page);
 234}
 235
 236static ssize_t integrity_attr_store(struct kobject *kobj,
 237                                    struct attribute *attr, const char *page,
 238                                    size_t count)
 239{
 240        struct blk_integrity *bi =
 241                container_of(kobj, struct blk_integrity, kobj);
 242        struct integrity_sysfs_entry *entry =
 243                container_of(attr, struct integrity_sysfs_entry, attr);
 244        ssize_t ret = 0;
 245
 246        if (entry->store)
 247                ret = entry->store(bi, page, count);
 248
 249        return ret;
 250}
 251
 252static ssize_t integrity_format_show(struct blk_integrity *bi, char *page)
 253{
 254        if (bi != NULL && bi->name != NULL)
 255                return sprintf(page, "%s\n", bi->name);
 256        else
 257                return sprintf(page, "none\n");
 258}
 259
 260static ssize_t integrity_tag_size_show(struct blk_integrity *bi, char *page)
 261{
 262        if (bi != NULL)
 263                return sprintf(page, "%u\n", bi->tag_size);
 264        else
 265                return sprintf(page, "0\n");
 266}
 267
 268static ssize_t integrity_read_store(struct blk_integrity *bi,
 269                                    const char *page, size_t count)
 270{
 271        char *p = (char *) page;
 272        unsigned long val = simple_strtoul(p, &p, 10);
 273
 274        if (val)
 275                bi->flags |= INTEGRITY_FLAG_READ;
 276        else
 277                bi->flags &= ~INTEGRITY_FLAG_READ;
 278
 279        return count;
 280}
 281
 282static ssize_t integrity_read_show(struct blk_integrity *bi, char *page)
 283{
 284        return sprintf(page, "%d\n", (bi->flags & INTEGRITY_FLAG_READ) != 0);
 285}
 286
 287static ssize_t integrity_write_store(struct blk_integrity *bi,
 288                                     const char *page, size_t count)
 289{
 290        char *p = (char *) page;
 291        unsigned long val = simple_strtoul(p, &p, 10);
 292
 293        if (val)
 294                bi->flags |= INTEGRITY_FLAG_WRITE;
 295        else
 296                bi->flags &= ~INTEGRITY_FLAG_WRITE;
 297
 298        return count;
 299}
 300
 301static ssize_t integrity_write_show(struct blk_integrity *bi, char *page)
 302{
 303        return sprintf(page, "%d\n", (bi->flags & INTEGRITY_FLAG_WRITE) != 0);
 304}
 305
 306static struct integrity_sysfs_entry integrity_format_entry = {
 307        .attr = { .name = "format", .mode = S_IRUGO },
 308        .show = integrity_format_show,
 309};
 310
 311static struct integrity_sysfs_entry integrity_tag_size_entry = {
 312        .attr = { .name = "tag_size", .mode = S_IRUGO },
 313        .show = integrity_tag_size_show,
 314};
 315
 316static struct integrity_sysfs_entry integrity_read_entry = {
 317        .attr = { .name = "read_verify", .mode = S_IRUGO | S_IWUSR },
 318        .show = integrity_read_show,
 319        .store = integrity_read_store,
 320};
 321
 322static struct integrity_sysfs_entry integrity_write_entry = {
 323        .attr = { .name = "write_generate", .mode = S_IRUGO | S_IWUSR },
 324        .show = integrity_write_show,
 325        .store = integrity_write_store,
 326};
 327
 328static struct attribute *integrity_attrs[] = {
 329        &integrity_format_entry.attr,
 330        &integrity_tag_size_entry.attr,
 331        &integrity_read_entry.attr,
 332        &integrity_write_entry.attr,
 333        NULL,
 334};
 335
 336static const struct sysfs_ops integrity_ops = {
 337        .show   = &integrity_attr_show,
 338        .store  = &integrity_attr_store,
 339};
 340
 341static int __init blk_dev_integrity_init(void)
 342{
 343        integrity_cachep = kmem_cache_create("blkdev_integrity",
 344                                             sizeof(struct blk_integrity),
 345                                             0, SLAB_PANIC, NULL);
 346        return 0;
 347}
 348subsys_initcall(blk_dev_integrity_init);
 349
 350static void blk_integrity_release(struct kobject *kobj)
 351{
 352        struct blk_integrity *bi =
 353                container_of(kobj, struct blk_integrity, kobj);
 354
 355        kmem_cache_free(integrity_cachep, bi);
 356}
 357
 358static struct kobj_type integrity_ktype = {
 359        .default_attrs  = integrity_attrs,
 360        .sysfs_ops      = &integrity_ops,
 361        .release        = blk_integrity_release,
 362};
 363
 364bool blk_integrity_is_initialized(struct gendisk *disk)
 365{
 366        struct blk_integrity *bi = blk_get_integrity(disk);
 367
 368        return (bi && bi->name && strcmp(bi->name, bi_unsupported_name) != 0);
 369}
 370EXPORT_SYMBOL(blk_integrity_is_initialized);
 371
 372/**
 373 * blk_integrity_register - Register a gendisk as being integrity-capable
 374 * @disk:       struct gendisk pointer to make integrity-aware
 375 * @template:   optional integrity profile to register
 376 *
 377 * Description: When a device needs to advertise itself as being able
 378 * to send/receive integrity metadata it must use this function to
 379 * register the capability with the block layer.  The template is a
 380 * blk_integrity struct with values appropriate for the underlying
 381 * hardware.  If template is NULL the new profile is allocated but
 382 * not filled out. See Documentation/block/data-integrity.txt.
 383 */
 384int blk_integrity_register(struct gendisk *disk, struct blk_integrity *template)
 385{
 386        struct blk_integrity *bi;
 387
 388        BUG_ON(disk == NULL);
 389
 390        if (disk->integrity == NULL) {
 391                bi = kmem_cache_alloc(integrity_cachep,
 392                                      GFP_KERNEL | __GFP_ZERO);
 393                if (!bi)
 394                        return -1;
 395
 396                if (kobject_init_and_add(&bi->kobj, &integrity_ktype,
 397                                         &disk_to_dev(disk)->kobj,
 398                                         "%s", "integrity")) {
 399                        kmem_cache_free(integrity_cachep, bi);
 400                        return -1;
 401                }
 402
 403                kobject_uevent(&bi->kobj, KOBJ_ADD);
 404
 405                bi->flags |= INTEGRITY_FLAG_READ | INTEGRITY_FLAG_WRITE;
 406                bi->sector_size = queue_logical_block_size(disk->queue);
 407                disk->integrity = bi;
 408        } else
 409                bi = disk->integrity;
 410
 411        /* Use the provided profile as template */
 412        if (template != NULL) {
 413                bi->name = template->name;
 414                bi->generate_fn = template->generate_fn;
 415                bi->verify_fn = template->verify_fn;
 416                bi->tuple_size = template->tuple_size;
 417                bi->set_tag_fn = template->set_tag_fn;
 418                bi->get_tag_fn = template->get_tag_fn;
 419                bi->tag_size = template->tag_size;
 420        } else
 421                bi->name = bi_unsupported_name;
 422
 423        disk->queue->backing_dev_info.capabilities |= BDI_CAP_STABLE_WRITES;
 424
 425        return 0;
 426}
 427EXPORT_SYMBOL(blk_integrity_register);
 428
 429/**
 430 * blk_integrity_unregister - Remove block integrity profile
 431 * @disk:       disk whose integrity profile to deallocate
 432 *
 433 * Description: This function frees all memory used by the block
 434 * integrity profile.  To be called at device teardown.
 435 */
 436void blk_integrity_unregister(struct gendisk *disk)
 437{
 438        struct blk_integrity *bi;
 439
 440        if (!disk || !disk->integrity)
 441                return;
 442
 443        disk->queue->backing_dev_info.capabilities &= ~BDI_CAP_STABLE_WRITES;
 444
 445        bi = disk->integrity;
 446
 447        kobject_uevent(&bi->kobj, KOBJ_REMOVE);
 448        kobject_del(&bi->kobj);
 449        kobject_put(&bi->kobj);
 450        disk->integrity = NULL;
 451}
 452EXPORT_SYMBOL(blk_integrity_unregister);
 453