Linux 3.9-rc4
[linux-2.6/cjktty.git] / block / blk-integrity.c
blobdabd221857e1b8fdf9eac1d2ead6d5a4a71efa2d
1 /*
2 * blk-integrity.c - Block layer data integrity extensions
4 * Copyright (C) 2007, 2008 Oracle Corporation
5 * Written by: Martin K. Petersen <martin.petersen@oracle.com>
7 * This program is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU General Public License version
9 * 2 as published by the Free Software Foundation.
11 * This program is distributed in the hope that it will be useful, but
12 * WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * General Public License for more details.
16 * You should have received a copy of the GNU General Public License
17 * along with this program; see the file COPYING. If not, write to
18 * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139,
19 * USA.
23 #include <linux/blkdev.h>
24 #include <linux/mempool.h>
25 #include <linux/bio.h>
26 #include <linux/scatterlist.h>
27 #include <linux/export.h>
28 #include <linux/slab.h>
30 #include "blk.h"
/* Slab cache from which this file allocates every struct blk_integrity. */
static struct kmem_cache *integrity_cachep;

/*
 * Profile name assigned to disks that register without a template.
 * Kept as a const array (not a writable pointer) so the placeholder
 * itself can never be re-pointed at run time.
 */
static const char bi_unsupported_name[] = "unsupported";
36 /**
37 * blk_rq_count_integrity_sg - Count number of integrity scatterlist elements
38 * @q: request queue
39 * @bio: bio with integrity metadata attached
41 * Description: Returns the number of elements required in a
42 * scatterlist corresponding to the integrity metadata in a bio.
44 int blk_rq_count_integrity_sg(struct request_queue *q, struct bio *bio)
46 struct bio_vec *iv, *ivprv = NULL;
47 unsigned int segments = 0;
48 unsigned int seg_size = 0;
49 unsigned int i = 0;
51 bio_for_each_integrity_vec(iv, bio, i) {
53 if (ivprv) {
54 if (!BIOVEC_PHYS_MERGEABLE(ivprv, iv))
55 goto new_segment;
57 if (!BIOVEC_SEG_BOUNDARY(q, ivprv, iv))
58 goto new_segment;
60 if (seg_size + iv->bv_len > queue_max_segment_size(q))
61 goto new_segment;
63 seg_size += iv->bv_len;
64 } else {
65 new_segment:
66 segments++;
67 seg_size = iv->bv_len;
70 ivprv = iv;
73 return segments;
75 EXPORT_SYMBOL(blk_rq_count_integrity_sg);
77 /**
78 * blk_rq_map_integrity_sg - Map integrity metadata into a scatterlist
79 * @q: request queue
80 * @bio: bio with integrity metadata attached
81 * @sglist: target scatterlist
83 * Description: Map the integrity vectors in request into a
84 * scatterlist. The scatterlist must be big enough to hold all
85 * elements. I.e. sized using blk_rq_count_integrity_sg().
87 int blk_rq_map_integrity_sg(struct request_queue *q, struct bio *bio,
88 struct scatterlist *sglist)
90 struct bio_vec *iv, *ivprv = NULL;
91 struct scatterlist *sg = NULL;
92 unsigned int segments = 0;
93 unsigned int i = 0;
95 bio_for_each_integrity_vec(iv, bio, i) {
97 if (ivprv) {
98 if (!BIOVEC_PHYS_MERGEABLE(ivprv, iv))
99 goto new_segment;
101 if (!BIOVEC_SEG_BOUNDARY(q, ivprv, iv))
102 goto new_segment;
104 if (sg->length + iv->bv_len > queue_max_segment_size(q))
105 goto new_segment;
107 sg->length += iv->bv_len;
108 } else {
109 new_segment:
110 if (!sg)
111 sg = sglist;
112 else {
113 sg->page_link &= ~0x02;
114 sg = sg_next(sg);
117 sg_set_page(sg, iv->bv_page, iv->bv_len, iv->bv_offset);
118 segments++;
121 ivprv = iv;
124 if (sg)
125 sg_mark_end(sg);
127 return segments;
129 EXPORT_SYMBOL(blk_rq_map_integrity_sg);
132 * blk_integrity_compare - Compare integrity profile of two disks
133 * @gd1: Disk to compare
134 * @gd2: Disk to compare
136 * Description: Meta-devices like DM and MD need to verify that all
137 * sub-devices use the same integrity format before advertising to
138 * upper layers that they can send/receive integrity metadata. This
139 * function can be used to check whether two gendisk devices have
140 * compatible integrity formats.
142 int blk_integrity_compare(struct gendisk *gd1, struct gendisk *gd2)
144 struct blk_integrity *b1 = gd1->integrity;
145 struct blk_integrity *b2 = gd2->integrity;
147 if (!b1 && !b2)
148 return 0;
150 if (!b1 || !b2)
151 return -1;
153 if (b1->sector_size != b2->sector_size) {
154 printk(KERN_ERR "%s: %s/%s sector sz %u != %u\n", __func__,
155 gd1->disk_name, gd2->disk_name,
156 b1->sector_size, b2->sector_size);
157 return -1;
160 if (b1->tuple_size != b2->tuple_size) {
161 printk(KERN_ERR "%s: %s/%s tuple sz %u != %u\n", __func__,
162 gd1->disk_name, gd2->disk_name,
163 b1->tuple_size, b2->tuple_size);
164 return -1;
167 if (b1->tag_size && b2->tag_size && (b1->tag_size != b2->tag_size)) {
168 printk(KERN_ERR "%s: %s/%s tag sz %u != %u\n", __func__,
169 gd1->disk_name, gd2->disk_name,
170 b1->tag_size, b2->tag_size);
171 return -1;
174 if (strcmp(b1->name, b2->name)) {
175 printk(KERN_ERR "%s: %s/%s type %s != %s\n", __func__,
176 gd1->disk_name, gd2->disk_name,
177 b1->name, b2->name);
178 return -1;
181 return 0;
183 EXPORT_SYMBOL(blk_integrity_compare);
185 int blk_integrity_merge_rq(struct request_queue *q, struct request *req,
186 struct request *next)
188 if (blk_integrity_rq(req) != blk_integrity_rq(next))
189 return -1;
191 if (req->nr_integrity_segments + next->nr_integrity_segments >
192 q->limits.max_integrity_segments)
193 return -1;
195 return 0;
197 EXPORT_SYMBOL(blk_integrity_merge_rq);
199 int blk_integrity_merge_bio(struct request_queue *q, struct request *req,
200 struct bio *bio)
202 int nr_integrity_segs;
203 struct bio *next = bio->bi_next;
205 bio->bi_next = NULL;
206 nr_integrity_segs = blk_rq_count_integrity_sg(q, bio);
207 bio->bi_next = next;
209 if (req->nr_integrity_segments + nr_integrity_segs >
210 q->limits.max_integrity_segments)
211 return -1;
213 req->nr_integrity_segments += nr_integrity_segs;
215 return 0;
217 EXPORT_SYMBOL(blk_integrity_merge_bio);
219 struct integrity_sysfs_entry {
220 struct attribute attr;
221 ssize_t (*show)(struct blk_integrity *, char *);
222 ssize_t (*store)(struct blk_integrity *, const char *, size_t);
225 static ssize_t integrity_attr_show(struct kobject *kobj, struct attribute *attr,
226 char *page)
228 struct blk_integrity *bi =
229 container_of(kobj, struct blk_integrity, kobj);
230 struct integrity_sysfs_entry *entry =
231 container_of(attr, struct integrity_sysfs_entry, attr);
233 return entry->show(bi, page);
236 static ssize_t integrity_attr_store(struct kobject *kobj,
237 struct attribute *attr, const char *page,
238 size_t count)
240 struct blk_integrity *bi =
241 container_of(kobj, struct blk_integrity, kobj);
242 struct integrity_sysfs_entry *entry =
243 container_of(attr, struct integrity_sysfs_entry, attr);
244 ssize_t ret = 0;
246 if (entry->store)
247 ret = entry->store(bi, page, count);
249 return ret;
252 static ssize_t integrity_format_show(struct blk_integrity *bi, char *page)
254 if (bi != NULL && bi->name != NULL)
255 return sprintf(page, "%s\n", bi->name);
256 else
257 return sprintf(page, "none\n");
260 static ssize_t integrity_tag_size_show(struct blk_integrity *bi, char *page)
262 if (bi != NULL)
263 return sprintf(page, "%u\n", bi->tag_size);
264 else
265 return sprintf(page, "0\n");
268 static ssize_t integrity_read_store(struct blk_integrity *bi,
269 const char *page, size_t count)
271 char *p = (char *) page;
272 unsigned long val = simple_strtoul(p, &p, 10);
274 if (val)
275 bi->flags |= INTEGRITY_FLAG_READ;
276 else
277 bi->flags &= ~INTEGRITY_FLAG_READ;
279 return count;
282 static ssize_t integrity_read_show(struct blk_integrity *bi, char *page)
284 return sprintf(page, "%d\n", (bi->flags & INTEGRITY_FLAG_READ) != 0);
287 static ssize_t integrity_write_store(struct blk_integrity *bi,
288 const char *page, size_t count)
290 char *p = (char *) page;
291 unsigned long val = simple_strtoul(p, &p, 10);
293 if (val)
294 bi->flags |= INTEGRITY_FLAG_WRITE;
295 else
296 bi->flags &= ~INTEGRITY_FLAG_WRITE;
298 return count;
301 static ssize_t integrity_write_show(struct blk_integrity *bi, char *page)
303 return sprintf(page, "%d\n", (bi->flags & INTEGRITY_FLAG_WRITE) != 0);
306 static struct integrity_sysfs_entry integrity_format_entry = {
307 .attr = { .name = "format", .mode = S_IRUGO },
308 .show = integrity_format_show,
311 static struct integrity_sysfs_entry integrity_tag_size_entry = {
312 .attr = { .name = "tag_size", .mode = S_IRUGO },
313 .show = integrity_tag_size_show,
316 static struct integrity_sysfs_entry integrity_read_entry = {
317 .attr = { .name = "read_verify", .mode = S_IRUGO | S_IWUSR },
318 .show = integrity_read_show,
319 .store = integrity_read_store,
322 static struct integrity_sysfs_entry integrity_write_entry = {
323 .attr = { .name = "write_generate", .mode = S_IRUGO | S_IWUSR },
324 .show = integrity_write_show,
325 .store = integrity_write_store,
328 static struct attribute *integrity_attrs[] = {
329 &integrity_format_entry.attr,
330 &integrity_tag_size_entry.attr,
331 &integrity_read_entry.attr,
332 &integrity_write_entry.attr,
333 NULL,
336 static const struct sysfs_ops integrity_ops = {
337 .show = &integrity_attr_show,
338 .store = &integrity_attr_store,
341 static int __init blk_dev_integrity_init(void)
343 integrity_cachep = kmem_cache_create("blkdev_integrity",
344 sizeof(struct blk_integrity),
345 0, SLAB_PANIC, NULL);
346 return 0;
348 subsys_initcall(blk_dev_integrity_init);
350 static void blk_integrity_release(struct kobject *kobj)
352 struct blk_integrity *bi =
353 container_of(kobj, struct blk_integrity, kobj);
355 kmem_cache_free(integrity_cachep, bi);
358 static struct kobj_type integrity_ktype = {
359 .default_attrs = integrity_attrs,
360 .sysfs_ops = &integrity_ops,
361 .release = blk_integrity_release,
364 bool blk_integrity_is_initialized(struct gendisk *disk)
366 struct blk_integrity *bi = blk_get_integrity(disk);
368 return (bi && bi->name && strcmp(bi->name, bi_unsupported_name) != 0);
370 EXPORT_SYMBOL(blk_integrity_is_initialized);
373 * blk_integrity_register - Register a gendisk as being integrity-capable
374 * @disk: struct gendisk pointer to make integrity-aware
375 * @template: optional integrity profile to register
377 * Description: When a device needs to advertise itself as being able
378 * to send/receive integrity metadata it must use this function to
379 * register the capability with the block layer. The template is a
380 * blk_integrity struct with values appropriate for the underlying
381 * hardware. If template is NULL the new profile is allocated but
382 * not filled out. See Documentation/block/data-integrity.txt.
384 int blk_integrity_register(struct gendisk *disk, struct blk_integrity *template)
386 struct blk_integrity *bi;
388 BUG_ON(disk == NULL);
390 if (disk->integrity == NULL) {
391 bi = kmem_cache_alloc(integrity_cachep,
392 GFP_KERNEL | __GFP_ZERO);
393 if (!bi)
394 return -1;
396 if (kobject_init_and_add(&bi->kobj, &integrity_ktype,
397 &disk_to_dev(disk)->kobj,
398 "%s", "integrity")) {
399 kmem_cache_free(integrity_cachep, bi);
400 return -1;
403 kobject_uevent(&bi->kobj, KOBJ_ADD);
405 bi->flags |= INTEGRITY_FLAG_READ | INTEGRITY_FLAG_WRITE;
406 bi->sector_size = queue_logical_block_size(disk->queue);
407 disk->integrity = bi;
408 } else
409 bi = disk->integrity;
411 /* Use the provided profile as template */
412 if (template != NULL) {
413 bi->name = template->name;
414 bi->generate_fn = template->generate_fn;
415 bi->verify_fn = template->verify_fn;
416 bi->tuple_size = template->tuple_size;
417 bi->set_tag_fn = template->set_tag_fn;
418 bi->get_tag_fn = template->get_tag_fn;
419 bi->tag_size = template->tag_size;
420 } else
421 bi->name = bi_unsupported_name;
423 disk->queue->backing_dev_info.capabilities |= BDI_CAP_STABLE_WRITES;
425 return 0;
427 EXPORT_SYMBOL(blk_integrity_register);
430 * blk_integrity_unregister - Remove block integrity profile
431 * @disk: disk whose integrity profile to deallocate
433 * Description: This function frees all memory used by the block
434 * integrity profile. To be called at device teardown.
436 void blk_integrity_unregister(struct gendisk *disk)
438 struct blk_integrity *bi;
440 if (!disk || !disk->integrity)
441 return;
443 disk->queue->backing_dev_info.capabilities &= ~BDI_CAP_STABLE_WRITES;
445 bi = disk->integrity;
447 kobject_uevent(&bi->kobj, KOBJ_REMOVE);
448 kobject_del(&bi->kobj);
449 kobject_put(&bi->kobj);
450 disk->integrity = NULL;
452 EXPORT_SYMBOL(blk_integrity_unregister);