11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * gendisk handling 31da177e4SLinus Torvalds */ 41da177e4SLinus Torvalds 51da177e4SLinus Torvalds #include <linux/module.h> 61da177e4SLinus Torvalds #include <linux/fs.h> 71da177e4SLinus Torvalds #include <linux/genhd.h> 8b446b60eSAndrew Morton #include <linux/kdev_t.h> 91da177e4SLinus Torvalds #include <linux/kernel.h> 101da177e4SLinus Torvalds #include <linux/blkdev.h> 111da177e4SLinus Torvalds #include <linux/init.h> 121da177e4SLinus Torvalds #include <linux/spinlock.h> 13f500975aSAlexey Dobriyan #include <linux/proc_fs.h> 141da177e4SLinus Torvalds #include <linux/seq_file.h> 151da177e4SLinus Torvalds #include <linux/slab.h> 161da177e4SLinus Torvalds #include <linux/kmod.h> 171da177e4SLinus Torvalds #include <linux/kobj_map.h> 182ef41634SChristoph Hellwig #include <linux/buffer_head.h> 1958383af6SJes Sorensen #include <linux/mutex.h> 20bcce3de1STejun Heo #include <linux/idr.h> 2177ea887eSTejun Heo #include <linux/log2.h> 221da177e4SLinus Torvalds 23ff88972cSAdrian Bunk #include "blk.h" 24ff88972cSAdrian Bunk 25edfaa7c3SKay Sievers static DEFINE_MUTEX(block_class_lock); 26edfaa7c3SKay Sievers struct kobject *block_depr; 271da177e4SLinus Torvalds 28bcce3de1STejun Heo /* for extended dynamic devt allocation, currently only one major is used */ 29bcce3de1STejun Heo #define MAX_EXT_DEVT (1 << MINORBITS) 30bcce3de1STejun Heo 31bcce3de1STejun Heo /* For extended devt allocation. ext_devt_mutex prevents look up 32bcce3de1STejun Heo * results from going away underneath its user. 33bcce3de1STejun Heo */ 34bcce3de1STejun Heo static DEFINE_MUTEX(ext_devt_mutex); 35bcce3de1STejun Heo static DEFINE_IDR(ext_devt_idr); 36bcce3de1STejun Heo 371826eadfSAdrian Bunk static struct device_type disk_type; 381826eadfSAdrian Bunk 3977ea887eSTejun Heo static void disk_add_events(struct gendisk *disk); 4077ea887eSTejun Heo static void disk_del_events(struct gendisk *disk); 4177ea887eSTejun Heo static void disk_release_events(struct gendisk *disk); 4277ea887eSTejun Heo 43e71bf0d0STejun Heo /** 44e71bf0d0STejun Heo * disk_get_part - get partition 45e71bf0d0STejun Heo * @disk: disk to look partition from 46e71bf0d0STejun Heo * @partno: partition number 47e71bf0d0STejun Heo * 48e71bf0d0STejun Heo * Look for partition @partno from @disk. If found, increment 49e71bf0d0STejun Heo * reference count and return it. 50e71bf0d0STejun Heo * 51e71bf0d0STejun Heo * CONTEXT: 52e71bf0d0STejun Heo * Don't care. 53e71bf0d0STejun Heo * 54e71bf0d0STejun Heo * RETURNS: 55e71bf0d0STejun Heo * Pointer to the found partition on success, NULL if not found. 56e71bf0d0STejun Heo */ 57e71bf0d0STejun Heo struct hd_struct *disk_get_part(struct gendisk *disk, int partno) 58e71bf0d0STejun Heo { 59540eed56STejun Heo struct hd_struct *part = NULL; 60540eed56STejun Heo struct disk_part_tbl *ptbl; 61e71bf0d0STejun Heo 62540eed56STejun Heo if (unlikely(partno < 0)) 63e71bf0d0STejun Heo return NULL; 64540eed56STejun Heo 65e71bf0d0STejun Heo rcu_read_lock(); 66540eed56STejun Heo 67540eed56STejun Heo ptbl = rcu_dereference(disk->part_tbl); 68540eed56STejun Heo if (likely(partno < ptbl->len)) { 69540eed56STejun Heo part = rcu_dereference(ptbl->part[partno]); 70e71bf0d0STejun Heo if (part) 71ed9e1982STejun Heo get_device(part_to_dev(part)); 72540eed56STejun Heo } 73540eed56STejun Heo 74e71bf0d0STejun Heo rcu_read_unlock(); 75e71bf0d0STejun Heo 76e71bf0d0STejun Heo return part; 77e71bf0d0STejun Heo } 78e71bf0d0STejun Heo EXPORT_SYMBOL_GPL(disk_get_part); 79e71bf0d0STejun Heo 80e71bf0d0STejun Heo /** 81e71bf0d0STejun Heo * disk_part_iter_init - initialize partition iterator 82e71bf0d0STejun Heo * @piter: iterator to initialize 83e71bf0d0STejun Heo * @disk: disk to iterate over 84e71bf0d0STejun Heo * @flags: DISK_PITER_* flags 85e71bf0d0STejun Heo * 86e71bf0d0STejun Heo * Initialize @piter so that it iterates over partitions of @disk. 87e71bf0d0STejun Heo * 88e71bf0d0STejun Heo * CONTEXT: 89e71bf0d0STejun Heo * Don't care. 90e71bf0d0STejun Heo */ 91e71bf0d0STejun Heo void disk_part_iter_init(struct disk_part_iter *piter, struct gendisk *disk, 92e71bf0d0STejun Heo unsigned int flags) 93e71bf0d0STejun Heo { 94540eed56STejun Heo struct disk_part_tbl *ptbl; 95540eed56STejun Heo 96540eed56STejun Heo rcu_read_lock(); 97540eed56STejun Heo ptbl = rcu_dereference(disk->part_tbl); 98540eed56STejun Heo 99e71bf0d0STejun Heo piter->disk = disk; 100e71bf0d0STejun Heo piter->part = NULL; 101e71bf0d0STejun Heo 102e71bf0d0STejun Heo if (flags & DISK_PITER_REVERSE) 103540eed56STejun Heo piter->idx = ptbl->len - 1; 10471982a40STejun Heo else if (flags & (DISK_PITER_INCL_PART0 | DISK_PITER_INCL_EMPTY_PART0)) 105e71bf0d0STejun Heo piter->idx = 0; 106b5d0b9dfSTejun Heo else 107b5d0b9dfSTejun Heo piter->idx = 1; 108e71bf0d0STejun Heo 109e71bf0d0STejun Heo piter->flags = flags; 110540eed56STejun Heo 111540eed56STejun Heo rcu_read_unlock(); 112e71bf0d0STejun Heo } 113e71bf0d0STejun Heo EXPORT_SYMBOL_GPL(disk_part_iter_init); 114e71bf0d0STejun Heo 115e71bf0d0STejun Heo /** 116e71bf0d0STejun Heo * disk_part_iter_next - proceed iterator to the next partition and return it 117e71bf0d0STejun Heo * @piter: iterator of interest 118e71bf0d0STejun Heo * 119e71bf0d0STejun Heo * Proceed @piter to the next partition and return it. 120e71bf0d0STejun Heo * 121e71bf0d0STejun Heo * CONTEXT: 122e71bf0d0STejun Heo * Don't care. 123e71bf0d0STejun Heo */ 124e71bf0d0STejun Heo struct hd_struct *disk_part_iter_next(struct disk_part_iter *piter) 125e71bf0d0STejun Heo { 126540eed56STejun Heo struct disk_part_tbl *ptbl; 127e71bf0d0STejun Heo int inc, end; 128e71bf0d0STejun Heo 129e71bf0d0STejun Heo /* put the last partition */ 130e71bf0d0STejun Heo disk_put_part(piter->part); 131e71bf0d0STejun Heo piter->part = NULL; 132e71bf0d0STejun Heo 133540eed56STejun Heo /* get part_tbl */ 134e71bf0d0STejun Heo rcu_read_lock(); 135540eed56STejun Heo ptbl = rcu_dereference(piter->disk->part_tbl); 136e71bf0d0STejun Heo 137e71bf0d0STejun Heo /* determine iteration parameters */ 138e71bf0d0STejun Heo if (piter->flags & DISK_PITER_REVERSE) { 139e71bf0d0STejun Heo inc = -1; 14071982a40STejun Heo if (piter->flags & (DISK_PITER_INCL_PART0 | 14171982a40STejun Heo DISK_PITER_INCL_EMPTY_PART0)) 142e71bf0d0STejun Heo end = -1; 143b5d0b9dfSTejun Heo else 144b5d0b9dfSTejun Heo end = 0; 145e71bf0d0STejun Heo } else { 146e71bf0d0STejun Heo inc = 1; 147540eed56STejun Heo end = ptbl->len; 148e71bf0d0STejun Heo } 149e71bf0d0STejun Heo 150e71bf0d0STejun Heo /* iterate to the next partition */ 151e71bf0d0STejun Heo for (; piter->idx != end; piter->idx += inc) { 152e71bf0d0STejun Heo struct hd_struct *part; 153e71bf0d0STejun Heo 154540eed56STejun Heo part = rcu_dereference(ptbl->part[piter->idx]); 155e71bf0d0STejun Heo if (!part) 156e71bf0d0STejun Heo continue; 15771982a40STejun Heo if (!part->nr_sects && 15871982a40STejun Heo !(piter->flags & DISK_PITER_INCL_EMPTY) && 15971982a40STejun Heo !(piter->flags & DISK_PITER_INCL_EMPTY_PART0 && 16071982a40STejun Heo piter->idx == 0)) 161e71bf0d0STejun Heo continue; 162e71bf0d0STejun Heo 163ed9e1982STejun Heo get_device(part_to_dev(part)); 164e71bf0d0STejun Heo piter->part = part; 165e71bf0d0STejun Heo piter->idx += inc; 166e71bf0d0STejun Heo break; 167e71bf0d0STejun Heo } 168e71bf0d0STejun Heo 169e71bf0d0STejun Heo rcu_read_unlock(); 170e71bf0d0STejun Heo 171e71bf0d0STejun Heo return piter->part; 172e71bf0d0STejun Heo } 173e71bf0d0STejun Heo EXPORT_SYMBOL_GPL(disk_part_iter_next); 174e71bf0d0STejun Heo 175e71bf0d0STejun Heo /** 176e71bf0d0STejun Heo * disk_part_iter_exit - finish up partition iteration 177e71bf0d0STejun Heo * @piter: iter of interest 178e71bf0d0STejun Heo * 179e71bf0d0STejun Heo * Called when iteration is over. Cleans up @piter. 180e71bf0d0STejun Heo * 181e71bf0d0STejun Heo * CONTEXT: 182e71bf0d0STejun Heo * Don't care. 183e71bf0d0STejun Heo */ 184e71bf0d0STejun Heo void disk_part_iter_exit(struct disk_part_iter *piter) 185e71bf0d0STejun Heo { 186e71bf0d0STejun Heo disk_put_part(piter->part); 187e71bf0d0STejun Heo piter->part = NULL; 188e71bf0d0STejun Heo } 189e71bf0d0STejun Heo EXPORT_SYMBOL_GPL(disk_part_iter_exit); 190e71bf0d0STejun Heo 191a6f23657SJens Axboe static inline int sector_in_part(struct hd_struct *part, sector_t sector) 192a6f23657SJens Axboe { 193a6f23657SJens Axboe return part->start_sect <= sector && 194a6f23657SJens Axboe sector < part->start_sect + part->nr_sects; 195a6f23657SJens Axboe } 196a6f23657SJens Axboe 197e71bf0d0STejun Heo /** 198e71bf0d0STejun Heo * disk_map_sector_rcu - map sector to partition 199e71bf0d0STejun Heo * @disk: gendisk of interest 200e71bf0d0STejun Heo * @sector: sector to map 201e71bf0d0STejun Heo * 202e71bf0d0STejun Heo * Find out which partition @sector maps to on @disk. This is 203e71bf0d0STejun Heo * primarily used for stats accounting. 204e71bf0d0STejun Heo * 205e71bf0d0STejun Heo * CONTEXT: 206e71bf0d0STejun Heo * RCU read locked. The returned partition pointer is valid only 207e71bf0d0STejun Heo * while preemption is disabled. 208e71bf0d0STejun Heo * 209e71bf0d0STejun Heo * RETURNS: 210074a7acaSTejun Heo * Found partition on success, part0 is returned if no partition matches 211e71bf0d0STejun Heo */ 212e71bf0d0STejun Heo struct hd_struct *disk_map_sector_rcu(struct gendisk *disk, sector_t sector) 213e71bf0d0STejun Heo { 214540eed56STejun Heo struct disk_part_tbl *ptbl; 215a6f23657SJens Axboe struct hd_struct *part; 216e71bf0d0STejun Heo int i; 217e71bf0d0STejun Heo 218540eed56STejun Heo ptbl = rcu_dereference(disk->part_tbl); 219540eed56STejun Heo 220a6f23657SJens Axboe part = rcu_dereference(ptbl->last_lookup); 221a6f23657SJens Axboe if (part && sector_in_part(part, sector)) 222e71bf0d0STejun Heo return part; 223a6f23657SJens Axboe 224a6f23657SJens Axboe for (i = 1; i < ptbl->len; i++) { 225a6f23657SJens Axboe part = rcu_dereference(ptbl->part[i]); 226a6f23657SJens Axboe 227a6f23657SJens Axboe if (part && sector_in_part(part, sector)) { 228a6f23657SJens Axboe rcu_assign_pointer(ptbl->last_lookup, part); 229a6f23657SJens Axboe return part; 230a6f23657SJens Axboe } 231e71bf0d0STejun Heo } 232074a7acaSTejun Heo return &disk->part0; 233e71bf0d0STejun Heo } 234e71bf0d0STejun Heo EXPORT_SYMBOL_GPL(disk_map_sector_rcu); 235e71bf0d0STejun Heo 2361da177e4SLinus Torvalds /* 2371da177e4SLinus Torvalds * Can be deleted altogether. Later. 2381da177e4SLinus Torvalds * 2391da177e4SLinus Torvalds */ 2401da177e4SLinus Torvalds static struct blk_major_name { 2411da177e4SLinus Torvalds struct blk_major_name *next; 2421da177e4SLinus Torvalds int major; 2431da177e4SLinus Torvalds char name[16]; 24468eef3b4SJoe Korty } *major_names[BLKDEV_MAJOR_HASH_SIZE]; 2451da177e4SLinus Torvalds 2461da177e4SLinus Torvalds /* index in the above - for now: assume no multimajor ranges */ 247e61eb2e9SYang Zhang static inline int major_to_index(unsigned major) 2481da177e4SLinus Torvalds { 24968eef3b4SJoe Korty return major % BLKDEV_MAJOR_HASH_SIZE; 2501da177e4SLinus Torvalds } 2511da177e4SLinus Torvalds 25268eef3b4SJoe Korty #ifdef CONFIG_PROC_FS 253cf771cb5STejun Heo void blkdev_show(struct seq_file *seqf, off_t offset) 2547170be5fSNeil Horman { 25568eef3b4SJoe Korty struct blk_major_name *dp; 2567170be5fSNeil Horman 25768eef3b4SJoe Korty if (offset < BLKDEV_MAJOR_HASH_SIZE) { 258edfaa7c3SKay Sievers mutex_lock(&block_class_lock); 25968eef3b4SJoe Korty for (dp = major_names[offset]; dp; dp = dp->next) 260cf771cb5STejun Heo seq_printf(seqf, "%3d %s\n", dp->major, dp->name); 261edfaa7c3SKay Sievers mutex_unlock(&block_class_lock); 26268eef3b4SJoe Korty } 2637170be5fSNeil Horman } 26468eef3b4SJoe Korty #endif /* CONFIG_PROC_FS */ 2651da177e4SLinus Torvalds 2669e8c0bccSMárton Németh /** 2679e8c0bccSMárton Németh * register_blkdev - register a new block device 2689e8c0bccSMárton Németh * 2699e8c0bccSMárton Németh * @major: the requested major device number [1..255]. If @major=0, try to 2709e8c0bccSMárton Németh * allocate any unused major number. 2719e8c0bccSMárton Németh * @name: the name of the new block device as a zero terminated string 2729e8c0bccSMárton Németh * 2739e8c0bccSMárton Németh * The @name must be unique within the system. 2749e8c0bccSMárton Németh * 2759e8c0bccSMárton Németh * The return value depends on the @major input parameter. 2769e8c0bccSMárton Németh * - if a major device number was requested in range [1..255] then the 2779e8c0bccSMárton Németh * function returns zero on success, or a negative error code 2789e8c0bccSMárton Németh * - if any unused major number was requested with @major=0 parameter 2799e8c0bccSMárton Németh * then the return value is the allocated major number in range 2809e8c0bccSMárton Németh * [1..255] or a negative error code otherwise 2819e8c0bccSMárton Németh */ 2821da177e4SLinus Torvalds int register_blkdev(unsigned int major, const char *name) 2831da177e4SLinus Torvalds { 2841da177e4SLinus Torvalds struct blk_major_name **n, *p; 2851da177e4SLinus Torvalds int index, ret = 0; 2861da177e4SLinus Torvalds 287edfaa7c3SKay Sievers mutex_lock(&block_class_lock); 2881da177e4SLinus Torvalds 2891da177e4SLinus Torvalds /* temporary */ 2901da177e4SLinus Torvalds if (major == 0) { 2911da177e4SLinus Torvalds for (index = ARRAY_SIZE(major_names)-1; index > 0; index--) { 2921da177e4SLinus Torvalds if (major_names[index] == NULL) 2931da177e4SLinus Torvalds break; 2941da177e4SLinus Torvalds } 2951da177e4SLinus Torvalds 2961da177e4SLinus Torvalds if (index == 0) { 2971da177e4SLinus Torvalds printk("register_blkdev: failed to get major for %s\n", 2981da177e4SLinus Torvalds name); 2991da177e4SLinus Torvalds ret = -EBUSY; 3001da177e4SLinus Torvalds goto out; 3011da177e4SLinus Torvalds } 3021da177e4SLinus Torvalds major = index; 3031da177e4SLinus Torvalds ret = major; 3041da177e4SLinus Torvalds } 3051da177e4SLinus Torvalds 3061da177e4SLinus Torvalds p = kmalloc(sizeof(struct blk_major_name), GFP_KERNEL); 3071da177e4SLinus Torvalds if (p == NULL) { 3081da177e4SLinus Torvalds ret = -ENOMEM; 3091da177e4SLinus Torvalds goto out; 3101da177e4SLinus Torvalds } 3111da177e4SLinus Torvalds 3121da177e4SLinus Torvalds p->major = major; 3131da177e4SLinus Torvalds strlcpy(p->name, name, sizeof(p->name)); 3141da177e4SLinus Torvalds p->next = NULL; 3151da177e4SLinus Torvalds index = major_to_index(major); 3161da177e4SLinus Torvalds 3171da177e4SLinus Torvalds for (n = &major_names[index]; *n; n = &(*n)->next) { 3181da177e4SLinus Torvalds if ((*n)->major == major) 3191da177e4SLinus Torvalds break; 3201da177e4SLinus Torvalds } 3211da177e4SLinus Torvalds if (!*n) 3221da177e4SLinus Torvalds *n = p; 3231da177e4SLinus Torvalds else 3241da177e4SLinus Torvalds ret = -EBUSY; 3251da177e4SLinus Torvalds 3261da177e4SLinus Torvalds if (ret < 0) { 3271da177e4SLinus Torvalds printk("register_blkdev: cannot get major %d for %s\n", 3281da177e4SLinus Torvalds major, name); 3291da177e4SLinus Torvalds kfree(p); 3301da177e4SLinus Torvalds } 3311da177e4SLinus Torvalds out: 332edfaa7c3SKay Sievers mutex_unlock(&block_class_lock); 3331da177e4SLinus Torvalds return ret; 3341da177e4SLinus Torvalds } 3351da177e4SLinus Torvalds 3361da177e4SLinus Torvalds EXPORT_SYMBOL(register_blkdev); 3371da177e4SLinus Torvalds 338f4480240SAkinobu Mita void unregister_blkdev(unsigned int major, const char *name) 3391da177e4SLinus Torvalds { 3401da177e4SLinus Torvalds struct blk_major_name **n; 3411da177e4SLinus Torvalds struct blk_major_name *p = NULL; 3421da177e4SLinus Torvalds int index = major_to_index(major); 3431da177e4SLinus Torvalds 344edfaa7c3SKay Sievers mutex_lock(&block_class_lock); 3451da177e4SLinus Torvalds for (n = &major_names[index]; *n; n = &(*n)->next) 3461da177e4SLinus Torvalds if ((*n)->major == major) 3471da177e4SLinus Torvalds break; 348294462a5SAkinobu Mita if (!*n || strcmp((*n)->name, name)) { 349294462a5SAkinobu Mita WARN_ON(1); 350294462a5SAkinobu Mita } else { 3511da177e4SLinus Torvalds p = *n; 3521da177e4SLinus Torvalds *n = p->next; 3531da177e4SLinus Torvalds } 354edfaa7c3SKay Sievers mutex_unlock(&block_class_lock); 3551da177e4SLinus Torvalds kfree(p); 3561da177e4SLinus Torvalds } 3571da177e4SLinus Torvalds 3581da177e4SLinus Torvalds EXPORT_SYMBOL(unregister_blkdev); 3591da177e4SLinus Torvalds 3601da177e4SLinus Torvalds static struct kobj_map *bdev_map; 3611da177e4SLinus Torvalds 362bcce3de1STejun Heo /** 363870d6656STejun Heo * blk_mangle_minor - scatter minor numbers apart 364870d6656STejun Heo * @minor: minor number to mangle 365870d6656STejun Heo * 366870d6656STejun Heo * Scatter consecutively allocated @minor number apart if MANGLE_DEVT 367870d6656STejun Heo * is enabled. Mangling twice gives the original value. 368870d6656STejun Heo * 369870d6656STejun Heo * RETURNS: 370870d6656STejun Heo * Mangled value. 371870d6656STejun Heo * 372870d6656STejun Heo * CONTEXT: 373870d6656STejun Heo * Don't care. 374870d6656STejun Heo */ 375870d6656STejun Heo static int blk_mangle_minor(int minor) 376870d6656STejun Heo { 377870d6656STejun Heo #ifdef CONFIG_DEBUG_BLOCK_EXT_DEVT 378870d6656STejun Heo int i; 379870d6656STejun Heo 380870d6656STejun Heo for (i = 0; i < MINORBITS / 2; i++) { 381870d6656STejun Heo int low = minor & (1 << i); 382870d6656STejun Heo int high = minor & (1 << (MINORBITS - 1 - i)); 383870d6656STejun Heo int distance = MINORBITS - 1 - 2 * i; 384870d6656STejun Heo 385870d6656STejun Heo minor ^= low | high; /* clear both bits */ 386870d6656STejun Heo low <<= distance; /* swap the positions */ 387870d6656STejun Heo high >>= distance; 388870d6656STejun Heo minor |= low | high; /* and set */ 389870d6656STejun Heo } 390870d6656STejun Heo #endif 391870d6656STejun Heo return minor; 392870d6656STejun Heo } 393870d6656STejun Heo 394870d6656STejun Heo /** 395bcce3de1STejun Heo * blk_alloc_devt - allocate a dev_t for a partition 396bcce3de1STejun Heo * @part: partition to allocate dev_t for 397bcce3de1STejun Heo * @devt: out parameter for resulting dev_t 398bcce3de1STejun Heo * 399bcce3de1STejun Heo * Allocate a dev_t for block device. 400bcce3de1STejun Heo * 401bcce3de1STejun Heo * RETURNS: 402bcce3de1STejun Heo * 0 on success, allocated dev_t is returned in *@devt. -errno on 403bcce3de1STejun Heo * failure. 404bcce3de1STejun Heo * 405bcce3de1STejun Heo * CONTEXT: 406bcce3de1STejun Heo * Might sleep. 407bcce3de1STejun Heo */ 408bcce3de1STejun Heo int blk_alloc_devt(struct hd_struct *part, dev_t *devt) 409bcce3de1STejun Heo { 410bcce3de1STejun Heo struct gendisk *disk = part_to_disk(part); 411bcce3de1STejun Heo int idx, rc; 412bcce3de1STejun Heo 413bcce3de1STejun Heo /* in consecutive minor range? */ 414bcce3de1STejun Heo if (part->partno < disk->minors) { 415bcce3de1STejun Heo *devt = MKDEV(disk->major, disk->first_minor + part->partno); 416bcce3de1STejun Heo return 0; 417bcce3de1STejun Heo } 418bcce3de1STejun Heo 419bcce3de1STejun Heo /* allocate ext devt */ 420bcce3de1STejun Heo do { 421bcce3de1STejun Heo if (!idr_pre_get(&ext_devt_idr, GFP_KERNEL)) 422bcce3de1STejun Heo return -ENOMEM; 423bcce3de1STejun Heo rc = idr_get_new(&ext_devt_idr, part, &idx); 424bcce3de1STejun Heo } while (rc == -EAGAIN); 425bcce3de1STejun Heo 426bcce3de1STejun Heo if (rc) 427bcce3de1STejun Heo return rc; 428bcce3de1STejun Heo 429bcce3de1STejun Heo if (idx > MAX_EXT_DEVT) { 430bcce3de1STejun Heo idr_remove(&ext_devt_idr, idx); 431bcce3de1STejun Heo return -EBUSY; 432bcce3de1STejun Heo } 433bcce3de1STejun Heo 434870d6656STejun Heo *devt = MKDEV(BLOCK_EXT_MAJOR, blk_mangle_minor(idx)); 435bcce3de1STejun Heo return 0; 436bcce3de1STejun Heo } 437bcce3de1STejun Heo 438bcce3de1STejun Heo /** 439bcce3de1STejun Heo * blk_free_devt - free a dev_t 440bcce3de1STejun Heo * @devt: dev_t to free 441bcce3de1STejun Heo * 442bcce3de1STejun Heo * Free @devt which was allocated using blk_alloc_devt(). 443bcce3de1STejun Heo * 444bcce3de1STejun Heo * CONTEXT: 445bcce3de1STejun Heo * Might sleep. 446bcce3de1STejun Heo */ 447bcce3de1STejun Heo void blk_free_devt(dev_t devt) 448bcce3de1STejun Heo { 449bcce3de1STejun Heo might_sleep(); 450bcce3de1STejun Heo 451bcce3de1STejun Heo if (devt == MKDEV(0, 0)) 452bcce3de1STejun Heo return; 453bcce3de1STejun Heo 454bcce3de1STejun Heo if (MAJOR(devt) == BLOCK_EXT_MAJOR) { 455bcce3de1STejun Heo mutex_lock(&ext_devt_mutex); 456870d6656STejun Heo idr_remove(&ext_devt_idr, blk_mangle_minor(MINOR(devt))); 457bcce3de1STejun Heo mutex_unlock(&ext_devt_mutex); 458bcce3de1STejun Heo } 459bcce3de1STejun Heo } 460bcce3de1STejun Heo 4611f014290STejun Heo static char *bdevt_str(dev_t devt, char *buf) 4621f014290STejun Heo { 4631f014290STejun Heo if (MAJOR(devt) <= 0xff && MINOR(devt) <= 0xff) { 4641f014290STejun Heo char tbuf[BDEVT_SIZE]; 4651f014290STejun Heo snprintf(tbuf, BDEVT_SIZE, "%02x%02x", MAJOR(devt), MINOR(devt)); 4661f014290STejun Heo snprintf(buf, BDEVT_SIZE, "%-9s", tbuf); 4671f014290STejun Heo } else 4681f014290STejun Heo snprintf(buf, BDEVT_SIZE, "%03x:%05x", MAJOR(devt), MINOR(devt)); 4691f014290STejun Heo 4701f014290STejun Heo return buf; 4711f014290STejun Heo } 4721f014290STejun Heo 4731da177e4SLinus Torvalds /* 4741da177e4SLinus Torvalds * Register device numbers dev..(dev+range-1) 4751da177e4SLinus Torvalds * range must be nonzero 4761da177e4SLinus Torvalds * The hash chain is sorted on range, so that subranges can override. 4771da177e4SLinus Torvalds */ 478edfaa7c3SKay Sievers void blk_register_region(dev_t devt, unsigned long range, struct module *module, 4791da177e4SLinus Torvalds struct kobject *(*probe)(dev_t, int *, void *), 4801da177e4SLinus Torvalds int (*lock)(dev_t, void *), void *data) 4811da177e4SLinus Torvalds { 482edfaa7c3SKay Sievers kobj_map(bdev_map, devt, range, module, probe, lock, data); 4831da177e4SLinus Torvalds } 4841da177e4SLinus Torvalds 4851da177e4SLinus Torvalds EXPORT_SYMBOL(blk_register_region); 4861da177e4SLinus Torvalds 487edfaa7c3SKay Sievers void blk_unregister_region(dev_t devt, unsigned long range) 4881da177e4SLinus Torvalds { 489edfaa7c3SKay Sievers kobj_unmap(bdev_map, devt, range); 4901da177e4SLinus Torvalds } 4911da177e4SLinus Torvalds 4921da177e4SLinus Torvalds EXPORT_SYMBOL(blk_unregister_region); 4931da177e4SLinus Torvalds 494cf771cb5STejun Heo static struct kobject *exact_match(dev_t devt, int *partno, void *data) 4951da177e4SLinus Torvalds { 4961da177e4SLinus Torvalds struct gendisk *p = data; 497edfaa7c3SKay Sievers 498ed9e1982STejun Heo return &disk_to_dev(p)->kobj; 4991da177e4SLinus Torvalds } 5001da177e4SLinus Torvalds 501edfaa7c3SKay Sievers static int exact_lock(dev_t devt, void *data) 5021da177e4SLinus Torvalds { 5031da177e4SLinus Torvalds struct gendisk *p = data; 5041da177e4SLinus Torvalds 5051da177e4SLinus Torvalds if (!get_disk(p)) 5061da177e4SLinus Torvalds return -1; 5071da177e4SLinus Torvalds return 0; 5081da177e4SLinus Torvalds } 5091da177e4SLinus Torvalds 510d2bf1b67STejun Heo void register_disk(struct gendisk *disk) 511d2bf1b67STejun Heo { 512d2bf1b67STejun Heo struct device *ddev = disk_to_dev(disk); 513d2bf1b67STejun Heo struct block_device *bdev; 514d2bf1b67STejun Heo struct disk_part_iter piter; 515d2bf1b67STejun Heo struct hd_struct *part; 516d2bf1b67STejun Heo int err; 517d2bf1b67STejun Heo 518d2bf1b67STejun Heo ddev->parent = disk->driverfs_dev; 519d2bf1b67STejun Heo 520d2bf1b67STejun Heo dev_set_name(ddev, disk->disk_name); 521d2bf1b67STejun Heo 522d2bf1b67STejun Heo /* delay uevents, until we scanned partition table */ 523d2bf1b67STejun Heo dev_set_uevent_suppress(ddev, 1); 524d2bf1b67STejun Heo 525d2bf1b67STejun Heo if (device_add(ddev)) 526d2bf1b67STejun Heo return; 527d2bf1b67STejun Heo if (!sysfs_deprecated) { 528d2bf1b67STejun Heo err = sysfs_create_link(block_depr, &ddev->kobj, 529d2bf1b67STejun Heo kobject_name(&ddev->kobj)); 530d2bf1b67STejun Heo if (err) { 531d2bf1b67STejun Heo device_del(ddev); 532d2bf1b67STejun Heo return; 533d2bf1b67STejun Heo } 534d2bf1b67STejun Heo } 535d2bf1b67STejun Heo disk->part0.holder_dir = kobject_create_and_add("holders", &ddev->kobj); 536d2bf1b67STejun Heo disk->slave_dir = kobject_create_and_add("slaves", &ddev->kobj); 537d2bf1b67STejun Heo 538d2bf1b67STejun Heo /* No minors to use for partitions */ 539d2bf1b67STejun Heo if (!disk_partitionable(disk)) 540d2bf1b67STejun Heo goto exit; 541d2bf1b67STejun Heo 542d2bf1b67STejun Heo /* No such device (e.g., media were just removed) */ 543d2bf1b67STejun Heo if (!get_capacity(disk)) 544d2bf1b67STejun Heo goto exit; 545d2bf1b67STejun Heo 546d2bf1b67STejun Heo bdev = bdget_disk(disk, 0); 547d2bf1b67STejun Heo if (!bdev) 548d2bf1b67STejun Heo goto exit; 549d2bf1b67STejun Heo 550d2bf1b67STejun Heo bdev->bd_invalidated = 1; 551d2bf1b67STejun Heo err = blkdev_get(bdev, FMODE_READ, NULL); 552d2bf1b67STejun Heo if (err < 0) 553d2bf1b67STejun Heo goto exit; 554d2bf1b67STejun Heo blkdev_put(bdev, FMODE_READ); 555d2bf1b67STejun Heo 556d2bf1b67STejun Heo exit: 557d2bf1b67STejun Heo /* announce disk after possible partitions are created */ 558d2bf1b67STejun Heo dev_set_uevent_suppress(ddev, 0); 559d2bf1b67STejun Heo kobject_uevent(&ddev->kobj, KOBJ_ADD); 560d2bf1b67STejun Heo 561d2bf1b67STejun Heo /* announce possible partitions */ 562d2bf1b67STejun Heo disk_part_iter_init(&piter, disk, 0); 563d2bf1b67STejun Heo while ((part = disk_part_iter_next(&piter))) 564d2bf1b67STejun Heo kobject_uevent(&part_to_dev(part)->kobj, KOBJ_ADD); 565d2bf1b67STejun Heo disk_part_iter_exit(&piter); 566d2bf1b67STejun Heo } 567d2bf1b67STejun Heo 5681da177e4SLinus Torvalds /** 5691da177e4SLinus Torvalds * add_disk - add partitioning information to kernel list 5701da177e4SLinus Torvalds * @disk: per-device partitioning information 5711da177e4SLinus Torvalds * 5721da177e4SLinus Torvalds * This function registers the partitioning information in @disk 5731da177e4SLinus Torvalds * with the kernel. 5743e1a7ff8STejun Heo * 5753e1a7ff8STejun Heo * FIXME: error handling 5761da177e4SLinus Torvalds */ 5771da177e4SLinus Torvalds void add_disk(struct gendisk *disk) 5781da177e4SLinus Torvalds { 579cf0ca9feSPeter Zijlstra struct backing_dev_info *bdi; 5803e1a7ff8STejun Heo dev_t devt; 5816ffeea77SGreg Kroah-Hartman int retval; 582cf0ca9feSPeter Zijlstra 5833e1a7ff8STejun Heo /* minors == 0 indicates to use ext devt from part0 and should 5843e1a7ff8STejun Heo * be accompanied with EXT_DEVT flag. Make sure all 5853e1a7ff8STejun Heo * parameters make sense. 5863e1a7ff8STejun Heo */ 5873e1a7ff8STejun Heo WARN_ON(disk->minors && !(disk->major || disk->first_minor)); 5883e1a7ff8STejun Heo WARN_ON(!disk->minors && !(disk->flags & GENHD_FL_EXT_DEVT)); 5893e1a7ff8STejun Heo 5901da177e4SLinus Torvalds disk->flags |= GENHD_FL_UP; 5913e1a7ff8STejun Heo 5923e1a7ff8STejun Heo retval = blk_alloc_devt(&disk->part0, &devt); 5933e1a7ff8STejun Heo if (retval) { 5943e1a7ff8STejun Heo WARN_ON(1); 5953e1a7ff8STejun Heo return; 5963e1a7ff8STejun Heo } 5973e1a7ff8STejun Heo disk_to_dev(disk)->devt = devt; 5983e1a7ff8STejun Heo 5993e1a7ff8STejun Heo /* ->major and ->first_minor aren't supposed to be 6003e1a7ff8STejun Heo * dereferenced from here on, but set them just in case. 6013e1a7ff8STejun Heo */ 6023e1a7ff8STejun Heo disk->major = MAJOR(devt); 6033e1a7ff8STejun Heo disk->first_minor = MINOR(devt); 6043e1a7ff8STejun Heo 60501ea5063SSigned-off-by: Jan Kara /* Register BDI before referencing it from bdev */ 60601ea5063SSigned-off-by: Jan Kara bdi = &disk->queue->backing_dev_info; 60701ea5063SSigned-off-by: Jan Kara bdi_register_dev(bdi, disk_devt(disk)); 60801ea5063SSigned-off-by: Jan Kara 609f331c029STejun Heo blk_register_region(disk_devt(disk), disk->minors, NULL, 610f331c029STejun Heo exact_match, exact_lock, disk); 6111da177e4SLinus Torvalds register_disk(disk); 6121da177e4SLinus Torvalds blk_register_queue(disk); 613cf0ca9feSPeter Zijlstra 614ed9e1982STejun Heo retval = sysfs_create_link(&disk_to_dev(disk)->kobj, &bdi->dev->kobj, 615ed9e1982STejun Heo "bdi"); 6166ffeea77SGreg Kroah-Hartman WARN_ON(retval); 61777ea887eSTejun Heo 61877ea887eSTejun Heo disk_add_events(disk); 6191da177e4SLinus Torvalds } 6201da177e4SLinus Torvalds EXPORT_SYMBOL(add_disk); 6211da177e4SLinus Torvalds 622d2bf1b67STejun Heo void del_gendisk(struct gendisk *disk) 6231da177e4SLinus Torvalds { 624d2bf1b67STejun Heo struct disk_part_iter piter; 625d2bf1b67STejun Heo struct hd_struct *part; 626d2bf1b67STejun Heo 62777ea887eSTejun Heo disk_del_events(disk); 62877ea887eSTejun Heo 629d2bf1b67STejun Heo /* invalidate stuff */ 630d2bf1b67STejun Heo disk_part_iter_init(&piter, disk, 631d2bf1b67STejun Heo DISK_PITER_INCL_EMPTY | DISK_PITER_REVERSE); 632d2bf1b67STejun Heo while ((part = disk_part_iter_next(&piter))) { 633d2bf1b67STejun Heo invalidate_partition(disk, part->partno); 634d2bf1b67STejun Heo delete_partition(disk, part->partno); 635d2bf1b67STejun Heo } 636d2bf1b67STejun Heo disk_part_iter_exit(&piter); 637d2bf1b67STejun Heo 638d2bf1b67STejun Heo invalidate_partition(disk, 0); 639d2bf1b67STejun Heo blk_free_devt(disk_to_dev(disk)->devt); 640d2bf1b67STejun Heo set_capacity(disk, 0); 641d2bf1b67STejun Heo disk->flags &= ~GENHD_FL_UP; 642d2bf1b67STejun Heo 643ed9e1982STejun Heo sysfs_remove_link(&disk_to_dev(disk)->kobj, "bdi"); 644cf0ca9feSPeter Zijlstra bdi_unregister(&disk->queue->backing_dev_info); 6451da177e4SLinus Torvalds blk_unregister_queue(disk); 646f331c029STejun Heo blk_unregister_region(disk_devt(disk), disk->minors); 647d2bf1b67STejun Heo 648d2bf1b67STejun Heo part_stat_set_all(&disk->part0, 0); 649d2bf1b67STejun Heo disk->part0.stamp = 0; 650d2bf1b67STejun Heo 651d2bf1b67STejun Heo kobject_put(disk->part0.holder_dir); 652d2bf1b67STejun Heo kobject_put(disk->slave_dir); 653d2bf1b67STejun Heo disk->driverfs_dev = NULL; 654d2bf1b67STejun Heo if (!sysfs_deprecated) 655d2bf1b67STejun Heo sysfs_remove_link(block_depr, dev_name(disk_to_dev(disk))); 656d2bf1b67STejun Heo device_del(disk_to_dev(disk)); 6571da177e4SLinus Torvalds } 658d2bf1b67STejun Heo EXPORT_SYMBOL(del_gendisk); 6591da177e4SLinus Torvalds 6601da177e4SLinus Torvalds /** 6611da177e4SLinus Torvalds * get_gendisk - get partitioning information for a given device 662710027a4SRandy Dunlap * @devt: device to get partitioning information for 663496aa8a9SRandy Dunlap * @partno: returned partition index 6641da177e4SLinus Torvalds * 6651da177e4SLinus Torvalds * This function gets the structure containing partitioning 666710027a4SRandy Dunlap * information for the given device @devt. 6671da177e4SLinus Torvalds */ 668cf771cb5STejun Heo struct gendisk *get_gendisk(dev_t devt, int *partno) 6691da177e4SLinus Torvalds { 670bcce3de1STejun Heo struct gendisk *disk = NULL; 671edfaa7c3SKay Sievers 672bcce3de1STejun Heo if (MAJOR(devt) != BLOCK_EXT_MAJOR) { 673bcce3de1STejun Heo struct kobject *kobj; 674bcce3de1STejun Heo 675bcce3de1STejun Heo kobj = kobj_lookup(bdev_map, devt, partno); 676bcce3de1STejun Heo if (kobj) 677bcce3de1STejun Heo disk = dev_to_disk(kobj_to_dev(kobj)); 678bcce3de1STejun Heo } else { 679bcce3de1STejun Heo struct hd_struct *part; 680bcce3de1STejun Heo 681bcce3de1STejun Heo mutex_lock(&ext_devt_mutex); 682870d6656STejun Heo part = idr_find(&ext_devt_idr, blk_mangle_minor(MINOR(devt))); 683bcce3de1STejun Heo if (part && get_disk(part_to_disk(part))) { 684bcce3de1STejun Heo *partno = part->partno; 685bcce3de1STejun Heo disk = part_to_disk(part); 686bcce3de1STejun Heo } 687bcce3de1STejun Heo mutex_unlock(&ext_devt_mutex); 688bcce3de1STejun Heo } 689bcce3de1STejun Heo 690bcce3de1STejun Heo return disk; 6911da177e4SLinus Torvalds } 692b6ac23afSDivyesh Shah EXPORT_SYMBOL(get_gendisk); 6931da177e4SLinus Torvalds 694f331c029STejun Heo /** 695f331c029STejun Heo * bdget_disk - do bdget() by gendisk and partition number 696f331c029STejun Heo * @disk: gendisk of interest 697f331c029STejun Heo * @partno: partition number 698f331c029STejun Heo * 699f331c029STejun Heo * Find partition @partno from @disk, do bdget() on it. 700f331c029STejun Heo * 701f331c029STejun Heo * CONTEXT: 702f331c029STejun Heo * Don't care. 703f331c029STejun Heo * 704f331c029STejun Heo * RETURNS: 705f331c029STejun Heo * Resulting block_device on success, NULL on failure. 706f331c029STejun Heo */ 707aeb3d3a8SHarvey Harrison struct block_device *bdget_disk(struct gendisk *disk, int partno) 708f331c029STejun Heo { 709e71bf0d0STejun Heo struct hd_struct *part; 710548b10ebSTejun Heo struct block_device *bdev = NULL; 711f331c029STejun Heo 712e71bf0d0STejun Heo part = disk_get_part(disk, partno); 7132bbedcb4STejun Heo if (part) 714548b10ebSTejun Heo bdev = bdget(part_devt(part)); 715e71bf0d0STejun Heo disk_put_part(part); 716f331c029STejun Heo 717548b10ebSTejun Heo return bdev; 718f331c029STejun Heo } 719f331c029STejun Heo EXPORT_SYMBOL(bdget_disk); 720f331c029STejun Heo 721dd2a345fSDave Gilbert /* 7225c6f35c5SGreg Kroah-Hartman * print a full list of all partitions - intended for places where the root 7235c6f35c5SGreg Kroah-Hartman * filesystem can't be mounted and thus to give the victim some idea of what 7245c6f35c5SGreg Kroah-Hartman * went wrong 7255c6f35c5SGreg Kroah-Hartman */ 7265c6f35c5SGreg Kroah-Hartman void __init printk_all_partitions(void) 7275c6f35c5SGreg Kroah-Hartman { 728def4e38dSTejun Heo struct class_dev_iter iter; 729def4e38dSTejun Heo struct device *dev; 730def4e38dSTejun Heo 731def4e38dSTejun Heo class_dev_iter_init(&iter, &block_class, NULL, &disk_type); 732def4e38dSTejun Heo while ((dev = class_dev_iter_next(&iter))) { 733def4e38dSTejun Heo struct gendisk *disk = dev_to_disk(dev); 734e71bf0d0STejun Heo struct disk_part_iter piter; 735e71bf0d0STejun Heo struct hd_struct *part; 7361f014290STejun Heo char name_buf[BDEVNAME_SIZE]; 7371f014290STejun Heo char devt_buf[BDEVT_SIZE]; 738b5af921eSWill Drewry u8 uuid[PARTITION_META_INFO_UUIDLTH * 2 + 1]; 739def4e38dSTejun Heo 740def4e38dSTejun Heo /* 741def4e38dSTejun Heo * Don't show empty devices or things that have been 74225985edcSLucas De Marchi * suppressed 743def4e38dSTejun Heo */ 744def4e38dSTejun Heo if (get_capacity(disk) == 0 || 745def4e38dSTejun Heo (disk->flags & GENHD_FL_SUPPRESS_PARTITION_INFO)) 746def4e38dSTejun Heo continue; 747def4e38dSTejun Heo 748def4e38dSTejun Heo /* 749def4e38dSTejun Heo * Note, unlike /proc/partitions, I am showing the 750def4e38dSTejun Heo * numbers in hex - the same format as the root= 751def4e38dSTejun Heo * option takes. 752def4e38dSTejun Heo */ 753074a7acaSTejun Heo disk_part_iter_init(&piter, disk, DISK_PITER_INCL_PART0); 754074a7acaSTejun Heo while ((part = disk_part_iter_next(&piter))) { 755074a7acaSTejun Heo bool is_part0 = part == &disk->part0; 756074a7acaSTejun Heo 757b5af921eSWill Drewry uuid[0] = 0; 758b5af921eSWill Drewry if (part->info) 759b5af921eSWill Drewry part_unpack_uuid(part->info->uuid, uuid); 760b5af921eSWill Drewry 761b5af921eSWill Drewry printk("%s%s %10llu %s %s", is_part0 ? "" : " ", 762074a7acaSTejun Heo bdevt_str(part_devt(part), devt_buf), 763074a7acaSTejun Heo (unsigned long long)part->nr_sects >> 1, 764b5af921eSWill Drewry disk_name(disk, part->partno, name_buf), uuid); 765074a7acaSTejun Heo if (is_part0) { 766def4e38dSTejun Heo if (disk->driverfs_dev != NULL && 767def4e38dSTejun Heo disk->driverfs_dev->driver != NULL) 768def4e38dSTejun Heo printk(" driver: %s\n", 769def4e38dSTejun Heo disk->driverfs_dev->driver->name); 770def4e38dSTejun Heo else 771def4e38dSTejun Heo printk(" (driver?)\n"); 772074a7acaSTejun Heo } else 773074a7acaSTejun Heo printk("\n"); 774074a7acaSTejun Heo } 775e71bf0d0STejun Heo disk_part_iter_exit(&piter); 776def4e38dSTejun Heo } 777def4e38dSTejun Heo class_dev_iter_exit(&iter); 778dd2a345fSDave Gilbert } 779dd2a345fSDave Gilbert 7801da177e4SLinus Torvalds #ifdef CONFIG_PROC_FS 7811da177e4SLinus Torvalds /* iterator */ 782def4e38dSTejun Heo static void *disk_seqf_start(struct seq_file *seqf, loff_t *pos) 78368c4d4a7SGreg Kroah-Hartman { 784def4e38dSTejun Heo loff_t skip = *pos; 785def4e38dSTejun Heo struct class_dev_iter *iter; 786def4e38dSTejun Heo struct device *dev; 78768c4d4a7SGreg Kroah-Hartman 788aeb3d3a8SHarvey Harrison iter = kmalloc(sizeof(*iter), GFP_KERNEL); 789def4e38dSTejun Heo if (!iter) 790def4e38dSTejun Heo return ERR_PTR(-ENOMEM); 791def4e38dSTejun Heo 792def4e38dSTejun Heo seqf->private = iter; 793def4e38dSTejun Heo class_dev_iter_init(iter, &block_class, NULL, &disk_type); 794def4e38dSTejun Heo do { 795def4e38dSTejun Heo dev = class_dev_iter_next(iter); 796def4e38dSTejun Heo if (!dev) 797def4e38dSTejun Heo return NULL; 798def4e38dSTejun Heo } while (skip--); 799def4e38dSTejun Heo 800def4e38dSTejun Heo return dev_to_disk(dev); 80168c4d4a7SGreg Kroah-Hartman } 80268c4d4a7SGreg Kroah-Hartman 803def4e38dSTejun Heo static void *disk_seqf_next(struct seq_file *seqf, void *v, loff_t *pos) 8041da177e4SLinus Torvalds { 805edfaa7c3SKay Sievers struct device *dev; 80666c64afeSGreg Kroah-Hartman 807def4e38dSTejun Heo (*pos)++; 808def4e38dSTejun Heo dev = class_dev_iter_next(seqf->private); 8092ac3cee5STejun Heo if (dev) 810edfaa7c3SKay Sievers return dev_to_disk(dev); 8112ac3cee5STejun Heo 8121da177e4SLinus Torvalds return NULL; 8131da177e4SLinus Torvalds } 8141da177e4SLinus Torvalds 815def4e38dSTejun Heo static void disk_seqf_stop(struct seq_file *seqf, void *v) 81627f30251SGreg Kroah-Hartman { 817def4e38dSTejun Heo struct class_dev_iter *iter = seqf->private; 818def4e38dSTejun Heo 819def4e38dSTejun Heo /* stop is called even after start failed :-( */ 820def4e38dSTejun Heo if (iter) { 821def4e38dSTejun Heo class_dev_iter_exit(iter); 822def4e38dSTejun Heo kfree(iter); 823def4e38dSTejun Heo } 82427f30251SGreg Kroah-Hartman } 82527f30251SGreg Kroah-Hartman 826def4e38dSTejun Heo static void *show_partition_start(struct seq_file *seqf, loff_t *pos) 8271da177e4SLinus Torvalds { 828def4e38dSTejun Heo static void *p; 8291da177e4SLinus Torvalds 830def4e38dSTejun Heo p = disk_seqf_start(seqf, pos); 831b9f985b6SYang Zhang if (!IS_ERR_OR_NULL(p) && !*pos) 832def4e38dSTejun Heo seq_puts(seqf, "major minor #blocks name\n\n"); 833def4e38dSTejun Heo return p; 8341da177e4SLinus Torvalds } 8351da177e4SLinus Torvalds 836cf771cb5STejun Heo static int show_partition(struct seq_file *seqf, void *v) 8371da177e4SLinus Torvalds { 8381da177e4SLinus Torvalds struct gendisk *sgp = v; 839e71bf0d0STejun Heo struct disk_part_iter piter; 840e71bf0d0STejun Heo struct hd_struct *part; 8411da177e4SLinus Torvalds char buf[BDEVNAME_SIZE]; 8421da177e4SLinus Torvalds 8431da177e4SLinus Torvalds /* Don't show non-partitionable removeable devices or empty devices */ 844b5d0b9dfSTejun Heo if (!get_capacity(sgp) || (!disk_partitionable(sgp) && 845f331c029STejun Heo (sgp->flags & GENHD_FL_REMOVABLE))) 8461da177e4SLinus Torvalds return 0; 8471da177e4SLinus Torvalds if (sgp->flags & GENHD_FL_SUPPRESS_PARTITION_INFO) 8481da177e4SLinus Torvalds return 0; 8491da177e4SLinus Torvalds 8501da177e4SLinus Torvalds /* show the full disk and all non-0 size partitions of it */ 851074a7acaSTejun Heo disk_part_iter_init(&piter, sgp, DISK_PITER_INCL_PART0); 852e71bf0d0STejun Heo while ((part = disk_part_iter_next(&piter))) 8531f014290STejun Heo seq_printf(seqf, "%4d %7d %10llu %s\n", 854f331c029STejun Heo MAJOR(part_devt(part)), MINOR(part_devt(part)), 855f331c029STejun Heo (unsigned long long)part->nr_sects >> 1, 856f331c029STejun Heo disk_name(sgp, part->partno, buf)); 857e71bf0d0STejun Heo disk_part_iter_exit(&piter); 8581da177e4SLinus Torvalds 8591da177e4SLinus Torvalds return 0; 8601da177e4SLinus Torvalds } 8611da177e4SLinus Torvalds 862f500975aSAlexey Dobriyan static const struct seq_operations partitions_op = { 863def4e38dSTejun Heo .start = show_partition_start, 864def4e38dSTejun Heo .next = disk_seqf_next, 865def4e38dSTejun Heo .stop = disk_seqf_stop, 8661da177e4SLinus Torvalds .show = show_partition 8671da177e4SLinus Torvalds }; 868f500975aSAlexey Dobriyan 869f500975aSAlexey Dobriyan static int partitions_open(struct inode *inode, struct file *file) 870f500975aSAlexey Dobriyan { 871f500975aSAlexey Dobriyan return seq_open(file, &partitions_op); 872f500975aSAlexey Dobriyan } 873f500975aSAlexey Dobriyan 874f500975aSAlexey Dobriyan static const struct file_operations proc_partitions_operations = { 875f500975aSAlexey Dobriyan .open = partitions_open, 876f500975aSAlexey Dobriyan .read = seq_read, 877f500975aSAlexey Dobriyan .llseek = seq_lseek, 878f500975aSAlexey Dobriyan .release = seq_release, 879f500975aSAlexey Dobriyan }; 8801da177e4SLinus Torvalds #endif 8811da177e4SLinus Torvalds 8821da177e4SLinus Torvalds 883cf771cb5STejun Heo static struct kobject *base_probe(dev_t devt, int *partno, void *data) 8841da177e4SLinus Torvalds { 885edfaa7c3SKay Sievers if (request_module("block-major-%d-%d", MAJOR(devt), MINOR(devt)) > 0) 8861da177e4SLinus Torvalds /* Make old-style 2.4 aliases work */ 887edfaa7c3SKay Sievers request_module("block-major-%d", MAJOR(devt)); 8881da177e4SLinus Torvalds return NULL; 8891da177e4SLinus Torvalds } 8901da177e4SLinus Torvalds 8911da177e4SLinus Torvalds static int __init genhd_device_init(void) 8921da177e4SLinus Torvalds { 893e105b8bfSDan Williams int error; 894e105b8bfSDan Williams 895e105b8bfSDan Williams block_class.dev_kobj = sysfs_dev_block_kobj; 896e105b8bfSDan Williams error = class_register(&block_class); 897ee27a558SRoland McGrath if (unlikely(error)) 898ee27a558SRoland McGrath return error; 899edfaa7c3SKay Sievers bdev_map = kobj_map_init(base_probe, &block_class_lock); 9001da177e4SLinus Torvalds blk_dev_init(); 901edfaa7c3SKay Sievers 902561ec68eSZhang, Yanmin register_blkdev(BLOCK_EXT_MAJOR, "blkext"); 903561ec68eSZhang, Yanmin 904edfaa7c3SKay Sievers /* create top-level block dir */ 905e52eec13SAndi Kleen if (!sysfs_deprecated) 906edfaa7c3SKay Sievers block_depr = kobject_create_and_add("block", NULL); 907830d3cfbSGreg Kroah-Hartman return 0; 9081da177e4SLinus Torvalds } 9091da177e4SLinus Torvalds 9101da177e4SLinus Torvalds subsys_initcall(genhd_device_init); 9111da177e4SLinus Torvalds 912edfaa7c3SKay Sievers static ssize_t disk_range_show(struct device *dev, 913edfaa7c3SKay Sievers struct device_attribute *attr, char *buf) 9141da177e4SLinus Torvalds { 915edfaa7c3SKay Sievers struct gendisk *disk = dev_to_disk(dev); 9161da177e4SLinus Torvalds 917edfaa7c3SKay Sievers return sprintf(buf, "%d\n", disk->minors); 9181da177e4SLinus Torvalds } 9191da177e4SLinus Torvalds 9201f014290STejun Heo static ssize_t disk_ext_range_show(struct device *dev, 9211f014290STejun Heo struct device_attribute *attr, char *buf) 9221f014290STejun Heo { 9231f014290STejun Heo struct gendisk *disk = dev_to_disk(dev); 9241f014290STejun Heo 925b5d0b9dfSTejun Heo return sprintf(buf, "%d\n", disk_max_parts(disk)); 9261f014290STejun Heo } 9271f014290STejun Heo 928edfaa7c3SKay Sievers static ssize_t disk_removable_show(struct device *dev, 929edfaa7c3SKay Sievers struct device_attribute *attr, char *buf) 930a7fd6706SKay Sievers { 931edfaa7c3SKay Sievers struct gendisk *disk = dev_to_disk(dev); 932a7fd6706SKay Sievers 933edfaa7c3SKay Sievers return sprintf(buf, "%d\n", 9341da177e4SLinus Torvalds (disk->flags & GENHD_FL_REMOVABLE ? 1 : 0)); 935edfaa7c3SKay Sievers } 9361da177e4SLinus Torvalds 9371c9ce527SKay Sievers static ssize_t disk_ro_show(struct device *dev, 9381c9ce527SKay Sievers struct device_attribute *attr, char *buf) 9391c9ce527SKay Sievers { 9401c9ce527SKay Sievers struct gendisk *disk = dev_to_disk(dev); 9411c9ce527SKay Sievers 942b7db9956STejun Heo return sprintf(buf, "%d\n", get_disk_ro(disk) ? 1 : 0); 9431c9ce527SKay Sievers } 9441c9ce527SKay Sievers 945edfaa7c3SKay Sievers static ssize_t disk_capability_show(struct device *dev, 946edfaa7c3SKay Sievers struct device_attribute *attr, char *buf) 94786ce18d7SKristen Carlson Accardi { 948edfaa7c3SKay Sievers struct gendisk *disk = dev_to_disk(dev); 949edfaa7c3SKay Sievers 950edfaa7c3SKay Sievers return sprintf(buf, "%x\n", disk->flags); 95186ce18d7SKristen Carlson Accardi } 952edfaa7c3SKay Sievers 953c72758f3SMartin K. Petersen static ssize_t disk_alignment_offset_show(struct device *dev, 954c72758f3SMartin K. Petersen struct device_attribute *attr, 955c72758f3SMartin K. Petersen char *buf) 956c72758f3SMartin K. Petersen { 957c72758f3SMartin K. Petersen struct gendisk *disk = dev_to_disk(dev); 958c72758f3SMartin K. Petersen 959c72758f3SMartin K. Petersen return sprintf(buf, "%d\n", queue_alignment_offset(disk->queue)); 960c72758f3SMartin K. Petersen } 961c72758f3SMartin K. Petersen 96286b37281SMartin K. Petersen static ssize_t disk_discard_alignment_show(struct device *dev, 96386b37281SMartin K. Petersen struct device_attribute *attr, 96486b37281SMartin K. Petersen char *buf) 96586b37281SMartin K. Petersen { 96686b37281SMartin K. Petersen struct gendisk *disk = dev_to_disk(dev); 96786b37281SMartin K. Petersen 968dd3d145dSMartin K. Petersen return sprintf(buf, "%d\n", queue_discard_alignment(disk->queue)); 96986b37281SMartin K. Petersen } 97086b37281SMartin K. Petersen 971edfaa7c3SKay Sievers static DEVICE_ATTR(range, S_IRUGO, disk_range_show, NULL); 9721f014290STejun Heo static DEVICE_ATTR(ext_range, S_IRUGO, disk_ext_range_show, NULL); 973edfaa7c3SKay Sievers static DEVICE_ATTR(removable, S_IRUGO, disk_removable_show, NULL); 9741c9ce527SKay Sievers static DEVICE_ATTR(ro, S_IRUGO, disk_ro_show, NULL); 975e5610521STejun Heo static DEVICE_ATTR(size, S_IRUGO, part_size_show, NULL); 976c72758f3SMartin K. Petersen static DEVICE_ATTR(alignment_offset, S_IRUGO, disk_alignment_offset_show, NULL); 97786b37281SMartin K. Petersen static DEVICE_ATTR(discard_alignment, S_IRUGO, disk_discard_alignment_show, 97886b37281SMartin K. Petersen NULL); 979edfaa7c3SKay Sievers static DEVICE_ATTR(capability, S_IRUGO, disk_capability_show, NULL); 980074a7acaSTejun Heo static DEVICE_ATTR(stat, S_IRUGO, part_stat_show, NULL); 981316d315bSNikanth Karthikesan static DEVICE_ATTR(inflight, S_IRUGO, part_inflight_show, NULL); 982c17bb495SAkinobu Mita #ifdef CONFIG_FAIL_MAKE_REQUEST 983edfaa7c3SKay Sievers static struct device_attribute dev_attr_fail = 984eddb2e26STejun Heo __ATTR(make-it-fail, S_IRUGO|S_IWUSR, part_fail_show, part_fail_store); 985c17bb495SAkinobu Mita #endif 986581d4e28SJens Axboe #ifdef CONFIG_FAIL_IO_TIMEOUT 987581d4e28SJens Axboe static struct device_attribute dev_attr_fail_timeout = 988581d4e28SJens Axboe __ATTR(io-timeout-fail, S_IRUGO|S_IWUSR, part_timeout_show, 989581d4e28SJens Axboe part_timeout_store); 990581d4e28SJens Axboe #endif 991edfaa7c3SKay Sievers 992edfaa7c3SKay Sievers static struct attribute *disk_attrs[] = { 993edfaa7c3SKay Sievers &dev_attr_range.attr, 9941f014290STejun Heo &dev_attr_ext_range.attr, 995edfaa7c3SKay Sievers &dev_attr_removable.attr, 9961c9ce527SKay Sievers &dev_attr_ro.attr, 997edfaa7c3SKay Sievers &dev_attr_size.attr, 998c72758f3SMartin K. Petersen &dev_attr_alignment_offset.attr, 99986b37281SMartin K. Petersen &dev_attr_discard_alignment.attr, 1000edfaa7c3SKay Sievers &dev_attr_capability.attr, 1001edfaa7c3SKay Sievers &dev_attr_stat.attr, 1002316d315bSNikanth Karthikesan &dev_attr_inflight.attr, 1003edfaa7c3SKay Sievers #ifdef CONFIG_FAIL_MAKE_REQUEST 1004edfaa7c3SKay Sievers &dev_attr_fail.attr, 1005edfaa7c3SKay Sievers #endif 1006581d4e28SJens Axboe #ifdef CONFIG_FAIL_IO_TIMEOUT 1007581d4e28SJens Axboe &dev_attr_fail_timeout.attr, 1008581d4e28SJens Axboe #endif 1009edfaa7c3SKay Sievers NULL 10101da177e4SLinus Torvalds }; 10111da177e4SLinus Torvalds 1012edfaa7c3SKay Sievers static struct attribute_group disk_attr_group = { 1013edfaa7c3SKay Sievers .attrs = disk_attrs, 1014edfaa7c3SKay Sievers }; 1015edfaa7c3SKay Sievers 1016a4dbd674SDavid Brownell static const struct attribute_group *disk_attr_groups[] = { 1017edfaa7c3SKay Sievers &disk_attr_group, 1018edfaa7c3SKay Sievers NULL 1019edfaa7c3SKay Sievers }; 1020edfaa7c3SKay Sievers 1021540eed56STejun Heo static void disk_free_ptbl_rcu_cb(struct rcu_head *head) 1022540eed56STejun Heo { 1023540eed56STejun Heo struct disk_part_tbl *ptbl = 1024540eed56STejun Heo container_of(head, struct disk_part_tbl, rcu_head); 1025540eed56STejun Heo 1026540eed56STejun Heo kfree(ptbl); 1027540eed56STejun Heo } 1028540eed56STejun Heo 1029540eed56STejun Heo /** 1030540eed56STejun Heo * disk_replace_part_tbl - replace disk->part_tbl in RCU-safe way 1031540eed56STejun Heo * @disk: disk to replace part_tbl for 1032540eed56STejun Heo * @new_ptbl: new part_tbl to install 1033540eed56STejun Heo * 1034540eed56STejun Heo * Replace disk->part_tbl with @new_ptbl in RCU-safe way. The 1035540eed56STejun Heo * original ptbl is freed using RCU callback. 1036540eed56STejun Heo * 1037540eed56STejun Heo * LOCKING: 1038540eed56STejun Heo * Matching bd_mutx locked. 1039540eed56STejun Heo */ 1040540eed56STejun Heo static void disk_replace_part_tbl(struct gendisk *disk, 1041540eed56STejun Heo struct disk_part_tbl *new_ptbl) 1042540eed56STejun Heo { 1043540eed56STejun Heo struct disk_part_tbl *old_ptbl = disk->part_tbl; 1044540eed56STejun Heo 1045540eed56STejun Heo rcu_assign_pointer(disk->part_tbl, new_ptbl); 1046a6f23657SJens Axboe 1047a6f23657SJens Axboe if (old_ptbl) { 1048a6f23657SJens Axboe rcu_assign_pointer(old_ptbl->last_lookup, NULL); 1049540eed56STejun Heo call_rcu(&old_ptbl->rcu_head, disk_free_ptbl_rcu_cb); 1050540eed56STejun Heo } 1051a6f23657SJens Axboe } 1052540eed56STejun Heo 1053540eed56STejun Heo /** 1054540eed56STejun Heo * disk_expand_part_tbl - expand disk->part_tbl 1055540eed56STejun Heo * @disk: disk to expand part_tbl for 1056540eed56STejun Heo * @partno: expand such that this partno can fit in 1057540eed56STejun Heo * 1058540eed56STejun Heo * Expand disk->part_tbl such that @partno can fit in. disk->part_tbl 1059540eed56STejun Heo * uses RCU to allow unlocked dereferencing for stats and other stuff. 1060540eed56STejun Heo * 1061540eed56STejun Heo * LOCKING: 1062540eed56STejun Heo * Matching bd_mutex locked, might sleep. 1063540eed56STejun Heo * 1064540eed56STejun Heo * RETURNS: 1065540eed56STejun Heo * 0 on success, -errno on failure. 1066540eed56STejun Heo */ 1067540eed56STejun Heo int disk_expand_part_tbl(struct gendisk *disk, int partno) 1068540eed56STejun Heo { 1069540eed56STejun Heo struct disk_part_tbl *old_ptbl = disk->part_tbl; 1070540eed56STejun Heo struct disk_part_tbl *new_ptbl; 1071540eed56STejun Heo int len = old_ptbl ? old_ptbl->len : 0; 1072540eed56STejun Heo int target = partno + 1; 1073540eed56STejun Heo size_t size; 1074540eed56STejun Heo int i; 1075540eed56STejun Heo 1076540eed56STejun Heo /* disk_max_parts() is zero during initialization, ignore if so */ 1077540eed56STejun Heo if (disk_max_parts(disk) && target > disk_max_parts(disk)) 1078540eed56STejun Heo return -EINVAL; 1079540eed56STejun Heo 1080540eed56STejun Heo if (target <= len) 1081540eed56STejun Heo return 0; 1082540eed56STejun Heo 1083540eed56STejun Heo size = sizeof(*new_ptbl) + target * sizeof(new_ptbl->part[0]); 1084540eed56STejun Heo new_ptbl = kzalloc_node(size, GFP_KERNEL, disk->node_id); 1085540eed56STejun Heo if (!new_ptbl) 1086540eed56STejun Heo return -ENOMEM; 1087540eed56STejun Heo 1088540eed56STejun Heo new_ptbl->len = target; 1089540eed56STejun Heo 1090540eed56STejun Heo for (i = 0; i < len; i++) 1091540eed56STejun Heo rcu_assign_pointer(new_ptbl->part[i], old_ptbl->part[i]); 1092540eed56STejun Heo 1093540eed56STejun Heo disk_replace_part_tbl(disk, new_ptbl); 1094540eed56STejun Heo return 0; 1095540eed56STejun Heo } 1096540eed56STejun Heo 1097edfaa7c3SKay Sievers static void disk_release(struct device *dev) 10981da177e4SLinus Torvalds { 1099edfaa7c3SKay Sievers struct gendisk *disk = dev_to_disk(dev); 1100edfaa7c3SKay Sievers 110177ea887eSTejun Heo disk_release_events(disk); 11021da177e4SLinus Torvalds kfree(disk->random); 1103540eed56STejun Heo disk_replace_part_tbl(disk, NULL); 1104074a7acaSTejun Heo free_part_stats(&disk->part0); 11056d1d8050SWill Drewry free_part_info(&disk->part0); 11061da177e4SLinus Torvalds kfree(disk); 11071da177e4SLinus Torvalds } 1108edfaa7c3SKay Sievers struct class block_class = { 1109edfaa7c3SKay Sievers .name = "block", 11101da177e4SLinus Torvalds }; 11111da177e4SLinus Torvalds 1112e454cea2SKay Sievers static char *block_devnode(struct device *dev, mode_t *mode) 1113b03f38b6SKay Sievers { 1114b03f38b6SKay Sievers struct gendisk *disk = dev_to_disk(dev); 1115b03f38b6SKay Sievers 1116e454cea2SKay Sievers if (disk->devnode) 1117e454cea2SKay Sievers return disk->devnode(disk, mode); 1118b03f38b6SKay Sievers return NULL; 1119b03f38b6SKay Sievers } 1120b03f38b6SKay Sievers 11211826eadfSAdrian Bunk static struct device_type disk_type = { 1122edfaa7c3SKay Sievers .name = "disk", 1123edfaa7c3SKay Sievers .groups = disk_attr_groups, 1124edfaa7c3SKay Sievers .release = disk_release, 1125e454cea2SKay Sievers .devnode = block_devnode, 11261da177e4SLinus Torvalds }; 11271da177e4SLinus Torvalds 1128a6e2ba88SRandy Dunlap #ifdef CONFIG_PROC_FS 1129cf771cb5STejun Heo /* 1130cf771cb5STejun Heo * aggregate disk stat collector. Uses the same stats that the sysfs 1131cf771cb5STejun Heo * entries do, above, but makes them available through one seq_file. 1132cf771cb5STejun Heo * 1133cf771cb5STejun Heo * The output looks suspiciously like /proc/partitions with a bunch of 1134cf771cb5STejun Heo * extra fields. 1135cf771cb5STejun Heo */ 1136cf771cb5STejun Heo static int diskstats_show(struct seq_file *seqf, void *v) 11371da177e4SLinus Torvalds { 11381da177e4SLinus Torvalds struct gendisk *gp = v; 1139e71bf0d0STejun Heo struct disk_part_iter piter; 1140e71bf0d0STejun Heo struct hd_struct *hd; 11411da177e4SLinus Torvalds char buf[BDEVNAME_SIZE]; 1142c9959059STejun Heo int cpu; 11431da177e4SLinus Torvalds 11441da177e4SLinus Torvalds /* 1145ed9e1982STejun Heo if (&disk_to_dev(gp)->kobj.entry == block_class.devices.next) 1146cf771cb5STejun Heo seq_puts(seqf, "major minor name" 11471da177e4SLinus Torvalds " rio rmerge rsect ruse wio wmerge " 11481da177e4SLinus Torvalds "wsect wuse running use aveq" 11491da177e4SLinus Torvalds "\n\n"); 11501da177e4SLinus Torvalds */ 11511da177e4SLinus Torvalds 115271982a40STejun Heo disk_part_iter_init(&piter, gp, DISK_PITER_INCL_EMPTY_PART0); 1153e71bf0d0STejun Heo while ((hd = disk_part_iter_next(&piter))) { 1154074a7acaSTejun Heo cpu = part_stat_lock(); 1155c9959059STejun Heo part_round_stats(cpu, hd); 1156074a7acaSTejun Heo part_stat_unlock(); 11571f014290STejun Heo seq_printf(seqf, "%4d %7d %s %lu %lu %llu " 115828f39d55SJerome Marchand "%u %lu %lu %llu %u %u %u %u\n", 1159f331c029STejun Heo MAJOR(part_devt(hd)), MINOR(part_devt(hd)), 1160f331c029STejun Heo disk_name(gp, hd->partno, buf), 116153f22956SLiu Yuan part_stat_read(hd, ios[READ]), 116253f22956SLiu Yuan part_stat_read(hd, merges[READ]), 116353f22956SLiu Yuan (unsigned long long)part_stat_read(hd, sectors[READ]), 116453f22956SLiu Yuan jiffies_to_msecs(part_stat_read(hd, ticks[READ])), 116553f22956SLiu Yuan part_stat_read(hd, ios[WRITE]), 116653f22956SLiu Yuan part_stat_read(hd, merges[WRITE]), 116753f22956SLiu Yuan (unsigned long long)part_stat_read(hd, sectors[WRITE]), 116853f22956SLiu Yuan jiffies_to_msecs(part_stat_read(hd, ticks[WRITE])), 1169316d315bSNikanth Karthikesan part_in_flight(hd), 117028f39d55SJerome Marchand jiffies_to_msecs(part_stat_read(hd, io_ticks)), 117128f39d55SJerome Marchand jiffies_to_msecs(part_stat_read(hd, time_in_queue)) 117228f39d55SJerome Marchand ); 11731da177e4SLinus Torvalds } 1174e71bf0d0STejun Heo disk_part_iter_exit(&piter); 11751da177e4SLinus Torvalds 11761da177e4SLinus Torvalds return 0; 11771da177e4SLinus Torvalds } 11781da177e4SLinus Torvalds 117931d85ab2SAlexey Dobriyan static const struct seq_operations diskstats_op = { 1180def4e38dSTejun Heo .start = disk_seqf_start, 1181def4e38dSTejun Heo .next = disk_seqf_next, 1182def4e38dSTejun Heo .stop = disk_seqf_stop, 11831da177e4SLinus Torvalds .show = diskstats_show 11841da177e4SLinus Torvalds }; 1185f500975aSAlexey Dobriyan 118631d85ab2SAlexey Dobriyan static int diskstats_open(struct inode *inode, struct file *file) 118731d85ab2SAlexey Dobriyan { 118831d85ab2SAlexey Dobriyan return seq_open(file, &diskstats_op); 118931d85ab2SAlexey Dobriyan } 119031d85ab2SAlexey Dobriyan 119131d85ab2SAlexey Dobriyan static const struct file_operations proc_diskstats_operations = { 119231d85ab2SAlexey Dobriyan .open = diskstats_open, 119331d85ab2SAlexey Dobriyan .read = seq_read, 119431d85ab2SAlexey Dobriyan .llseek = seq_lseek, 119531d85ab2SAlexey Dobriyan .release = seq_release, 119631d85ab2SAlexey Dobriyan }; 119731d85ab2SAlexey Dobriyan 1198f500975aSAlexey Dobriyan static int __init proc_genhd_init(void) 1199f500975aSAlexey Dobriyan { 120031d85ab2SAlexey Dobriyan proc_create("diskstats", 0, NULL, &proc_diskstats_operations); 1201f500975aSAlexey Dobriyan proc_create("partitions", 0, NULL, &proc_partitions_operations); 1202f500975aSAlexey Dobriyan return 0; 1203f500975aSAlexey Dobriyan } 1204f500975aSAlexey Dobriyan module_init(proc_genhd_init); 1205a6e2ba88SRandy Dunlap #endif /* CONFIG_PROC_FS */ 12061da177e4SLinus Torvalds 1207cf771cb5STejun Heo dev_t blk_lookup_devt(const char *name, int partno) 1208edfaa7c3SKay Sievers { 1209edfaa7c3SKay Sievers dev_t devt = MKDEV(0, 0); 1210def4e38dSTejun Heo struct class_dev_iter iter; 1211def4e38dSTejun Heo struct device *dev; 1212edfaa7c3SKay Sievers 1213def4e38dSTejun Heo class_dev_iter_init(&iter, &block_class, NULL, &disk_type); 1214def4e38dSTejun Heo while ((dev = class_dev_iter_next(&iter))) { 1215def4e38dSTejun Heo struct gendisk *disk = dev_to_disk(dev); 1216548b10ebSTejun Heo struct hd_struct *part; 1217def4e38dSTejun Heo 12183ada8b7eSKay Sievers if (strcmp(dev_name(dev), name)) 1219f331c029STejun Heo continue; 1220f331c029STejun Heo 122141b8c853SNeil Brown if (partno < disk->minors) { 122241b8c853SNeil Brown /* We need to return the right devno, even 122341b8c853SNeil Brown * if the partition doesn't exist yet. 122441b8c853SNeil Brown */ 122541b8c853SNeil Brown devt = MKDEV(MAJOR(dev->devt), 122641b8c853SNeil Brown MINOR(dev->devt) + partno); 122741b8c853SNeil Brown break; 122841b8c853SNeil Brown } 1229e71bf0d0STejun Heo part = disk_get_part(disk, partno); 12302bbedcb4STejun Heo if (part) { 1231f331c029STejun Heo devt = part_devt(part); 1232e71bf0d0STejun Heo disk_put_part(part); 1233f331c029STejun Heo break; 1234def4e38dSTejun Heo } 1235548b10ebSTejun Heo disk_put_part(part); 1236548b10ebSTejun Heo } 1237def4e38dSTejun Heo class_dev_iter_exit(&iter); 1238edfaa7c3SKay Sievers return devt; 1239edfaa7c3SKay Sievers } 1240edfaa7c3SKay Sievers EXPORT_SYMBOL(blk_lookup_devt); 1241edfaa7c3SKay Sievers 12421da177e4SLinus Torvalds struct gendisk *alloc_disk(int minors) 12431da177e4SLinus Torvalds { 12441946089aSChristoph Lameter return alloc_disk_node(minors, -1); 12451946089aSChristoph Lameter } 1246689d6facSTejun Heo EXPORT_SYMBOL(alloc_disk); 12471946089aSChristoph Lameter 12481946089aSChristoph Lameter struct gendisk *alloc_disk_node(int minors, int node_id) 12491946089aSChristoph Lameter { 12501946089aSChristoph Lameter struct gendisk *disk; 12511946089aSChristoph Lameter 125294f6030cSChristoph Lameter disk = kmalloc_node(sizeof(struct gendisk), 125394f6030cSChristoph Lameter GFP_KERNEL | __GFP_ZERO, node_id); 12541da177e4SLinus Torvalds if (disk) { 1255074a7acaSTejun Heo if (!init_part_stats(&disk->part0)) { 12561da177e4SLinus Torvalds kfree(disk); 12571da177e4SLinus Torvalds return NULL; 12581da177e4SLinus Torvalds } 1259bf91db18SCheng Renquan disk->node_id = node_id; 1260540eed56STejun Heo if (disk_expand_part_tbl(disk, 0)) { 1261074a7acaSTejun Heo free_part_stats(&disk->part0); 12621da177e4SLinus Torvalds kfree(disk); 12631da177e4SLinus Torvalds return NULL; 12641da177e4SLinus Torvalds } 1265540eed56STejun Heo disk->part_tbl->part[0] = &disk->part0; 12666c23a968SJens Axboe 12676c23a968SJens Axboe hd_ref_init(&disk->part0); 1268b5d0b9dfSTejun Heo 12691da177e4SLinus Torvalds disk->minors = minors; 12701da177e4SLinus Torvalds rand_initialize_disk(disk); 1271ed9e1982STejun Heo disk_to_dev(disk)->class = &block_class; 1272ed9e1982STejun Heo disk_to_dev(disk)->type = &disk_type; 1273ed9e1982STejun Heo device_initialize(disk_to_dev(disk)); 12741da177e4SLinus Torvalds } 12751da177e4SLinus Torvalds return disk; 12761da177e4SLinus Torvalds } 12771946089aSChristoph Lameter EXPORT_SYMBOL(alloc_disk_node); 12781da177e4SLinus Torvalds 12791da177e4SLinus Torvalds struct kobject *get_disk(struct gendisk *disk) 12801da177e4SLinus Torvalds { 12811da177e4SLinus Torvalds struct module *owner; 12821da177e4SLinus Torvalds struct kobject *kobj; 12831da177e4SLinus Torvalds 12841da177e4SLinus Torvalds if (!disk->fops) 12851da177e4SLinus Torvalds return NULL; 12861da177e4SLinus Torvalds owner = disk->fops->owner; 12871da177e4SLinus Torvalds if (owner && !try_module_get(owner)) 12881da177e4SLinus Torvalds return NULL; 1289ed9e1982STejun Heo kobj = kobject_get(&disk_to_dev(disk)->kobj); 12901da177e4SLinus Torvalds if (kobj == NULL) { 12911da177e4SLinus Torvalds module_put(owner); 12921da177e4SLinus Torvalds return NULL; 12931da177e4SLinus Torvalds } 12941da177e4SLinus Torvalds return kobj; 12951da177e4SLinus Torvalds 12961da177e4SLinus Torvalds } 12971da177e4SLinus Torvalds 12981da177e4SLinus Torvalds EXPORT_SYMBOL(get_disk); 12991da177e4SLinus Torvalds 13001da177e4SLinus Torvalds void put_disk(struct gendisk *disk) 13011da177e4SLinus Torvalds { 13021da177e4SLinus Torvalds if (disk) 1303ed9e1982STejun Heo kobject_put(&disk_to_dev(disk)->kobj); 13041da177e4SLinus Torvalds } 13051da177e4SLinus Torvalds 13061da177e4SLinus Torvalds EXPORT_SYMBOL(put_disk); 13071da177e4SLinus Torvalds 1308e3264a4dSHannes Reinecke static void set_disk_ro_uevent(struct gendisk *gd, int ro) 1309e3264a4dSHannes Reinecke { 1310e3264a4dSHannes Reinecke char event[] = "DISK_RO=1"; 1311e3264a4dSHannes Reinecke char *envp[] = { event, NULL }; 1312e3264a4dSHannes Reinecke 1313e3264a4dSHannes Reinecke if (!ro) 1314e3264a4dSHannes Reinecke event[8] = '0'; 1315e3264a4dSHannes Reinecke kobject_uevent_env(&disk_to_dev(gd)->kobj, KOBJ_CHANGE, envp); 1316e3264a4dSHannes Reinecke } 1317e3264a4dSHannes Reinecke 13181da177e4SLinus Torvalds void set_device_ro(struct block_device *bdev, int flag) 13191da177e4SLinus Torvalds { 13201da177e4SLinus Torvalds bdev->bd_part->policy = flag; 13211da177e4SLinus Torvalds } 13221da177e4SLinus Torvalds 13231da177e4SLinus Torvalds EXPORT_SYMBOL(set_device_ro); 13241da177e4SLinus Torvalds 13251da177e4SLinus Torvalds void set_disk_ro(struct gendisk *disk, int flag) 13261da177e4SLinus Torvalds { 1327e71bf0d0STejun Heo struct disk_part_iter piter; 1328e71bf0d0STejun Heo struct hd_struct *part; 1329e71bf0d0STejun Heo 1330e3264a4dSHannes Reinecke if (disk->part0.policy != flag) { 1331e3264a4dSHannes Reinecke set_disk_ro_uevent(disk, flag); 1332e3264a4dSHannes Reinecke disk->part0.policy = flag; 1333e3264a4dSHannes Reinecke } 1334e3264a4dSHannes Reinecke 1335e3264a4dSHannes Reinecke disk_part_iter_init(&piter, disk, DISK_PITER_INCL_EMPTY); 1336e71bf0d0STejun Heo while ((part = disk_part_iter_next(&piter))) 1337e71bf0d0STejun Heo part->policy = flag; 1338e71bf0d0STejun Heo disk_part_iter_exit(&piter); 13391da177e4SLinus Torvalds } 13401da177e4SLinus Torvalds 13411da177e4SLinus Torvalds EXPORT_SYMBOL(set_disk_ro); 13421da177e4SLinus Torvalds 13431da177e4SLinus Torvalds int bdev_read_only(struct block_device *bdev) 13441da177e4SLinus Torvalds { 13451da177e4SLinus Torvalds if (!bdev) 13461da177e4SLinus Torvalds return 0; 13471da177e4SLinus Torvalds return bdev->bd_part->policy; 13481da177e4SLinus Torvalds } 13491da177e4SLinus Torvalds 13501da177e4SLinus Torvalds EXPORT_SYMBOL(bdev_read_only); 13511da177e4SLinus Torvalds 1352cf771cb5STejun Heo int invalidate_partition(struct gendisk *disk, int partno) 13531da177e4SLinus Torvalds { 13541da177e4SLinus Torvalds int res = 0; 1355cf771cb5STejun Heo struct block_device *bdev = bdget_disk(disk, partno); 13561da177e4SLinus Torvalds if (bdev) { 13572ef41634SChristoph Hellwig fsync_bdev(bdev); 135893b270f7SNeilBrown res = __invalidate_device(bdev, true); 13591da177e4SLinus Torvalds bdput(bdev); 13601da177e4SLinus Torvalds } 13611da177e4SLinus Torvalds return res; 13621da177e4SLinus Torvalds } 13631da177e4SLinus Torvalds 13641da177e4SLinus Torvalds EXPORT_SYMBOL(invalidate_partition); 136577ea887eSTejun Heo 136677ea887eSTejun Heo /* 136777ea887eSTejun Heo * Disk events - monitor disk events like media change and eject request. 136877ea887eSTejun Heo */ 136977ea887eSTejun Heo struct disk_events { 137077ea887eSTejun Heo struct list_head node; /* all disk_event's */ 137177ea887eSTejun Heo struct gendisk *disk; /* the associated disk */ 137277ea887eSTejun Heo spinlock_t lock; 137377ea887eSTejun Heo 1374fdd514e1STejun Heo struct mutex block_mutex; /* protects blocking */ 137577ea887eSTejun Heo int block; /* event blocking depth */ 137677ea887eSTejun Heo unsigned int pending; /* events already sent out */ 137777ea887eSTejun Heo unsigned int clearing; /* events being cleared */ 137877ea887eSTejun Heo 137977ea887eSTejun Heo long poll_msecs; /* interval, -1 for default */ 138077ea887eSTejun Heo struct delayed_work dwork; 138177ea887eSTejun Heo }; 138277ea887eSTejun Heo 138377ea887eSTejun Heo static const char *disk_events_strs[] = { 138477ea887eSTejun Heo [ilog2(DISK_EVENT_MEDIA_CHANGE)] = "media_change", 138577ea887eSTejun Heo [ilog2(DISK_EVENT_EJECT_REQUEST)] = "eject_request", 138677ea887eSTejun Heo }; 138777ea887eSTejun Heo 138877ea887eSTejun Heo static char *disk_uevents[] = { 138977ea887eSTejun Heo [ilog2(DISK_EVENT_MEDIA_CHANGE)] = "DISK_MEDIA_CHANGE=1", 139077ea887eSTejun Heo [ilog2(DISK_EVENT_EJECT_REQUEST)] = "DISK_EJECT_REQUEST=1", 139177ea887eSTejun Heo }; 139277ea887eSTejun Heo 139377ea887eSTejun Heo /* list of all disk_events */ 139477ea887eSTejun Heo static DEFINE_MUTEX(disk_events_mutex); 139577ea887eSTejun Heo static LIST_HEAD(disk_events); 139677ea887eSTejun Heo 139777ea887eSTejun Heo /* disable in-kernel polling by default */ 139877ea887eSTejun Heo static unsigned long disk_events_dfl_poll_msecs = 0; 139977ea887eSTejun Heo 140077ea887eSTejun Heo static unsigned long disk_events_poll_jiffies(struct gendisk *disk) 140177ea887eSTejun Heo { 140277ea887eSTejun Heo struct disk_events *ev = disk->ev; 140377ea887eSTejun Heo long intv_msecs = 0; 140477ea887eSTejun Heo 140577ea887eSTejun Heo /* 140677ea887eSTejun Heo * If device-specific poll interval is set, always use it. If 140777ea887eSTejun Heo * the default is being used, poll iff there are events which 140877ea887eSTejun Heo * can't be monitored asynchronously. 140977ea887eSTejun Heo */ 141077ea887eSTejun Heo if (ev->poll_msecs >= 0) 141177ea887eSTejun Heo intv_msecs = ev->poll_msecs; 141277ea887eSTejun Heo else if (disk->events & ~disk->async_events) 141377ea887eSTejun Heo intv_msecs = disk_events_dfl_poll_msecs; 141477ea887eSTejun Heo 141577ea887eSTejun Heo return msecs_to_jiffies(intv_msecs); 141677ea887eSTejun Heo } 141777ea887eSTejun Heo 1418c3af54afSTejun Heo /** 1419c3af54afSTejun Heo * disk_block_events - block and flush disk event checking 1420c3af54afSTejun Heo * @disk: disk to block events for 1421c3af54afSTejun Heo * 1422c3af54afSTejun Heo * On return from this function, it is guaranteed that event checking 1423c3af54afSTejun Heo * isn't in progress and won't happen until unblocked by 1424c3af54afSTejun Heo * disk_unblock_events(). Events blocking is counted and the actual 1425c3af54afSTejun Heo * unblocking happens after the matching number of unblocks are done. 1426c3af54afSTejun Heo * 1427c3af54afSTejun Heo * Note that this intentionally does not block event checking from 1428c3af54afSTejun Heo * disk_clear_events(). 1429c3af54afSTejun Heo * 1430c3af54afSTejun Heo * CONTEXT: 1431c3af54afSTejun Heo * Might sleep. 1432c3af54afSTejun Heo */ 1433c3af54afSTejun Heo void disk_block_events(struct gendisk *disk) 143477ea887eSTejun Heo { 143577ea887eSTejun Heo struct disk_events *ev = disk->ev; 143677ea887eSTejun Heo unsigned long flags; 143777ea887eSTejun Heo bool cancel; 143877ea887eSTejun Heo 1439c3af54afSTejun Heo if (!ev) 1440c3af54afSTejun Heo return; 1441c3af54afSTejun Heo 1442fdd514e1STejun Heo /* 1443fdd514e1STejun Heo * Outer mutex ensures that the first blocker completes canceling 1444fdd514e1STejun Heo * the event work before further blockers are allowed to finish. 1445fdd514e1STejun Heo */ 1446fdd514e1STejun Heo mutex_lock(&ev->block_mutex); 1447fdd514e1STejun Heo 144877ea887eSTejun Heo spin_lock_irqsave(&ev->lock, flags); 144977ea887eSTejun Heo cancel = !ev->block++; 145077ea887eSTejun Heo spin_unlock_irqrestore(&ev->lock, flags); 145177ea887eSTejun Heo 1452c3af54afSTejun Heo if (cancel) 145377ea887eSTejun Heo cancel_delayed_work_sync(&disk->ev->dwork); 1454fdd514e1STejun Heo 1455fdd514e1STejun Heo mutex_unlock(&ev->block_mutex); 145677ea887eSTejun Heo } 145777ea887eSTejun Heo 145877ea887eSTejun Heo static void __disk_unblock_events(struct gendisk *disk, bool check_now) 145977ea887eSTejun Heo { 146077ea887eSTejun Heo struct disk_events *ev = disk->ev; 146177ea887eSTejun Heo unsigned long intv; 146277ea887eSTejun Heo unsigned long flags; 146377ea887eSTejun Heo 146477ea887eSTejun Heo spin_lock_irqsave(&ev->lock, flags); 146577ea887eSTejun Heo 146677ea887eSTejun Heo if (WARN_ON_ONCE(ev->block <= 0)) 146777ea887eSTejun Heo goto out_unlock; 146877ea887eSTejun Heo 146977ea887eSTejun Heo if (--ev->block) 147077ea887eSTejun Heo goto out_unlock; 147177ea887eSTejun Heo 147277ea887eSTejun Heo /* 147377ea887eSTejun Heo * Not exactly a latency critical operation, set poll timer 147477ea887eSTejun Heo * slack to 25% and kick event check. 147577ea887eSTejun Heo */ 147677ea887eSTejun Heo intv = disk_events_poll_jiffies(disk); 147777ea887eSTejun Heo set_timer_slack(&ev->dwork.timer, intv / 4); 147877ea887eSTejun Heo if (check_now) 147977ea887eSTejun Heo queue_delayed_work(system_nrt_wq, &ev->dwork, 0); 148077ea887eSTejun Heo else if (intv) 148177ea887eSTejun Heo queue_delayed_work(system_nrt_wq, &ev->dwork, intv); 148277ea887eSTejun Heo out_unlock: 148377ea887eSTejun Heo spin_unlock_irqrestore(&ev->lock, flags); 148477ea887eSTejun Heo } 148577ea887eSTejun Heo 148677ea887eSTejun Heo /** 148777ea887eSTejun Heo * disk_unblock_events - unblock disk event checking 148877ea887eSTejun Heo * @disk: disk to unblock events for 148977ea887eSTejun Heo * 149077ea887eSTejun Heo * Undo disk_block_events(). When the block count reaches zero, it 149177ea887eSTejun Heo * starts events polling if configured. 149277ea887eSTejun Heo * 149377ea887eSTejun Heo * CONTEXT: 149477ea887eSTejun Heo * Don't care. Safe to call from irq context. 149577ea887eSTejun Heo */ 149677ea887eSTejun Heo void disk_unblock_events(struct gendisk *disk) 149777ea887eSTejun Heo { 149877ea887eSTejun Heo if (disk->ev) 1499facc31ddSTejun Heo __disk_unblock_events(disk, false); 150077ea887eSTejun Heo } 150177ea887eSTejun Heo 150277ea887eSTejun Heo /** 1503*85ef06d1STejun Heo * disk_flush_events - schedule immediate event checking and flushing 1504*85ef06d1STejun Heo * @disk: disk to check and flush events for 1505*85ef06d1STejun Heo * @mask: events to flush 150677ea887eSTejun Heo * 1507*85ef06d1STejun Heo * Schedule immediate event checking on @disk if not blocked. Events in 1508*85ef06d1STejun Heo * @mask are scheduled to be cleared from the driver. Note that this 1509*85ef06d1STejun Heo * doesn't clear the events from @disk->ev. 151077ea887eSTejun Heo * 151177ea887eSTejun Heo * CONTEXT: 1512*85ef06d1STejun Heo * If @mask is non-zero must be called with bdev->bd_mutex held. 151377ea887eSTejun Heo */ 1514*85ef06d1STejun Heo void disk_flush_events(struct gendisk *disk, unsigned int mask) 151577ea887eSTejun Heo { 1516a9dce2a3STejun Heo struct disk_events *ev = disk->ev; 1517a9dce2a3STejun Heo 1518a9dce2a3STejun Heo if (!ev) 1519a9dce2a3STejun Heo return; 1520a9dce2a3STejun Heo 1521*85ef06d1STejun Heo spin_lock_irq(&ev->lock); 1522*85ef06d1STejun Heo ev->clearing |= mask; 1523a9dce2a3STejun Heo if (!ev->block) { 1524a9dce2a3STejun Heo cancel_delayed_work(&ev->dwork); 1525a9dce2a3STejun Heo queue_delayed_work(system_nrt_wq, &ev->dwork, 0); 152677ea887eSTejun Heo } 1527*85ef06d1STejun Heo spin_unlock_irq(&ev->lock); 152877ea887eSTejun Heo } 152977ea887eSTejun Heo 153077ea887eSTejun Heo /** 153177ea887eSTejun Heo * disk_clear_events - synchronously check, clear and return pending events 153277ea887eSTejun Heo * @disk: disk to fetch and clear events from 153377ea887eSTejun Heo * @mask: mask of events to be fetched and clearted 153477ea887eSTejun Heo * 153577ea887eSTejun Heo * Disk events are synchronously checked and pending events in @mask 153677ea887eSTejun Heo * are cleared and returned. This ignores the block count. 153777ea887eSTejun Heo * 153877ea887eSTejun Heo * CONTEXT: 153977ea887eSTejun Heo * Might sleep. 154077ea887eSTejun Heo */ 154177ea887eSTejun Heo unsigned int disk_clear_events(struct gendisk *disk, unsigned int mask) 154277ea887eSTejun Heo { 154377ea887eSTejun Heo const struct block_device_operations *bdops = disk->fops; 154477ea887eSTejun Heo struct disk_events *ev = disk->ev; 154577ea887eSTejun Heo unsigned int pending; 154677ea887eSTejun Heo 154777ea887eSTejun Heo if (!ev) { 154877ea887eSTejun Heo /* for drivers still using the old ->media_changed method */ 154977ea887eSTejun Heo if ((mask & DISK_EVENT_MEDIA_CHANGE) && 155077ea887eSTejun Heo bdops->media_changed && bdops->media_changed(disk)) 155177ea887eSTejun Heo return DISK_EVENT_MEDIA_CHANGE; 155277ea887eSTejun Heo return 0; 155377ea887eSTejun Heo } 155477ea887eSTejun Heo 155577ea887eSTejun Heo /* tell the workfn about the events being cleared */ 155677ea887eSTejun Heo spin_lock_irq(&ev->lock); 155777ea887eSTejun Heo ev->clearing |= mask; 155877ea887eSTejun Heo spin_unlock_irq(&ev->lock); 155977ea887eSTejun Heo 156077ea887eSTejun Heo /* uncondtionally schedule event check and wait for it to finish */ 1561c3af54afSTejun Heo disk_block_events(disk); 156277ea887eSTejun Heo queue_delayed_work(system_nrt_wq, &ev->dwork, 0); 156377ea887eSTejun Heo flush_delayed_work(&ev->dwork); 156477ea887eSTejun Heo __disk_unblock_events(disk, false); 156577ea887eSTejun Heo 156677ea887eSTejun Heo /* then, fetch and clear pending events */ 156777ea887eSTejun Heo spin_lock_irq(&ev->lock); 156877ea887eSTejun Heo WARN_ON_ONCE(ev->clearing & mask); /* cleared by workfn */ 156977ea887eSTejun Heo pending = ev->pending & mask; 157077ea887eSTejun Heo ev->pending &= ~mask; 157177ea887eSTejun Heo spin_unlock_irq(&ev->lock); 157277ea887eSTejun Heo 157377ea887eSTejun Heo return pending; 157477ea887eSTejun Heo } 157577ea887eSTejun Heo 157677ea887eSTejun Heo static void disk_events_workfn(struct work_struct *work) 157777ea887eSTejun Heo { 157877ea887eSTejun Heo struct delayed_work *dwork = to_delayed_work(work); 157977ea887eSTejun Heo struct disk_events *ev = container_of(dwork, struct disk_events, dwork); 158077ea887eSTejun Heo struct gendisk *disk = ev->disk; 158177ea887eSTejun Heo char *envp[ARRAY_SIZE(disk_uevents) + 1] = { }; 158277ea887eSTejun Heo unsigned int clearing = ev->clearing; 158377ea887eSTejun Heo unsigned int events; 158477ea887eSTejun Heo unsigned long intv; 158577ea887eSTejun Heo int nr_events = 0, i; 158677ea887eSTejun Heo 158777ea887eSTejun Heo /* check events */ 158877ea887eSTejun Heo events = disk->fops->check_events(disk, clearing); 158977ea887eSTejun Heo 159077ea887eSTejun Heo /* accumulate pending events and schedule next poll if necessary */ 159177ea887eSTejun Heo spin_lock_irq(&ev->lock); 159277ea887eSTejun Heo 159377ea887eSTejun Heo events &= ~ev->pending; 159477ea887eSTejun Heo ev->pending |= events; 159577ea887eSTejun Heo ev->clearing &= ~clearing; 159677ea887eSTejun Heo 159777ea887eSTejun Heo intv = disk_events_poll_jiffies(disk); 159877ea887eSTejun Heo if (!ev->block && intv) 159977ea887eSTejun Heo queue_delayed_work(system_nrt_wq, &ev->dwork, intv); 160077ea887eSTejun Heo 160177ea887eSTejun Heo spin_unlock_irq(&ev->lock); 160277ea887eSTejun Heo 16037c88a168STejun Heo /* 16047c88a168STejun Heo * Tell userland about new events. Only the events listed in 16057c88a168STejun Heo * @disk->events are reported. Unlisted events are processed the 16067c88a168STejun Heo * same internally but never get reported to userland. 16077c88a168STejun Heo */ 160877ea887eSTejun Heo for (i = 0; i < ARRAY_SIZE(disk_uevents); i++) 16097c88a168STejun Heo if (events & disk->events & (1 << i)) 161077ea887eSTejun Heo envp[nr_events++] = disk_uevents[i]; 161177ea887eSTejun Heo 161277ea887eSTejun Heo if (nr_events) 161377ea887eSTejun Heo kobject_uevent_env(&disk_to_dev(disk)->kobj, KOBJ_CHANGE, envp); 161477ea887eSTejun Heo } 161577ea887eSTejun Heo 161677ea887eSTejun Heo /* 161777ea887eSTejun Heo * A disk events enabled device has the following sysfs nodes under 161877ea887eSTejun Heo * its /sys/block/X/ directory. 161977ea887eSTejun Heo * 162077ea887eSTejun Heo * events : list of all supported events 162177ea887eSTejun Heo * events_async : list of events which can be detected w/o polling 162277ea887eSTejun Heo * events_poll_msecs : polling interval, 0: disable, -1: system default 162377ea887eSTejun Heo */ 162477ea887eSTejun Heo static ssize_t __disk_events_show(unsigned int events, char *buf) 162577ea887eSTejun Heo { 162677ea887eSTejun Heo const char *delim = ""; 162777ea887eSTejun Heo ssize_t pos = 0; 162877ea887eSTejun Heo int i; 162977ea887eSTejun Heo 163077ea887eSTejun Heo for (i = 0; i < ARRAY_SIZE(disk_events_strs); i++) 163177ea887eSTejun Heo if (events & (1 << i)) { 163277ea887eSTejun Heo pos += sprintf(buf + pos, "%s%s", 163377ea887eSTejun Heo delim, disk_events_strs[i]); 163477ea887eSTejun Heo delim = " "; 163577ea887eSTejun Heo } 163677ea887eSTejun Heo if (pos) 163777ea887eSTejun Heo pos += sprintf(buf + pos, "\n"); 163877ea887eSTejun Heo return pos; 163977ea887eSTejun Heo } 164077ea887eSTejun Heo 164177ea887eSTejun Heo static ssize_t disk_events_show(struct device *dev, 164277ea887eSTejun Heo struct device_attribute *attr, char *buf) 164377ea887eSTejun Heo { 164477ea887eSTejun Heo struct gendisk *disk = dev_to_disk(dev); 164577ea887eSTejun Heo 164677ea887eSTejun Heo return __disk_events_show(disk->events, buf); 164777ea887eSTejun Heo } 164877ea887eSTejun Heo 164977ea887eSTejun Heo static ssize_t disk_events_async_show(struct device *dev, 165077ea887eSTejun Heo struct device_attribute *attr, char *buf) 165177ea887eSTejun Heo { 165277ea887eSTejun Heo struct gendisk *disk = dev_to_disk(dev); 165377ea887eSTejun Heo 165477ea887eSTejun Heo return __disk_events_show(disk->async_events, buf); 165577ea887eSTejun Heo } 165677ea887eSTejun Heo 165777ea887eSTejun Heo static ssize_t disk_events_poll_msecs_show(struct device *dev, 165877ea887eSTejun Heo struct device_attribute *attr, 165977ea887eSTejun Heo char *buf) 166077ea887eSTejun Heo { 166177ea887eSTejun Heo struct gendisk *disk = dev_to_disk(dev); 166277ea887eSTejun Heo 166377ea887eSTejun Heo return sprintf(buf, "%ld\n", disk->ev->poll_msecs); 166477ea887eSTejun Heo } 166577ea887eSTejun Heo 166677ea887eSTejun Heo static ssize_t disk_events_poll_msecs_store(struct device *dev, 166777ea887eSTejun Heo struct device_attribute *attr, 166877ea887eSTejun Heo const char *buf, size_t count) 166977ea887eSTejun Heo { 167077ea887eSTejun Heo struct gendisk *disk = dev_to_disk(dev); 167177ea887eSTejun Heo long intv; 167277ea887eSTejun Heo 167377ea887eSTejun Heo if (!count || !sscanf(buf, "%ld", &intv)) 167477ea887eSTejun Heo return -EINVAL; 167577ea887eSTejun Heo 167677ea887eSTejun Heo if (intv < 0 && intv != -1) 167777ea887eSTejun Heo return -EINVAL; 167877ea887eSTejun Heo 1679c3af54afSTejun Heo disk_block_events(disk); 168077ea887eSTejun Heo disk->ev->poll_msecs = intv; 168177ea887eSTejun Heo __disk_unblock_events(disk, true); 168277ea887eSTejun Heo 168377ea887eSTejun Heo return count; 168477ea887eSTejun Heo } 168577ea887eSTejun Heo 168677ea887eSTejun Heo static const DEVICE_ATTR(events, S_IRUGO, disk_events_show, NULL); 168777ea887eSTejun Heo static const DEVICE_ATTR(events_async, S_IRUGO, disk_events_async_show, NULL); 168877ea887eSTejun Heo static const DEVICE_ATTR(events_poll_msecs, S_IRUGO|S_IWUSR, 168977ea887eSTejun Heo disk_events_poll_msecs_show, 169077ea887eSTejun Heo disk_events_poll_msecs_store); 169177ea887eSTejun Heo 169277ea887eSTejun Heo static const struct attribute *disk_events_attrs[] = { 169377ea887eSTejun Heo &dev_attr_events.attr, 169477ea887eSTejun Heo &dev_attr_events_async.attr, 169577ea887eSTejun Heo &dev_attr_events_poll_msecs.attr, 169677ea887eSTejun Heo NULL, 169777ea887eSTejun Heo }; 169877ea887eSTejun Heo 169977ea887eSTejun Heo /* 170077ea887eSTejun Heo * The default polling interval can be specified by the kernel 170177ea887eSTejun Heo * parameter block.events_dfl_poll_msecs which defaults to 0 170277ea887eSTejun Heo * (disable). This can also be modified runtime by writing to 170377ea887eSTejun Heo * /sys/module/block/events_dfl_poll_msecs. 170477ea887eSTejun Heo */ 170577ea887eSTejun Heo static int disk_events_set_dfl_poll_msecs(const char *val, 170677ea887eSTejun Heo const struct kernel_param *kp) 170777ea887eSTejun Heo { 170877ea887eSTejun Heo struct disk_events *ev; 170977ea887eSTejun Heo int ret; 171077ea887eSTejun Heo 171177ea887eSTejun Heo ret = param_set_ulong(val, kp); 171277ea887eSTejun Heo if (ret < 0) 171377ea887eSTejun Heo return ret; 171477ea887eSTejun Heo 171577ea887eSTejun Heo mutex_lock(&disk_events_mutex); 171677ea887eSTejun Heo 171777ea887eSTejun Heo list_for_each_entry(ev, &disk_events, node) 1718*85ef06d1STejun Heo disk_flush_events(ev->disk, 0); 171977ea887eSTejun Heo 172077ea887eSTejun Heo mutex_unlock(&disk_events_mutex); 172177ea887eSTejun Heo 172277ea887eSTejun Heo return 0; 172377ea887eSTejun Heo } 172477ea887eSTejun Heo 172577ea887eSTejun Heo static const struct kernel_param_ops disk_events_dfl_poll_msecs_param_ops = { 172677ea887eSTejun Heo .set = disk_events_set_dfl_poll_msecs, 172777ea887eSTejun Heo .get = param_get_ulong, 172877ea887eSTejun Heo }; 172977ea887eSTejun Heo 173077ea887eSTejun Heo #undef MODULE_PARAM_PREFIX 173177ea887eSTejun Heo #define MODULE_PARAM_PREFIX "block." 173277ea887eSTejun Heo 173377ea887eSTejun Heo module_param_cb(events_dfl_poll_msecs, &disk_events_dfl_poll_msecs_param_ops, 173477ea887eSTejun Heo &disk_events_dfl_poll_msecs, 0644); 173577ea887eSTejun Heo 173677ea887eSTejun Heo /* 173777ea887eSTejun Heo * disk_{add|del|release}_events - initialize and destroy disk_events. 173877ea887eSTejun Heo */ 173977ea887eSTejun Heo static void disk_add_events(struct gendisk *disk) 174077ea887eSTejun Heo { 174177ea887eSTejun Heo struct disk_events *ev; 174277ea887eSTejun Heo 174375e3f3eeSTejun Heo if (!disk->fops->check_events) 174477ea887eSTejun Heo return; 174577ea887eSTejun Heo 174677ea887eSTejun Heo ev = kzalloc(sizeof(*ev), GFP_KERNEL); 174777ea887eSTejun Heo if (!ev) { 174877ea887eSTejun Heo pr_warn("%s: failed to initialize events\n", disk->disk_name); 174977ea887eSTejun Heo return; 175077ea887eSTejun Heo } 175177ea887eSTejun Heo 175277ea887eSTejun Heo if (sysfs_create_files(&disk_to_dev(disk)->kobj, 175377ea887eSTejun Heo disk_events_attrs) < 0) { 175477ea887eSTejun Heo pr_warn("%s: failed to create sysfs files for events\n", 175577ea887eSTejun Heo disk->disk_name); 175677ea887eSTejun Heo kfree(ev); 175777ea887eSTejun Heo return; 175877ea887eSTejun Heo } 175977ea887eSTejun Heo 176077ea887eSTejun Heo disk->ev = ev; 176177ea887eSTejun Heo 176277ea887eSTejun Heo INIT_LIST_HEAD(&ev->node); 176377ea887eSTejun Heo ev->disk = disk; 176477ea887eSTejun Heo spin_lock_init(&ev->lock); 1765fdd514e1STejun Heo mutex_init(&ev->block_mutex); 176677ea887eSTejun Heo ev->block = 1; 176777ea887eSTejun Heo ev->poll_msecs = -1; 176877ea887eSTejun Heo INIT_DELAYED_WORK(&ev->dwork, disk_events_workfn); 176977ea887eSTejun Heo 177077ea887eSTejun Heo mutex_lock(&disk_events_mutex); 177177ea887eSTejun Heo list_add_tail(&ev->node, &disk_events); 177277ea887eSTejun Heo mutex_unlock(&disk_events_mutex); 177377ea887eSTejun Heo 177477ea887eSTejun Heo /* 177577ea887eSTejun Heo * Block count is initialized to 1 and the following initial 177677ea887eSTejun Heo * unblock kicks it into action. 177777ea887eSTejun Heo */ 177877ea887eSTejun Heo __disk_unblock_events(disk, true); 177977ea887eSTejun Heo } 178077ea887eSTejun Heo 178177ea887eSTejun Heo static void disk_del_events(struct gendisk *disk) 178277ea887eSTejun Heo { 178377ea887eSTejun Heo if (!disk->ev) 178477ea887eSTejun Heo return; 178577ea887eSTejun Heo 1786c3af54afSTejun Heo disk_block_events(disk); 178777ea887eSTejun Heo 178877ea887eSTejun Heo mutex_lock(&disk_events_mutex); 178977ea887eSTejun Heo list_del_init(&disk->ev->node); 179077ea887eSTejun Heo mutex_unlock(&disk_events_mutex); 179177ea887eSTejun Heo 179277ea887eSTejun Heo sysfs_remove_files(&disk_to_dev(disk)->kobj, disk_events_attrs); 179377ea887eSTejun Heo } 179477ea887eSTejun Heo 179577ea887eSTejun Heo static void disk_release_events(struct gendisk *disk) 179677ea887eSTejun Heo { 179777ea887eSTejun Heo /* the block count should be 1 from disk_del_events() */ 179877ea887eSTejun Heo WARN_ON_ONCE(disk->ev && disk->ev->block != 1); 179977ea887eSTejun Heo kfree(disk->ev); 180077ea887eSTejun Heo } 1801