11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * gendisk handling 31da177e4SLinus Torvalds */ 41da177e4SLinus Torvalds 51da177e4SLinus Torvalds #include <linux/module.h> 61da177e4SLinus Torvalds #include <linux/fs.h> 71da177e4SLinus Torvalds #include <linux/genhd.h> 8b446b60eSAndrew Morton #include <linux/kdev_t.h> 91da177e4SLinus Torvalds #include <linux/kernel.h> 101da177e4SLinus Torvalds #include <linux/blkdev.h> 111da177e4SLinus Torvalds #include <linux/init.h> 121da177e4SLinus Torvalds #include <linux/spinlock.h> 13f500975aSAlexey Dobriyan #include <linux/proc_fs.h> 141da177e4SLinus Torvalds #include <linux/seq_file.h> 151da177e4SLinus Torvalds #include <linux/slab.h> 161da177e4SLinus Torvalds #include <linux/kmod.h> 171da177e4SLinus Torvalds #include <linux/kobj_map.h> 1858383af6SJes Sorensen #include <linux/mutex.h> 19bcce3de1STejun Heo #include <linux/idr.h> 2077ea887eSTejun Heo #include <linux/log2.h> 211da177e4SLinus Torvalds 22ff88972cSAdrian Bunk #include "blk.h" 23ff88972cSAdrian Bunk 24edfaa7c3SKay Sievers static DEFINE_MUTEX(block_class_lock); 25edfaa7c3SKay Sievers struct kobject *block_depr; 261da177e4SLinus Torvalds 27bcce3de1STejun Heo /* for extended dynamic devt allocation, currently only one major is used */ 28bcce3de1STejun Heo #define MAX_EXT_DEVT (1 << MINORBITS) 29bcce3de1STejun Heo 30bcce3de1STejun Heo /* For extended devt allocation. ext_devt_mutex prevents look up 31bcce3de1STejun Heo * results from going away underneath its user. 32bcce3de1STejun Heo */ 33bcce3de1STejun Heo static DEFINE_MUTEX(ext_devt_mutex); 34bcce3de1STejun Heo static DEFINE_IDR(ext_devt_idr); 35bcce3de1STejun Heo 361826eadfSAdrian Bunk static struct device_type disk_type; 371826eadfSAdrian Bunk 389f53d2feSStanislaw Gruszka static void disk_alloc_events(struct gendisk *disk); 3977ea887eSTejun Heo static void disk_add_events(struct gendisk *disk); 4077ea887eSTejun Heo static void disk_del_events(struct gendisk *disk); 4177ea887eSTejun Heo static void disk_release_events(struct gendisk *disk); 4277ea887eSTejun Heo 43e71bf0d0STejun Heo /** 44e71bf0d0STejun Heo * disk_get_part - get partition 45e71bf0d0STejun Heo * @disk: disk to look partition from 46e71bf0d0STejun Heo * @partno: partition number 47e71bf0d0STejun Heo * 48e71bf0d0STejun Heo * Look for partition @partno from @disk. If found, increment 49e71bf0d0STejun Heo * reference count and return it. 50e71bf0d0STejun Heo * 51e71bf0d0STejun Heo * CONTEXT: 52e71bf0d0STejun Heo * Don't care. 53e71bf0d0STejun Heo * 54e71bf0d0STejun Heo * RETURNS: 55e71bf0d0STejun Heo * Pointer to the found partition on success, NULL if not found. 56e71bf0d0STejun Heo */ 57e71bf0d0STejun Heo struct hd_struct *disk_get_part(struct gendisk *disk, int partno) 58e71bf0d0STejun Heo { 59540eed56STejun Heo struct hd_struct *part = NULL; 60540eed56STejun Heo struct disk_part_tbl *ptbl; 61e71bf0d0STejun Heo 62540eed56STejun Heo if (unlikely(partno < 0)) 63e71bf0d0STejun Heo return NULL; 64540eed56STejun Heo 65e71bf0d0STejun Heo rcu_read_lock(); 66540eed56STejun Heo 67540eed56STejun Heo ptbl = rcu_dereference(disk->part_tbl); 68540eed56STejun Heo if (likely(partno < ptbl->len)) { 69540eed56STejun Heo part = rcu_dereference(ptbl->part[partno]); 70e71bf0d0STejun Heo if (part) 71ed9e1982STejun Heo get_device(part_to_dev(part)); 72540eed56STejun Heo } 73540eed56STejun Heo 74e71bf0d0STejun Heo rcu_read_unlock(); 75e71bf0d0STejun Heo 76e71bf0d0STejun Heo return part; 77e71bf0d0STejun Heo } 78e71bf0d0STejun Heo EXPORT_SYMBOL_GPL(disk_get_part); 79e71bf0d0STejun Heo 80e71bf0d0STejun Heo /** 81e71bf0d0STejun Heo * disk_part_iter_init - initialize partition iterator 82e71bf0d0STejun Heo * @piter: iterator to initialize 83e71bf0d0STejun Heo * @disk: disk to iterate over 84e71bf0d0STejun Heo * @flags: DISK_PITER_* flags 85e71bf0d0STejun Heo * 86e71bf0d0STejun Heo * Initialize @piter so that it iterates over partitions of @disk. 87e71bf0d0STejun Heo * 88e71bf0d0STejun Heo * CONTEXT: 89e71bf0d0STejun Heo * Don't care. 90e71bf0d0STejun Heo */ 91e71bf0d0STejun Heo void disk_part_iter_init(struct disk_part_iter *piter, struct gendisk *disk, 92e71bf0d0STejun Heo unsigned int flags) 93e71bf0d0STejun Heo { 94540eed56STejun Heo struct disk_part_tbl *ptbl; 95540eed56STejun Heo 96540eed56STejun Heo rcu_read_lock(); 97540eed56STejun Heo ptbl = rcu_dereference(disk->part_tbl); 98540eed56STejun Heo 99e71bf0d0STejun Heo piter->disk = disk; 100e71bf0d0STejun Heo piter->part = NULL; 101e71bf0d0STejun Heo 102e71bf0d0STejun Heo if (flags & DISK_PITER_REVERSE) 103540eed56STejun Heo piter->idx = ptbl->len - 1; 10471982a40STejun Heo else if (flags & (DISK_PITER_INCL_PART0 | DISK_PITER_INCL_EMPTY_PART0)) 105e71bf0d0STejun Heo piter->idx = 0; 106b5d0b9dfSTejun Heo else 107b5d0b9dfSTejun Heo piter->idx = 1; 108e71bf0d0STejun Heo 109e71bf0d0STejun Heo piter->flags = flags; 110540eed56STejun Heo 111540eed56STejun Heo rcu_read_unlock(); 112e71bf0d0STejun Heo } 113e71bf0d0STejun Heo EXPORT_SYMBOL_GPL(disk_part_iter_init); 114e71bf0d0STejun Heo 115e71bf0d0STejun Heo /** 116e71bf0d0STejun Heo * disk_part_iter_next - proceed iterator to the next partition and return it 117e71bf0d0STejun Heo * @piter: iterator of interest 118e71bf0d0STejun Heo * 119e71bf0d0STejun Heo * Proceed @piter to the next partition and return it. 120e71bf0d0STejun Heo * 121e71bf0d0STejun Heo * CONTEXT: 122e71bf0d0STejun Heo * Don't care. 123e71bf0d0STejun Heo */ 124e71bf0d0STejun Heo struct hd_struct *disk_part_iter_next(struct disk_part_iter *piter) 125e71bf0d0STejun Heo { 126540eed56STejun Heo struct disk_part_tbl *ptbl; 127e71bf0d0STejun Heo int inc, end; 128e71bf0d0STejun Heo 129e71bf0d0STejun Heo /* put the last partition */ 130e71bf0d0STejun Heo disk_put_part(piter->part); 131e71bf0d0STejun Heo piter->part = NULL; 132e71bf0d0STejun Heo 133540eed56STejun Heo /* get part_tbl */ 134e71bf0d0STejun Heo rcu_read_lock(); 135540eed56STejun Heo ptbl = rcu_dereference(piter->disk->part_tbl); 136e71bf0d0STejun Heo 137e71bf0d0STejun Heo /* determine iteration parameters */ 138e71bf0d0STejun Heo if (piter->flags & DISK_PITER_REVERSE) { 139e71bf0d0STejun Heo inc = -1; 14071982a40STejun Heo if (piter->flags & (DISK_PITER_INCL_PART0 | 14171982a40STejun Heo DISK_PITER_INCL_EMPTY_PART0)) 142e71bf0d0STejun Heo end = -1; 143b5d0b9dfSTejun Heo else 144b5d0b9dfSTejun Heo end = 0; 145e71bf0d0STejun Heo } else { 146e71bf0d0STejun Heo inc = 1; 147540eed56STejun Heo end = ptbl->len; 148e71bf0d0STejun Heo } 149e71bf0d0STejun Heo 150e71bf0d0STejun Heo /* iterate to the next partition */ 151e71bf0d0STejun Heo for (; piter->idx != end; piter->idx += inc) { 152e71bf0d0STejun Heo struct hd_struct *part; 153e71bf0d0STejun Heo 154540eed56STejun Heo part = rcu_dereference(ptbl->part[piter->idx]); 155e71bf0d0STejun Heo if (!part) 156e71bf0d0STejun Heo continue; 157c83f6bf9SVivek Goyal if (!part_nr_sects_read(part) && 15871982a40STejun Heo !(piter->flags & DISK_PITER_INCL_EMPTY) && 15971982a40STejun Heo !(piter->flags & DISK_PITER_INCL_EMPTY_PART0 && 16071982a40STejun Heo piter->idx == 0)) 161e71bf0d0STejun Heo continue; 162e71bf0d0STejun Heo 163ed9e1982STejun Heo get_device(part_to_dev(part)); 164e71bf0d0STejun Heo piter->part = part; 165e71bf0d0STejun Heo piter->idx += inc; 166e71bf0d0STejun Heo break; 167e71bf0d0STejun Heo } 168e71bf0d0STejun Heo 169e71bf0d0STejun Heo rcu_read_unlock(); 170e71bf0d0STejun Heo 171e71bf0d0STejun Heo return piter->part; 172e71bf0d0STejun Heo } 173e71bf0d0STejun Heo EXPORT_SYMBOL_GPL(disk_part_iter_next); 174e71bf0d0STejun Heo 175e71bf0d0STejun Heo /** 176e71bf0d0STejun Heo * disk_part_iter_exit - finish up partition iteration 177e71bf0d0STejun Heo * @piter: iter of interest 178e71bf0d0STejun Heo * 179e71bf0d0STejun Heo * Called when iteration is over. Cleans up @piter. 180e71bf0d0STejun Heo * 181e71bf0d0STejun Heo * CONTEXT: 182e71bf0d0STejun Heo * Don't care. 183e71bf0d0STejun Heo */ 184e71bf0d0STejun Heo void disk_part_iter_exit(struct disk_part_iter *piter) 185e71bf0d0STejun Heo { 186e71bf0d0STejun Heo disk_put_part(piter->part); 187e71bf0d0STejun Heo piter->part = NULL; 188e71bf0d0STejun Heo } 189e71bf0d0STejun Heo EXPORT_SYMBOL_GPL(disk_part_iter_exit); 190e71bf0d0STejun Heo 191a6f23657SJens Axboe static inline int sector_in_part(struct hd_struct *part, sector_t sector) 192a6f23657SJens Axboe { 193a6f23657SJens Axboe return part->start_sect <= sector && 194c83f6bf9SVivek Goyal sector < part->start_sect + part_nr_sects_read(part); 195a6f23657SJens Axboe } 196a6f23657SJens Axboe 197e71bf0d0STejun Heo /** 198e71bf0d0STejun Heo * disk_map_sector_rcu - map sector to partition 199e71bf0d0STejun Heo * @disk: gendisk of interest 200e71bf0d0STejun Heo * @sector: sector to map 201e71bf0d0STejun Heo * 202e71bf0d0STejun Heo * Find out which partition @sector maps to on @disk. This is 203e71bf0d0STejun Heo * primarily used for stats accounting. 204e71bf0d0STejun Heo * 205e71bf0d0STejun Heo * CONTEXT: 206e71bf0d0STejun Heo * RCU read locked. The returned partition pointer is valid only 207e71bf0d0STejun Heo * while preemption is disabled. 208e71bf0d0STejun Heo * 209e71bf0d0STejun Heo * RETURNS: 210074a7acaSTejun Heo * Found partition on success, part0 is returned if no partition matches 211e71bf0d0STejun Heo */ 212e71bf0d0STejun Heo struct hd_struct *disk_map_sector_rcu(struct gendisk *disk, sector_t sector) 213e71bf0d0STejun Heo { 214540eed56STejun Heo struct disk_part_tbl *ptbl; 215a6f23657SJens Axboe struct hd_struct *part; 216e71bf0d0STejun Heo int i; 217e71bf0d0STejun Heo 218540eed56STejun Heo ptbl = rcu_dereference(disk->part_tbl); 219540eed56STejun Heo 220a6f23657SJens Axboe part = rcu_dereference(ptbl->last_lookup); 221a6f23657SJens Axboe if (part && sector_in_part(part, sector)) 222e71bf0d0STejun Heo return part; 223a6f23657SJens Axboe 224a6f23657SJens Axboe for (i = 1; i < ptbl->len; i++) { 225a6f23657SJens Axboe part = rcu_dereference(ptbl->part[i]); 226a6f23657SJens Axboe 227a6f23657SJens Axboe if (part && sector_in_part(part, sector)) { 228a6f23657SJens Axboe rcu_assign_pointer(ptbl->last_lookup, part); 229a6f23657SJens Axboe return part; 230a6f23657SJens Axboe } 231e71bf0d0STejun Heo } 232074a7acaSTejun Heo return &disk->part0; 233e71bf0d0STejun Heo } 234e71bf0d0STejun Heo EXPORT_SYMBOL_GPL(disk_map_sector_rcu); 235e71bf0d0STejun Heo 2361da177e4SLinus Torvalds /* 2371da177e4SLinus Torvalds * Can be deleted altogether. Later. 2381da177e4SLinus Torvalds * 2391da177e4SLinus Torvalds */ 2401da177e4SLinus Torvalds static struct blk_major_name { 2411da177e4SLinus Torvalds struct blk_major_name *next; 2421da177e4SLinus Torvalds int major; 2431da177e4SLinus Torvalds char name[16]; 24468eef3b4SJoe Korty } *major_names[BLKDEV_MAJOR_HASH_SIZE]; 2451da177e4SLinus Torvalds 2461da177e4SLinus Torvalds /* index in the above - for now: assume no multimajor ranges */ 247e61eb2e9SYang Zhang static inline int major_to_index(unsigned major) 2481da177e4SLinus Torvalds { 24968eef3b4SJoe Korty return major % BLKDEV_MAJOR_HASH_SIZE; 2501da177e4SLinus Torvalds } 2511da177e4SLinus Torvalds 25268eef3b4SJoe Korty #ifdef CONFIG_PROC_FS 253cf771cb5STejun Heo void blkdev_show(struct seq_file *seqf, off_t offset) 2547170be5fSNeil Horman { 25568eef3b4SJoe Korty struct blk_major_name *dp; 2567170be5fSNeil Horman 25768eef3b4SJoe Korty if (offset < BLKDEV_MAJOR_HASH_SIZE) { 258edfaa7c3SKay Sievers mutex_lock(&block_class_lock); 25968eef3b4SJoe Korty for (dp = major_names[offset]; dp; dp = dp->next) 260cf771cb5STejun Heo seq_printf(seqf, "%3d %s\n", dp->major, dp->name); 261edfaa7c3SKay Sievers mutex_unlock(&block_class_lock); 26268eef3b4SJoe Korty } 2637170be5fSNeil Horman } 26468eef3b4SJoe Korty #endif /* CONFIG_PROC_FS */ 2651da177e4SLinus Torvalds 2669e8c0bccSMárton Németh /** 2679e8c0bccSMárton Németh * register_blkdev - register a new block device 2689e8c0bccSMárton Németh * 2699e8c0bccSMárton Németh * @major: the requested major device number [1..255]. If @major=0, try to 2709e8c0bccSMárton Németh * allocate any unused major number. 2719e8c0bccSMárton Németh * @name: the name of the new block device as a zero terminated string 2729e8c0bccSMárton Németh * 2739e8c0bccSMárton Németh * The @name must be unique within the system. 2749e8c0bccSMárton Németh * 2759e8c0bccSMárton Németh * The return value depends on the @major input parameter. 2769e8c0bccSMárton Németh * - if a major device number was requested in range [1..255] then the 2779e8c0bccSMárton Németh * function returns zero on success, or a negative error code 2789e8c0bccSMárton Németh * - if any unused major number was requested with @major=0 parameter 2799e8c0bccSMárton Németh * then the return value is the allocated major number in range 2809e8c0bccSMárton Németh * [1..255] or a negative error code otherwise 2819e8c0bccSMárton Németh */ 2821da177e4SLinus Torvalds int register_blkdev(unsigned int major, const char *name) 2831da177e4SLinus Torvalds { 2841da177e4SLinus Torvalds struct blk_major_name **n, *p; 2851da177e4SLinus Torvalds int index, ret = 0; 2861da177e4SLinus Torvalds 287edfaa7c3SKay Sievers mutex_lock(&block_class_lock); 2881da177e4SLinus Torvalds 2891da177e4SLinus Torvalds /* temporary */ 2901da177e4SLinus Torvalds if (major == 0) { 2911da177e4SLinus Torvalds for (index = ARRAY_SIZE(major_names)-1; index > 0; index--) { 2921da177e4SLinus Torvalds if (major_names[index] == NULL) 2931da177e4SLinus Torvalds break; 2941da177e4SLinus Torvalds } 2951da177e4SLinus Torvalds 2961da177e4SLinus Torvalds if (index == 0) { 2971da177e4SLinus Torvalds printk("register_blkdev: failed to get major for %s\n", 2981da177e4SLinus Torvalds name); 2991da177e4SLinus Torvalds ret = -EBUSY; 3001da177e4SLinus Torvalds goto out; 3011da177e4SLinus Torvalds } 3021da177e4SLinus Torvalds major = index; 3031da177e4SLinus Torvalds ret = major; 3041da177e4SLinus Torvalds } 3051da177e4SLinus Torvalds 3061da177e4SLinus Torvalds p = kmalloc(sizeof(struct blk_major_name), GFP_KERNEL); 3071da177e4SLinus Torvalds if (p == NULL) { 3081da177e4SLinus Torvalds ret = -ENOMEM; 3091da177e4SLinus Torvalds goto out; 3101da177e4SLinus Torvalds } 3111da177e4SLinus Torvalds 3121da177e4SLinus Torvalds p->major = major; 3131da177e4SLinus Torvalds strlcpy(p->name, name, sizeof(p->name)); 3141da177e4SLinus Torvalds p->next = NULL; 3151da177e4SLinus Torvalds index = major_to_index(major); 3161da177e4SLinus Torvalds 3171da177e4SLinus Torvalds for (n = &major_names[index]; *n; n = &(*n)->next) { 3181da177e4SLinus Torvalds if ((*n)->major == major) 3191da177e4SLinus Torvalds break; 3201da177e4SLinus Torvalds } 3211da177e4SLinus Torvalds if (!*n) 3221da177e4SLinus Torvalds *n = p; 3231da177e4SLinus Torvalds else 3241da177e4SLinus Torvalds ret = -EBUSY; 3251da177e4SLinus Torvalds 3261da177e4SLinus Torvalds if (ret < 0) { 3271da177e4SLinus Torvalds printk("register_blkdev: cannot get major %d for %s\n", 3281da177e4SLinus Torvalds major, name); 3291da177e4SLinus Torvalds kfree(p); 3301da177e4SLinus Torvalds } 3311da177e4SLinus Torvalds out: 332edfaa7c3SKay Sievers mutex_unlock(&block_class_lock); 3331da177e4SLinus Torvalds return ret; 3341da177e4SLinus Torvalds } 3351da177e4SLinus Torvalds 3361da177e4SLinus Torvalds EXPORT_SYMBOL(register_blkdev); 3371da177e4SLinus Torvalds 338f4480240SAkinobu Mita void unregister_blkdev(unsigned int major, const char *name) 3391da177e4SLinus Torvalds { 3401da177e4SLinus Torvalds struct blk_major_name **n; 3411da177e4SLinus Torvalds struct blk_major_name *p = NULL; 3421da177e4SLinus Torvalds int index = major_to_index(major); 3431da177e4SLinus Torvalds 344edfaa7c3SKay Sievers mutex_lock(&block_class_lock); 3451da177e4SLinus Torvalds for (n = &major_names[index]; *n; n = &(*n)->next) 3461da177e4SLinus Torvalds if ((*n)->major == major) 3471da177e4SLinus Torvalds break; 348294462a5SAkinobu Mita if (!*n || strcmp((*n)->name, name)) { 349294462a5SAkinobu Mita WARN_ON(1); 350294462a5SAkinobu Mita } else { 3511da177e4SLinus Torvalds p = *n; 3521da177e4SLinus Torvalds *n = p->next; 3531da177e4SLinus Torvalds } 354edfaa7c3SKay Sievers mutex_unlock(&block_class_lock); 3551da177e4SLinus Torvalds kfree(p); 3561da177e4SLinus Torvalds } 3571da177e4SLinus Torvalds 3581da177e4SLinus Torvalds EXPORT_SYMBOL(unregister_blkdev); 3591da177e4SLinus Torvalds 3601da177e4SLinus Torvalds static struct kobj_map *bdev_map; 3611da177e4SLinus Torvalds 362bcce3de1STejun Heo /** 363870d6656STejun Heo * blk_mangle_minor - scatter minor numbers apart 364870d6656STejun Heo * @minor: minor number to mangle 365870d6656STejun Heo * 366870d6656STejun Heo * Scatter consecutively allocated @minor number apart if MANGLE_DEVT 367870d6656STejun Heo * is enabled. Mangling twice gives the original value. 368870d6656STejun Heo * 369870d6656STejun Heo * RETURNS: 370870d6656STejun Heo * Mangled value. 371870d6656STejun Heo * 372870d6656STejun Heo * CONTEXT: 373870d6656STejun Heo * Don't care. 374870d6656STejun Heo */ 375870d6656STejun Heo static int blk_mangle_minor(int minor) 376870d6656STejun Heo { 377870d6656STejun Heo #ifdef CONFIG_DEBUG_BLOCK_EXT_DEVT 378870d6656STejun Heo int i; 379870d6656STejun Heo 380870d6656STejun Heo for (i = 0; i < MINORBITS / 2; i++) { 381870d6656STejun Heo int low = minor & (1 << i); 382870d6656STejun Heo int high = minor & (1 << (MINORBITS - 1 - i)); 383870d6656STejun Heo int distance = MINORBITS - 1 - 2 * i; 384870d6656STejun Heo 385870d6656STejun Heo minor ^= low | high; /* clear both bits */ 386870d6656STejun Heo low <<= distance; /* swap the positions */ 387870d6656STejun Heo high >>= distance; 388870d6656STejun Heo minor |= low | high; /* and set */ 389870d6656STejun Heo } 390870d6656STejun Heo #endif 391870d6656STejun Heo return minor; 392870d6656STejun Heo } 393870d6656STejun Heo 394870d6656STejun Heo /** 395bcce3de1STejun Heo * blk_alloc_devt - allocate a dev_t for a partition 396bcce3de1STejun Heo * @part: partition to allocate dev_t for 397bcce3de1STejun Heo * @devt: out parameter for resulting dev_t 398bcce3de1STejun Heo * 399bcce3de1STejun Heo * Allocate a dev_t for block device. 400bcce3de1STejun Heo * 401bcce3de1STejun Heo * RETURNS: 402bcce3de1STejun Heo * 0 on success, allocated dev_t is returned in *@devt. -errno on 403bcce3de1STejun Heo * failure. 404bcce3de1STejun Heo * 405bcce3de1STejun Heo * CONTEXT: 406bcce3de1STejun Heo * Might sleep. 407bcce3de1STejun Heo */ 408bcce3de1STejun Heo int blk_alloc_devt(struct hd_struct *part, dev_t *devt) 409bcce3de1STejun Heo { 410bcce3de1STejun Heo struct gendisk *disk = part_to_disk(part); 411bcce3de1STejun Heo int idx, rc; 412bcce3de1STejun Heo 413bcce3de1STejun Heo /* in consecutive minor range? */ 414bcce3de1STejun Heo if (part->partno < disk->minors) { 415bcce3de1STejun Heo *devt = MKDEV(disk->major, disk->first_minor + part->partno); 416bcce3de1STejun Heo return 0; 417bcce3de1STejun Heo } 418bcce3de1STejun Heo 419bcce3de1STejun Heo /* allocate ext devt */ 420bcce3de1STejun Heo do { 421bcce3de1STejun Heo if (!idr_pre_get(&ext_devt_idr, GFP_KERNEL)) 422bcce3de1STejun Heo return -ENOMEM; 423bcce3de1STejun Heo rc = idr_get_new(&ext_devt_idr, part, &idx); 424bcce3de1STejun Heo } while (rc == -EAGAIN); 425bcce3de1STejun Heo 426bcce3de1STejun Heo if (rc) 427bcce3de1STejun Heo return rc; 428bcce3de1STejun Heo 429bcce3de1STejun Heo if (idx > MAX_EXT_DEVT) { 430bcce3de1STejun Heo idr_remove(&ext_devt_idr, idx); 431bcce3de1STejun Heo return -EBUSY; 432bcce3de1STejun Heo } 433bcce3de1STejun Heo 434870d6656STejun Heo *devt = MKDEV(BLOCK_EXT_MAJOR, blk_mangle_minor(idx)); 435bcce3de1STejun Heo return 0; 436bcce3de1STejun Heo } 437bcce3de1STejun Heo 438bcce3de1STejun Heo /** 439bcce3de1STejun Heo * blk_free_devt - free a dev_t 440bcce3de1STejun Heo * @devt: dev_t to free 441bcce3de1STejun Heo * 442bcce3de1STejun Heo * Free @devt which was allocated using blk_alloc_devt(). 443bcce3de1STejun Heo * 444bcce3de1STejun Heo * CONTEXT: 445bcce3de1STejun Heo * Might sleep. 446bcce3de1STejun Heo */ 447bcce3de1STejun Heo void blk_free_devt(dev_t devt) 448bcce3de1STejun Heo { 449bcce3de1STejun Heo might_sleep(); 450bcce3de1STejun Heo 451bcce3de1STejun Heo if (devt == MKDEV(0, 0)) 452bcce3de1STejun Heo return; 453bcce3de1STejun Heo 454bcce3de1STejun Heo if (MAJOR(devt) == BLOCK_EXT_MAJOR) { 455bcce3de1STejun Heo mutex_lock(&ext_devt_mutex); 456870d6656STejun Heo idr_remove(&ext_devt_idr, blk_mangle_minor(MINOR(devt))); 457bcce3de1STejun Heo mutex_unlock(&ext_devt_mutex); 458bcce3de1STejun Heo } 459bcce3de1STejun Heo } 460bcce3de1STejun Heo 4611f014290STejun Heo static char *bdevt_str(dev_t devt, char *buf) 4621f014290STejun Heo { 4631f014290STejun Heo if (MAJOR(devt) <= 0xff && MINOR(devt) <= 0xff) { 4641f014290STejun Heo char tbuf[BDEVT_SIZE]; 4651f014290STejun Heo snprintf(tbuf, BDEVT_SIZE, "%02x%02x", MAJOR(devt), MINOR(devt)); 4661f014290STejun Heo snprintf(buf, BDEVT_SIZE, "%-9s", tbuf); 4671f014290STejun Heo } else 4681f014290STejun Heo snprintf(buf, BDEVT_SIZE, "%03x:%05x", MAJOR(devt), MINOR(devt)); 4691f014290STejun Heo 4701f014290STejun Heo return buf; 4711f014290STejun Heo } 4721f014290STejun Heo 4731da177e4SLinus Torvalds /* 4741da177e4SLinus Torvalds * Register device numbers dev..(dev+range-1) 4751da177e4SLinus Torvalds * range must be nonzero 4761da177e4SLinus Torvalds * The hash chain is sorted on range, so that subranges can override. 4771da177e4SLinus Torvalds */ 478edfaa7c3SKay Sievers void blk_register_region(dev_t devt, unsigned long range, struct module *module, 4791da177e4SLinus Torvalds struct kobject *(*probe)(dev_t, int *, void *), 4801da177e4SLinus Torvalds int (*lock)(dev_t, void *), void *data) 4811da177e4SLinus Torvalds { 482edfaa7c3SKay Sievers kobj_map(bdev_map, devt, range, module, probe, lock, data); 4831da177e4SLinus Torvalds } 4841da177e4SLinus Torvalds 4851da177e4SLinus Torvalds EXPORT_SYMBOL(blk_register_region); 4861da177e4SLinus Torvalds 487edfaa7c3SKay Sievers void blk_unregister_region(dev_t devt, unsigned long range) 4881da177e4SLinus Torvalds { 489edfaa7c3SKay Sievers kobj_unmap(bdev_map, devt, range); 4901da177e4SLinus Torvalds } 4911da177e4SLinus Torvalds 4921da177e4SLinus Torvalds EXPORT_SYMBOL(blk_unregister_region); 4931da177e4SLinus Torvalds 494cf771cb5STejun Heo static struct kobject *exact_match(dev_t devt, int *partno, void *data) 4951da177e4SLinus Torvalds { 4961da177e4SLinus Torvalds struct gendisk *p = data; 497edfaa7c3SKay Sievers 498ed9e1982STejun Heo return &disk_to_dev(p)->kobj; 4991da177e4SLinus Torvalds } 5001da177e4SLinus Torvalds 501edfaa7c3SKay Sievers static int exact_lock(dev_t devt, void *data) 5021da177e4SLinus Torvalds { 5031da177e4SLinus Torvalds struct gendisk *p = data; 5041da177e4SLinus Torvalds 5051da177e4SLinus Torvalds if (!get_disk(p)) 5061da177e4SLinus Torvalds return -1; 5071da177e4SLinus Torvalds return 0; 5081da177e4SLinus Torvalds } 5091da177e4SLinus Torvalds 5104752bc30SAl Viro static void register_disk(struct gendisk *disk) 511d2bf1b67STejun Heo { 512d2bf1b67STejun Heo struct device *ddev = disk_to_dev(disk); 513d2bf1b67STejun Heo struct block_device *bdev; 514d2bf1b67STejun Heo struct disk_part_iter piter; 515d2bf1b67STejun Heo struct hd_struct *part; 516d2bf1b67STejun Heo int err; 517d2bf1b67STejun Heo 518d2bf1b67STejun Heo ddev->parent = disk->driverfs_dev; 519d2bf1b67STejun Heo 520d2bf1b67STejun Heo dev_set_name(ddev, disk->disk_name); 521d2bf1b67STejun Heo 522d2bf1b67STejun Heo /* delay uevents, until we scanned partition table */ 523d2bf1b67STejun Heo dev_set_uevent_suppress(ddev, 1); 524d2bf1b67STejun Heo 525d2bf1b67STejun Heo if (device_add(ddev)) 526d2bf1b67STejun Heo return; 527d2bf1b67STejun Heo if (!sysfs_deprecated) { 528d2bf1b67STejun Heo err = sysfs_create_link(block_depr, &ddev->kobj, 529d2bf1b67STejun Heo kobject_name(&ddev->kobj)); 530d2bf1b67STejun Heo if (err) { 531d2bf1b67STejun Heo device_del(ddev); 532d2bf1b67STejun Heo return; 533d2bf1b67STejun Heo } 534d2bf1b67STejun Heo } 535d2bf1b67STejun Heo disk->part0.holder_dir = kobject_create_and_add("holders", &ddev->kobj); 536d2bf1b67STejun Heo disk->slave_dir = kobject_create_and_add("slaves", &ddev->kobj); 537d2bf1b67STejun Heo 538d2bf1b67STejun Heo /* No minors to use for partitions */ 539d27769ecSTejun Heo if (!disk_part_scan_enabled(disk)) 540d2bf1b67STejun Heo goto exit; 541d2bf1b67STejun Heo 542d2bf1b67STejun Heo /* No such device (e.g., media were just removed) */ 543d2bf1b67STejun Heo if (!get_capacity(disk)) 544d2bf1b67STejun Heo goto exit; 545d2bf1b67STejun Heo 546d2bf1b67STejun Heo bdev = bdget_disk(disk, 0); 547d2bf1b67STejun Heo if (!bdev) 548d2bf1b67STejun Heo goto exit; 549d2bf1b67STejun Heo 550d2bf1b67STejun Heo bdev->bd_invalidated = 1; 551d2bf1b67STejun Heo err = blkdev_get(bdev, FMODE_READ, NULL); 552d2bf1b67STejun Heo if (err < 0) 553d2bf1b67STejun Heo goto exit; 554d2bf1b67STejun Heo blkdev_put(bdev, FMODE_READ); 555d2bf1b67STejun Heo 556d2bf1b67STejun Heo exit: 557d2bf1b67STejun Heo /* announce disk after possible partitions are created */ 558d2bf1b67STejun Heo dev_set_uevent_suppress(ddev, 0); 559d2bf1b67STejun Heo kobject_uevent(&ddev->kobj, KOBJ_ADD); 560d2bf1b67STejun Heo 561d2bf1b67STejun Heo /* announce possible partitions */ 562d2bf1b67STejun Heo disk_part_iter_init(&piter, disk, 0); 563d2bf1b67STejun Heo while ((part = disk_part_iter_next(&piter))) 564d2bf1b67STejun Heo kobject_uevent(&part_to_dev(part)->kobj, KOBJ_ADD); 565d2bf1b67STejun Heo disk_part_iter_exit(&piter); 566d2bf1b67STejun Heo } 567d2bf1b67STejun Heo 5681da177e4SLinus Torvalds /** 5691da177e4SLinus Torvalds * add_disk - add partitioning information to kernel list 5701da177e4SLinus Torvalds * @disk: per-device partitioning information 5711da177e4SLinus Torvalds * 5721da177e4SLinus Torvalds * This function registers the partitioning information in @disk 5731da177e4SLinus Torvalds * with the kernel. 5743e1a7ff8STejun Heo * 5753e1a7ff8STejun Heo * FIXME: error handling 5761da177e4SLinus Torvalds */ 5771da177e4SLinus Torvalds void add_disk(struct gendisk *disk) 5781da177e4SLinus Torvalds { 579cf0ca9feSPeter Zijlstra struct backing_dev_info *bdi; 5803e1a7ff8STejun Heo dev_t devt; 5816ffeea77SGreg Kroah-Hartman int retval; 582cf0ca9feSPeter Zijlstra 5833e1a7ff8STejun Heo /* minors == 0 indicates to use ext devt from part0 and should 5843e1a7ff8STejun Heo * be accompanied with EXT_DEVT flag. Make sure all 5853e1a7ff8STejun Heo * parameters make sense. 5863e1a7ff8STejun Heo */ 5873e1a7ff8STejun Heo WARN_ON(disk->minors && !(disk->major || disk->first_minor)); 5883e1a7ff8STejun Heo WARN_ON(!disk->minors && !(disk->flags & GENHD_FL_EXT_DEVT)); 5893e1a7ff8STejun Heo 5901da177e4SLinus Torvalds disk->flags |= GENHD_FL_UP; 5913e1a7ff8STejun Heo 5923e1a7ff8STejun Heo retval = blk_alloc_devt(&disk->part0, &devt); 5933e1a7ff8STejun Heo if (retval) { 5943e1a7ff8STejun Heo WARN_ON(1); 5953e1a7ff8STejun Heo return; 5963e1a7ff8STejun Heo } 5973e1a7ff8STejun Heo disk_to_dev(disk)->devt = devt; 5983e1a7ff8STejun Heo 5993e1a7ff8STejun Heo /* ->major and ->first_minor aren't supposed to be 6003e1a7ff8STejun Heo * dereferenced from here on, but set them just in case. 6013e1a7ff8STejun Heo */ 6023e1a7ff8STejun Heo disk->major = MAJOR(devt); 6033e1a7ff8STejun Heo disk->first_minor = MINOR(devt); 6043e1a7ff8STejun Heo 6059f53d2feSStanislaw Gruszka disk_alloc_events(disk); 6069f53d2feSStanislaw Gruszka 60701ea5063SSigned-off-by: Jan Kara /* Register BDI before referencing it from bdev */ 60801ea5063SSigned-off-by: Jan Kara bdi = &disk->queue->backing_dev_info; 60901ea5063SSigned-off-by: Jan Kara bdi_register_dev(bdi, disk_devt(disk)); 61001ea5063SSigned-off-by: Jan Kara 611f331c029STejun Heo blk_register_region(disk_devt(disk), disk->minors, NULL, 612f331c029STejun Heo exact_match, exact_lock, disk); 6131da177e4SLinus Torvalds register_disk(disk); 6141da177e4SLinus Torvalds blk_register_queue(disk); 615cf0ca9feSPeter Zijlstra 616523e1d39STejun Heo /* 617523e1d39STejun Heo * Take an extra ref on queue which will be put on disk_release() 618523e1d39STejun Heo * so that it sticks around as long as @disk is there. 619523e1d39STejun Heo */ 62009ac46c4STejun Heo WARN_ON_ONCE(!blk_get_queue(disk->queue)); 621523e1d39STejun Heo 622ed9e1982STejun Heo retval = sysfs_create_link(&disk_to_dev(disk)->kobj, &bdi->dev->kobj, 623ed9e1982STejun Heo "bdi"); 6246ffeea77SGreg Kroah-Hartman WARN_ON(retval); 62577ea887eSTejun Heo 62677ea887eSTejun Heo disk_add_events(disk); 6271da177e4SLinus Torvalds } 6281da177e4SLinus Torvalds EXPORT_SYMBOL(add_disk); 6291da177e4SLinus Torvalds 630d2bf1b67STejun Heo void del_gendisk(struct gendisk *disk) 6311da177e4SLinus Torvalds { 632d2bf1b67STejun Heo struct disk_part_iter piter; 633d2bf1b67STejun Heo struct hd_struct *part; 634d2bf1b67STejun Heo 63577ea887eSTejun Heo disk_del_events(disk); 63677ea887eSTejun Heo 637d2bf1b67STejun Heo /* invalidate stuff */ 638d2bf1b67STejun Heo disk_part_iter_init(&piter, disk, 639d2bf1b67STejun Heo DISK_PITER_INCL_EMPTY | DISK_PITER_REVERSE); 640d2bf1b67STejun Heo while ((part = disk_part_iter_next(&piter))) { 641d2bf1b67STejun Heo invalidate_partition(disk, part->partno); 642d2bf1b67STejun Heo delete_partition(disk, part->partno); 643d2bf1b67STejun Heo } 644d2bf1b67STejun Heo disk_part_iter_exit(&piter); 645d2bf1b67STejun Heo 646d2bf1b67STejun Heo invalidate_partition(disk, 0); 647d2bf1b67STejun Heo blk_free_devt(disk_to_dev(disk)->devt); 648d2bf1b67STejun Heo set_capacity(disk, 0); 649d2bf1b67STejun Heo disk->flags &= ~GENHD_FL_UP; 650d2bf1b67STejun Heo 651ed9e1982STejun Heo sysfs_remove_link(&disk_to_dev(disk)->kobj, "bdi"); 652cf0ca9feSPeter Zijlstra bdi_unregister(&disk->queue->backing_dev_info); 6531da177e4SLinus Torvalds blk_unregister_queue(disk); 654f331c029STejun Heo blk_unregister_region(disk_devt(disk), disk->minors); 655d2bf1b67STejun Heo 656d2bf1b67STejun Heo part_stat_set_all(&disk->part0, 0); 657d2bf1b67STejun Heo disk->part0.stamp = 0; 658d2bf1b67STejun Heo 659d2bf1b67STejun Heo kobject_put(disk->part0.holder_dir); 660d2bf1b67STejun Heo kobject_put(disk->slave_dir); 661d2bf1b67STejun Heo disk->driverfs_dev = NULL; 662d2bf1b67STejun Heo if (!sysfs_deprecated) 663d2bf1b67STejun Heo sysfs_remove_link(block_depr, dev_name(disk_to_dev(disk))); 664d2bf1b67STejun Heo device_del(disk_to_dev(disk)); 6651da177e4SLinus Torvalds } 666d2bf1b67STejun Heo EXPORT_SYMBOL(del_gendisk); 6671da177e4SLinus Torvalds 6681da177e4SLinus Torvalds /** 6691da177e4SLinus Torvalds * get_gendisk - get partitioning information for a given device 670710027a4SRandy Dunlap * @devt: device to get partitioning information for 671496aa8a9SRandy Dunlap * @partno: returned partition index 6721da177e4SLinus Torvalds * 6731da177e4SLinus Torvalds * This function gets the structure containing partitioning 674710027a4SRandy Dunlap * information for the given device @devt. 6751da177e4SLinus Torvalds */ 676cf771cb5STejun Heo struct gendisk *get_gendisk(dev_t devt, int *partno) 6771da177e4SLinus Torvalds { 678bcce3de1STejun Heo struct gendisk *disk = NULL; 679edfaa7c3SKay Sievers 680bcce3de1STejun Heo if (MAJOR(devt) != BLOCK_EXT_MAJOR) { 681bcce3de1STejun Heo struct kobject *kobj; 682bcce3de1STejun Heo 683bcce3de1STejun Heo kobj = kobj_lookup(bdev_map, devt, partno); 684bcce3de1STejun Heo if (kobj) 685bcce3de1STejun Heo disk = dev_to_disk(kobj_to_dev(kobj)); 686bcce3de1STejun Heo } else { 687bcce3de1STejun Heo struct hd_struct *part; 688bcce3de1STejun Heo 689bcce3de1STejun Heo mutex_lock(&ext_devt_mutex); 690870d6656STejun Heo part = idr_find(&ext_devt_idr, blk_mangle_minor(MINOR(devt))); 691bcce3de1STejun Heo if (part && get_disk(part_to_disk(part))) { 692bcce3de1STejun Heo *partno = part->partno; 693bcce3de1STejun Heo disk = part_to_disk(part); 694bcce3de1STejun Heo } 695bcce3de1STejun Heo mutex_unlock(&ext_devt_mutex); 696bcce3de1STejun Heo } 697bcce3de1STejun Heo 698bcce3de1STejun Heo return disk; 6991da177e4SLinus Torvalds } 700b6ac23afSDivyesh Shah EXPORT_SYMBOL(get_gendisk); 7011da177e4SLinus Torvalds 702f331c029STejun Heo /** 703f331c029STejun Heo * bdget_disk - do bdget() by gendisk and partition number 704f331c029STejun Heo * @disk: gendisk of interest 705f331c029STejun Heo * @partno: partition number 706f331c029STejun Heo * 707f331c029STejun Heo * Find partition @partno from @disk, do bdget() on it. 708f331c029STejun Heo * 709f331c029STejun Heo * CONTEXT: 710f331c029STejun Heo * Don't care. 711f331c029STejun Heo * 712f331c029STejun Heo * RETURNS: 713f331c029STejun Heo * Resulting block_device on success, NULL on failure. 714f331c029STejun Heo */ 715aeb3d3a8SHarvey Harrison struct block_device *bdget_disk(struct gendisk *disk, int partno) 716f331c029STejun Heo { 717e71bf0d0STejun Heo struct hd_struct *part; 718548b10ebSTejun Heo struct block_device *bdev = NULL; 719f331c029STejun Heo 720e71bf0d0STejun Heo part = disk_get_part(disk, partno); 7212bbedcb4STejun Heo if (part) 722548b10ebSTejun Heo bdev = bdget(part_devt(part)); 723e71bf0d0STejun Heo disk_put_part(part); 724f331c029STejun Heo 725548b10ebSTejun Heo return bdev; 726f331c029STejun Heo } 727f331c029STejun Heo EXPORT_SYMBOL(bdget_disk); 728f331c029STejun Heo 729dd2a345fSDave Gilbert /* 7305c6f35c5SGreg Kroah-Hartman * print a full list of all partitions - intended for places where the root 7315c6f35c5SGreg Kroah-Hartman * filesystem can't be mounted and thus to give the victim some idea of what 7325c6f35c5SGreg Kroah-Hartman * went wrong 7335c6f35c5SGreg Kroah-Hartman */ 7345c6f35c5SGreg Kroah-Hartman void __init printk_all_partitions(void) 7355c6f35c5SGreg Kroah-Hartman { 736def4e38dSTejun Heo struct class_dev_iter iter; 737def4e38dSTejun Heo struct device *dev; 738def4e38dSTejun Heo 739def4e38dSTejun Heo class_dev_iter_init(&iter, &block_class, NULL, &disk_type); 740def4e38dSTejun Heo while ((dev = class_dev_iter_next(&iter))) { 741def4e38dSTejun Heo struct gendisk *disk = dev_to_disk(dev); 742e71bf0d0STejun Heo struct disk_part_iter piter; 743e71bf0d0STejun Heo struct hd_struct *part; 7441f014290STejun Heo char name_buf[BDEVNAME_SIZE]; 7451f014290STejun Heo char devt_buf[BDEVT_SIZE]; 74605c69d29STejun Heo char uuid_buf[PARTITION_META_INFO_UUIDLTH * 2 + 5]; 747def4e38dSTejun Heo 748def4e38dSTejun Heo /* 749def4e38dSTejun Heo * Don't show empty devices or things that have been 75025985edcSLucas De Marchi * suppressed 751def4e38dSTejun Heo */ 752def4e38dSTejun Heo if (get_capacity(disk) == 0 || 753def4e38dSTejun Heo (disk->flags & GENHD_FL_SUPPRESS_PARTITION_INFO)) 754def4e38dSTejun Heo continue; 755def4e38dSTejun Heo 756def4e38dSTejun Heo /* 757def4e38dSTejun Heo * Note, unlike /proc/partitions, I am showing the 758def4e38dSTejun Heo * numbers in hex - the same format as the root= 759def4e38dSTejun Heo * option takes. 760def4e38dSTejun Heo */ 761074a7acaSTejun Heo disk_part_iter_init(&piter, disk, DISK_PITER_INCL_PART0); 762074a7acaSTejun Heo while ((part = disk_part_iter_next(&piter))) { 763074a7acaSTejun Heo bool is_part0 = part == &disk->part0; 764074a7acaSTejun Heo 76505c69d29STejun Heo uuid_buf[0] = '\0'; 766b5af921eSWill Drewry if (part->info) 76705c69d29STejun Heo snprintf(uuid_buf, sizeof(uuid_buf), "%pU", 76805c69d29STejun Heo part->info->uuid); 769b5af921eSWill Drewry 770b5af921eSWill Drewry printk("%s%s %10llu %s %s", is_part0 ? "" : " ", 771074a7acaSTejun Heo bdevt_str(part_devt(part), devt_buf), 772c83f6bf9SVivek Goyal (unsigned long long)part_nr_sects_read(part) >> 1 773c83f6bf9SVivek Goyal , disk_name(disk, part->partno, name_buf), 77405c69d29STejun Heo uuid_buf); 775074a7acaSTejun Heo if (is_part0) { 776def4e38dSTejun Heo if (disk->driverfs_dev != NULL && 777def4e38dSTejun Heo disk->driverfs_dev->driver != NULL) 778def4e38dSTejun Heo printk(" driver: %s\n", 779def4e38dSTejun Heo disk->driverfs_dev->driver->name); 780def4e38dSTejun Heo else 781def4e38dSTejun Heo printk(" (driver?)\n"); 782074a7acaSTejun Heo } else 783074a7acaSTejun Heo printk("\n"); 784074a7acaSTejun Heo } 785e71bf0d0STejun Heo disk_part_iter_exit(&piter); 786def4e38dSTejun Heo } 787def4e38dSTejun Heo class_dev_iter_exit(&iter); 788dd2a345fSDave Gilbert } 789dd2a345fSDave Gilbert 7901da177e4SLinus Torvalds #ifdef CONFIG_PROC_FS 7911da177e4SLinus Torvalds /* iterator */ 792def4e38dSTejun Heo static void *disk_seqf_start(struct seq_file *seqf, loff_t *pos) 79368c4d4a7SGreg Kroah-Hartman { 794def4e38dSTejun Heo loff_t skip = *pos; 795def4e38dSTejun Heo struct class_dev_iter *iter; 796def4e38dSTejun Heo struct device *dev; 79768c4d4a7SGreg Kroah-Hartman 798aeb3d3a8SHarvey Harrison iter = kmalloc(sizeof(*iter), GFP_KERNEL); 799def4e38dSTejun Heo if (!iter) 800def4e38dSTejun Heo return ERR_PTR(-ENOMEM); 801def4e38dSTejun Heo 802def4e38dSTejun Heo seqf->private = iter; 803def4e38dSTejun Heo class_dev_iter_init(iter, &block_class, NULL, &disk_type); 804def4e38dSTejun Heo do { 805def4e38dSTejun Heo dev = class_dev_iter_next(iter); 806def4e38dSTejun Heo if (!dev) 807def4e38dSTejun Heo return NULL; 808def4e38dSTejun Heo } while (skip--); 809def4e38dSTejun Heo 810def4e38dSTejun Heo return dev_to_disk(dev); 81168c4d4a7SGreg Kroah-Hartman } 81268c4d4a7SGreg Kroah-Hartman 813def4e38dSTejun Heo static void *disk_seqf_next(struct seq_file *seqf, void *v, loff_t *pos) 8141da177e4SLinus Torvalds { 815edfaa7c3SKay Sievers struct device *dev; 81666c64afeSGreg Kroah-Hartman 817def4e38dSTejun Heo (*pos)++; 818def4e38dSTejun Heo dev = class_dev_iter_next(seqf->private); 8192ac3cee5STejun Heo if (dev) 820edfaa7c3SKay Sievers return dev_to_disk(dev); 8212ac3cee5STejun Heo 8221da177e4SLinus Torvalds return NULL; 8231da177e4SLinus Torvalds } 8241da177e4SLinus Torvalds 825def4e38dSTejun Heo static void disk_seqf_stop(struct seq_file *seqf, void *v) 82627f30251SGreg Kroah-Hartman { 827def4e38dSTejun Heo struct class_dev_iter *iter = seqf->private; 828def4e38dSTejun Heo 829def4e38dSTejun Heo /* stop is called even after start failed :-( */ 830def4e38dSTejun Heo if (iter) { 831def4e38dSTejun Heo class_dev_iter_exit(iter); 832def4e38dSTejun Heo kfree(iter); 833def4e38dSTejun Heo } 83427f30251SGreg Kroah-Hartman } 83527f30251SGreg Kroah-Hartman 836def4e38dSTejun Heo static void *show_partition_start(struct seq_file *seqf, loff_t *pos) 8371da177e4SLinus Torvalds { 83806768067SJianpeng Ma void *p; 8391da177e4SLinus Torvalds 840def4e38dSTejun Heo p = disk_seqf_start(seqf, pos); 841b9f985b6SYang Zhang if (!IS_ERR_OR_NULL(p) && !*pos) 842def4e38dSTejun Heo seq_puts(seqf, "major minor #blocks name\n\n"); 843def4e38dSTejun Heo return p; 8441da177e4SLinus Torvalds } 8451da177e4SLinus Torvalds 846cf771cb5STejun Heo static int show_partition(struct seq_file *seqf, void *v) 8471da177e4SLinus Torvalds { 8481da177e4SLinus Torvalds struct gendisk *sgp = v; 849e71bf0d0STejun Heo struct disk_part_iter piter; 850e71bf0d0STejun Heo struct hd_struct *part; 8511da177e4SLinus Torvalds char buf[BDEVNAME_SIZE]; 8521da177e4SLinus Torvalds 8531da177e4SLinus Torvalds /* Don't show non-partitionable removeable devices or empty devices */ 854d27769ecSTejun Heo if (!get_capacity(sgp) || (!disk_max_parts(sgp) && 855f331c029STejun Heo (sgp->flags & GENHD_FL_REMOVABLE))) 8561da177e4SLinus Torvalds return 0; 8571da177e4SLinus Torvalds if (sgp->flags & GENHD_FL_SUPPRESS_PARTITION_INFO) 8581da177e4SLinus Torvalds return 0; 8591da177e4SLinus Torvalds 8601da177e4SLinus Torvalds /* show the full disk and all non-0 size partitions of it */ 861074a7acaSTejun Heo disk_part_iter_init(&piter, sgp, DISK_PITER_INCL_PART0); 862e71bf0d0STejun Heo while ((part = disk_part_iter_next(&piter))) 8631f014290STejun Heo seq_printf(seqf, "%4d %7d %10llu %s\n", 864f331c029STejun Heo MAJOR(part_devt(part)), MINOR(part_devt(part)), 865c83f6bf9SVivek Goyal (unsigned long long)part_nr_sects_read(part) >> 1, 866f331c029STejun Heo disk_name(sgp, part->partno, buf)); 867e71bf0d0STejun Heo disk_part_iter_exit(&piter); 8681da177e4SLinus Torvalds 8691da177e4SLinus Torvalds return 0; 8701da177e4SLinus Torvalds } 8711da177e4SLinus Torvalds 872f500975aSAlexey Dobriyan static const struct seq_operations partitions_op = { 873def4e38dSTejun Heo .start = show_partition_start, 874def4e38dSTejun Heo .next = disk_seqf_next, 875def4e38dSTejun Heo .stop = disk_seqf_stop, 8761da177e4SLinus Torvalds .show = show_partition 8771da177e4SLinus Torvalds }; 878f500975aSAlexey Dobriyan 879f500975aSAlexey Dobriyan static int partitions_open(struct inode *inode, struct file *file) 880f500975aSAlexey Dobriyan { 881f500975aSAlexey Dobriyan return seq_open(file, &partitions_op); 882f500975aSAlexey Dobriyan } 883f500975aSAlexey Dobriyan 884f500975aSAlexey Dobriyan static const struct file_operations proc_partitions_operations = { 885f500975aSAlexey Dobriyan .open = partitions_open, 886f500975aSAlexey Dobriyan .read = seq_read, 887f500975aSAlexey Dobriyan .llseek = seq_lseek, 888f500975aSAlexey Dobriyan .release = seq_release, 889f500975aSAlexey Dobriyan }; 8901da177e4SLinus Torvalds #endif 8911da177e4SLinus Torvalds 8921da177e4SLinus Torvalds 893cf771cb5STejun Heo static struct kobject *base_probe(dev_t devt, int *partno, void *data) 8941da177e4SLinus Torvalds { 895edfaa7c3SKay Sievers if (request_module("block-major-%d-%d", MAJOR(devt), MINOR(devt)) > 0) 8961da177e4SLinus Torvalds /* Make old-style 2.4 aliases work */ 897edfaa7c3SKay Sievers request_module("block-major-%d", MAJOR(devt)); 8981da177e4SLinus Torvalds return NULL; 8991da177e4SLinus Torvalds } 9001da177e4SLinus Torvalds 9011da177e4SLinus Torvalds static int __init genhd_device_init(void) 9021da177e4SLinus Torvalds { 903e105b8bfSDan Williams int error; 904e105b8bfSDan Williams 905e105b8bfSDan Williams block_class.dev_kobj = sysfs_dev_block_kobj; 906e105b8bfSDan Williams error = class_register(&block_class); 907ee27a558SRoland McGrath if (unlikely(error)) 908ee27a558SRoland McGrath return error; 909edfaa7c3SKay Sievers bdev_map = kobj_map_init(base_probe, &block_class_lock); 9101da177e4SLinus Torvalds blk_dev_init(); 911edfaa7c3SKay Sievers 912561ec68eSZhang, Yanmin register_blkdev(BLOCK_EXT_MAJOR, "blkext"); 913561ec68eSZhang, Yanmin 914edfaa7c3SKay Sievers /* create top-level block dir */ 915e52eec13SAndi Kleen if (!sysfs_deprecated) 916edfaa7c3SKay Sievers block_depr = kobject_create_and_add("block", NULL); 917830d3cfbSGreg Kroah-Hartman return 0; 9181da177e4SLinus Torvalds } 9191da177e4SLinus Torvalds 9201da177e4SLinus Torvalds subsys_initcall(genhd_device_init); 9211da177e4SLinus Torvalds 922edfaa7c3SKay Sievers static ssize_t disk_range_show(struct device *dev, 923edfaa7c3SKay Sievers struct device_attribute *attr, char *buf) 9241da177e4SLinus Torvalds { 925edfaa7c3SKay Sievers struct gendisk *disk = dev_to_disk(dev); 9261da177e4SLinus Torvalds 927edfaa7c3SKay Sievers return sprintf(buf, "%d\n", disk->minors); 9281da177e4SLinus Torvalds } 9291da177e4SLinus Torvalds 9301f014290STejun Heo static ssize_t disk_ext_range_show(struct device *dev, 9311f014290STejun Heo struct device_attribute *attr, char *buf) 9321f014290STejun Heo { 9331f014290STejun Heo struct gendisk *disk = dev_to_disk(dev); 9341f014290STejun Heo 935b5d0b9dfSTejun Heo return sprintf(buf, "%d\n", disk_max_parts(disk)); 9361f014290STejun Heo } 9371f014290STejun Heo 938edfaa7c3SKay Sievers static ssize_t disk_removable_show(struct device *dev, 939edfaa7c3SKay Sievers struct device_attribute *attr, char *buf) 940a7fd6706SKay Sievers { 941edfaa7c3SKay Sievers struct gendisk *disk = dev_to_disk(dev); 942a7fd6706SKay Sievers 943edfaa7c3SKay Sievers return sprintf(buf, "%d\n", 9441da177e4SLinus Torvalds (disk->flags & GENHD_FL_REMOVABLE ? 1 : 0)); 945edfaa7c3SKay Sievers } 9461da177e4SLinus Torvalds 9471c9ce527SKay Sievers static ssize_t disk_ro_show(struct device *dev, 9481c9ce527SKay Sievers struct device_attribute *attr, char *buf) 9491c9ce527SKay Sievers { 9501c9ce527SKay Sievers struct gendisk *disk = dev_to_disk(dev); 9511c9ce527SKay Sievers 952b7db9956STejun Heo return sprintf(buf, "%d\n", get_disk_ro(disk) ? 1 : 0); 9531c9ce527SKay Sievers } 9541c9ce527SKay Sievers 955edfaa7c3SKay Sievers static ssize_t disk_capability_show(struct device *dev, 956edfaa7c3SKay Sievers struct device_attribute *attr, char *buf) 95786ce18d7SKristen Carlson Accardi { 958edfaa7c3SKay Sievers struct gendisk *disk = dev_to_disk(dev); 959edfaa7c3SKay Sievers 960edfaa7c3SKay Sievers return sprintf(buf, "%x\n", disk->flags); 96186ce18d7SKristen Carlson Accardi } 962edfaa7c3SKay Sievers 963c72758f3SMartin K. Petersen static ssize_t disk_alignment_offset_show(struct device *dev, 964c72758f3SMartin K. Petersen struct device_attribute *attr, 965c72758f3SMartin K. Petersen char *buf) 966c72758f3SMartin K. Petersen { 967c72758f3SMartin K. Petersen struct gendisk *disk = dev_to_disk(dev); 968c72758f3SMartin K. Petersen 969c72758f3SMartin K. Petersen return sprintf(buf, "%d\n", queue_alignment_offset(disk->queue)); 970c72758f3SMartin K. Petersen } 971c72758f3SMartin K. Petersen 97286b37281SMartin K. Petersen static ssize_t disk_discard_alignment_show(struct device *dev, 97386b37281SMartin K. Petersen struct device_attribute *attr, 97486b37281SMartin K. Petersen char *buf) 97586b37281SMartin K. Petersen { 97686b37281SMartin K. Petersen struct gendisk *disk = dev_to_disk(dev); 97786b37281SMartin K. Petersen 978dd3d145dSMartin K. Petersen return sprintf(buf, "%d\n", queue_discard_alignment(disk->queue)); 97986b37281SMartin K. Petersen } 98086b37281SMartin K. Petersen 981edfaa7c3SKay Sievers static DEVICE_ATTR(range, S_IRUGO, disk_range_show, NULL); 9821f014290STejun Heo static DEVICE_ATTR(ext_range, S_IRUGO, disk_ext_range_show, NULL); 983edfaa7c3SKay Sievers static DEVICE_ATTR(removable, S_IRUGO, disk_removable_show, NULL); 9841c9ce527SKay Sievers static DEVICE_ATTR(ro, S_IRUGO, disk_ro_show, NULL); 985e5610521STejun Heo static DEVICE_ATTR(size, S_IRUGO, part_size_show, NULL); 986c72758f3SMartin K. Petersen static DEVICE_ATTR(alignment_offset, S_IRUGO, disk_alignment_offset_show, NULL); 98786b37281SMartin K. Petersen static DEVICE_ATTR(discard_alignment, S_IRUGO, disk_discard_alignment_show, 98886b37281SMartin K. Petersen NULL); 989edfaa7c3SKay Sievers static DEVICE_ATTR(capability, S_IRUGO, disk_capability_show, NULL); 990074a7acaSTejun Heo static DEVICE_ATTR(stat, S_IRUGO, part_stat_show, NULL); 991316d315bSNikanth Karthikesan static DEVICE_ATTR(inflight, S_IRUGO, part_inflight_show, NULL); 992c17bb495SAkinobu Mita #ifdef CONFIG_FAIL_MAKE_REQUEST 993edfaa7c3SKay Sievers static struct device_attribute dev_attr_fail = 994eddb2e26STejun Heo __ATTR(make-it-fail, S_IRUGO|S_IWUSR, part_fail_show, part_fail_store); 995c17bb495SAkinobu Mita #endif 996581d4e28SJens Axboe #ifdef CONFIG_FAIL_IO_TIMEOUT 997581d4e28SJens Axboe static struct device_attribute dev_attr_fail_timeout = 998581d4e28SJens Axboe __ATTR(io-timeout-fail, S_IRUGO|S_IWUSR, part_timeout_show, 999581d4e28SJens Axboe part_timeout_store); 1000581d4e28SJens Axboe #endif 1001edfaa7c3SKay Sievers 1002edfaa7c3SKay Sievers static struct attribute *disk_attrs[] = { 1003edfaa7c3SKay Sievers &dev_attr_range.attr, 10041f014290STejun Heo &dev_attr_ext_range.attr, 1005edfaa7c3SKay Sievers &dev_attr_removable.attr, 10061c9ce527SKay Sievers &dev_attr_ro.attr, 1007edfaa7c3SKay Sievers &dev_attr_size.attr, 1008c72758f3SMartin K. Petersen &dev_attr_alignment_offset.attr, 100986b37281SMartin K. Petersen &dev_attr_discard_alignment.attr, 1010edfaa7c3SKay Sievers &dev_attr_capability.attr, 1011edfaa7c3SKay Sievers &dev_attr_stat.attr, 1012316d315bSNikanth Karthikesan &dev_attr_inflight.attr, 1013edfaa7c3SKay Sievers #ifdef CONFIG_FAIL_MAKE_REQUEST 1014edfaa7c3SKay Sievers &dev_attr_fail.attr, 1015edfaa7c3SKay Sievers #endif 1016581d4e28SJens Axboe #ifdef CONFIG_FAIL_IO_TIMEOUT 1017581d4e28SJens Axboe &dev_attr_fail_timeout.attr, 1018581d4e28SJens Axboe #endif 1019edfaa7c3SKay Sievers NULL 10201da177e4SLinus Torvalds }; 10211da177e4SLinus Torvalds 1022edfaa7c3SKay Sievers static struct attribute_group disk_attr_group = { 1023edfaa7c3SKay Sievers .attrs = disk_attrs, 1024edfaa7c3SKay Sievers }; 1025edfaa7c3SKay Sievers 1026a4dbd674SDavid Brownell static const struct attribute_group *disk_attr_groups[] = { 1027edfaa7c3SKay Sievers &disk_attr_group, 1028edfaa7c3SKay Sievers NULL 1029edfaa7c3SKay Sievers }; 1030edfaa7c3SKay Sievers 1031540eed56STejun Heo /** 1032540eed56STejun Heo * disk_replace_part_tbl - replace disk->part_tbl in RCU-safe way 1033540eed56STejun Heo * @disk: disk to replace part_tbl for 1034540eed56STejun Heo * @new_ptbl: new part_tbl to install 1035540eed56STejun Heo * 1036540eed56STejun Heo * Replace disk->part_tbl with @new_ptbl in RCU-safe way. The 1037540eed56STejun Heo * original ptbl is freed using RCU callback. 1038540eed56STejun Heo * 1039540eed56STejun Heo * LOCKING: 1040540eed56STejun Heo * Matching bd_mutx locked. 1041540eed56STejun Heo */ 1042540eed56STejun Heo static void disk_replace_part_tbl(struct gendisk *disk, 1043540eed56STejun Heo struct disk_part_tbl *new_ptbl) 1044540eed56STejun Heo { 1045540eed56STejun Heo struct disk_part_tbl *old_ptbl = disk->part_tbl; 1046540eed56STejun Heo 1047540eed56STejun Heo rcu_assign_pointer(disk->part_tbl, new_ptbl); 1048a6f23657SJens Axboe 1049a6f23657SJens Axboe if (old_ptbl) { 1050a6f23657SJens Axboe rcu_assign_pointer(old_ptbl->last_lookup, NULL); 105157bdfbf9SLai Jiangshan kfree_rcu(old_ptbl, rcu_head); 1052540eed56STejun Heo } 1053a6f23657SJens Axboe } 1054540eed56STejun Heo 1055540eed56STejun Heo /** 1056540eed56STejun Heo * disk_expand_part_tbl - expand disk->part_tbl 1057540eed56STejun Heo * @disk: disk to expand part_tbl for 1058540eed56STejun Heo * @partno: expand such that this partno can fit in 1059540eed56STejun Heo * 1060540eed56STejun Heo * Expand disk->part_tbl such that @partno can fit in. disk->part_tbl 1061540eed56STejun Heo * uses RCU to allow unlocked dereferencing for stats and other stuff. 1062540eed56STejun Heo * 1063540eed56STejun Heo * LOCKING: 1064540eed56STejun Heo * Matching bd_mutex locked, might sleep. 1065540eed56STejun Heo * 1066540eed56STejun Heo * RETURNS: 1067540eed56STejun Heo * 0 on success, -errno on failure. 1068540eed56STejun Heo */ 1069540eed56STejun Heo int disk_expand_part_tbl(struct gendisk *disk, int partno) 1070540eed56STejun Heo { 1071540eed56STejun Heo struct disk_part_tbl *old_ptbl = disk->part_tbl; 1072540eed56STejun Heo struct disk_part_tbl *new_ptbl; 1073540eed56STejun Heo int len = old_ptbl ? old_ptbl->len : 0; 1074540eed56STejun Heo int target = partno + 1; 1075540eed56STejun Heo size_t size; 1076540eed56STejun Heo int i; 1077540eed56STejun Heo 1078540eed56STejun Heo /* disk_max_parts() is zero during initialization, ignore if so */ 1079540eed56STejun Heo if (disk_max_parts(disk) && target > disk_max_parts(disk)) 1080540eed56STejun Heo return -EINVAL; 1081540eed56STejun Heo 1082540eed56STejun Heo if (target <= len) 1083540eed56STejun Heo return 0; 1084540eed56STejun Heo 1085540eed56STejun Heo size = sizeof(*new_ptbl) + target * sizeof(new_ptbl->part[0]); 1086540eed56STejun Heo new_ptbl = kzalloc_node(size, GFP_KERNEL, disk->node_id); 1087540eed56STejun Heo if (!new_ptbl) 1088540eed56STejun Heo return -ENOMEM; 1089540eed56STejun Heo 1090540eed56STejun Heo new_ptbl->len = target; 1091540eed56STejun Heo 1092540eed56STejun Heo for (i = 0; i < len; i++) 1093540eed56STejun Heo rcu_assign_pointer(new_ptbl->part[i], old_ptbl->part[i]); 1094540eed56STejun Heo 1095540eed56STejun Heo disk_replace_part_tbl(disk, new_ptbl); 1096540eed56STejun Heo return 0; 1097540eed56STejun Heo } 1098540eed56STejun Heo 1099edfaa7c3SKay Sievers static void disk_release(struct device *dev) 11001da177e4SLinus Torvalds { 1101edfaa7c3SKay Sievers struct gendisk *disk = dev_to_disk(dev); 1102edfaa7c3SKay Sievers 110377ea887eSTejun Heo disk_release_events(disk); 11041da177e4SLinus Torvalds kfree(disk->random); 1105540eed56STejun Heo disk_replace_part_tbl(disk, NULL); 1106074a7acaSTejun Heo free_part_stats(&disk->part0); 11076d1d8050SWill Drewry free_part_info(&disk->part0); 1108523e1d39STejun Heo if (disk->queue) 1109523e1d39STejun Heo blk_put_queue(disk->queue); 11101da177e4SLinus Torvalds kfree(disk); 11111da177e4SLinus Torvalds } 1112edfaa7c3SKay Sievers struct class block_class = { 1113edfaa7c3SKay Sievers .name = "block", 11141da177e4SLinus Torvalds }; 11151da177e4SLinus Torvalds 11162c9ede55SAl Viro static char *block_devnode(struct device *dev, umode_t *mode) 1117b03f38b6SKay Sievers { 1118b03f38b6SKay Sievers struct gendisk *disk = dev_to_disk(dev); 1119b03f38b6SKay Sievers 1120e454cea2SKay Sievers if (disk->devnode) 1121e454cea2SKay Sievers return disk->devnode(disk, mode); 1122b03f38b6SKay Sievers return NULL; 1123b03f38b6SKay Sievers } 1124b03f38b6SKay Sievers 11251826eadfSAdrian Bunk static struct device_type disk_type = { 1126edfaa7c3SKay Sievers .name = "disk", 1127edfaa7c3SKay Sievers .groups = disk_attr_groups, 1128edfaa7c3SKay Sievers .release = disk_release, 1129e454cea2SKay Sievers .devnode = block_devnode, 11301da177e4SLinus Torvalds }; 11311da177e4SLinus Torvalds 1132a6e2ba88SRandy Dunlap #ifdef CONFIG_PROC_FS 1133cf771cb5STejun Heo /* 1134cf771cb5STejun Heo * aggregate disk stat collector. Uses the same stats that the sysfs 1135cf771cb5STejun Heo * entries do, above, but makes them available through one seq_file. 1136cf771cb5STejun Heo * 1137cf771cb5STejun Heo * The output looks suspiciously like /proc/partitions with a bunch of 1138cf771cb5STejun Heo * extra fields. 1139cf771cb5STejun Heo */ 1140cf771cb5STejun Heo static int diskstats_show(struct seq_file *seqf, void *v) 11411da177e4SLinus Torvalds { 11421da177e4SLinus Torvalds struct gendisk *gp = v; 1143e71bf0d0STejun Heo struct disk_part_iter piter; 1144e71bf0d0STejun Heo struct hd_struct *hd; 11451da177e4SLinus Torvalds char buf[BDEVNAME_SIZE]; 1146c9959059STejun Heo int cpu; 11471da177e4SLinus Torvalds 11481da177e4SLinus Torvalds /* 1149ed9e1982STejun Heo if (&disk_to_dev(gp)->kobj.entry == block_class.devices.next) 1150cf771cb5STejun Heo seq_puts(seqf, "major minor name" 11511da177e4SLinus Torvalds " rio rmerge rsect ruse wio wmerge " 11521da177e4SLinus Torvalds "wsect wuse running use aveq" 11531da177e4SLinus Torvalds "\n\n"); 11541da177e4SLinus Torvalds */ 11551da177e4SLinus Torvalds 115671982a40STejun Heo disk_part_iter_init(&piter, gp, DISK_PITER_INCL_EMPTY_PART0); 1157e71bf0d0STejun Heo while ((hd = disk_part_iter_next(&piter))) { 1158074a7acaSTejun Heo cpu = part_stat_lock(); 1159c9959059STejun Heo part_round_stats(cpu, hd); 1160074a7acaSTejun Heo part_stat_unlock(); 1161f95fe9cfSHerbert Poetzl seq_printf(seqf, "%4d %7d %s %lu %lu %lu " 1162f95fe9cfSHerbert Poetzl "%u %lu %lu %lu %u %u %u %u\n", 1163f331c029STejun Heo MAJOR(part_devt(hd)), MINOR(part_devt(hd)), 1164f331c029STejun Heo disk_name(gp, hd->partno, buf), 116553f22956SLiu Yuan part_stat_read(hd, ios[READ]), 116653f22956SLiu Yuan part_stat_read(hd, merges[READ]), 1167f95fe9cfSHerbert Poetzl part_stat_read(hd, sectors[READ]), 116853f22956SLiu Yuan jiffies_to_msecs(part_stat_read(hd, ticks[READ])), 116953f22956SLiu Yuan part_stat_read(hd, ios[WRITE]), 117053f22956SLiu Yuan part_stat_read(hd, merges[WRITE]), 1171f95fe9cfSHerbert Poetzl part_stat_read(hd, sectors[WRITE]), 117253f22956SLiu Yuan jiffies_to_msecs(part_stat_read(hd, ticks[WRITE])), 1173316d315bSNikanth Karthikesan part_in_flight(hd), 117428f39d55SJerome Marchand jiffies_to_msecs(part_stat_read(hd, io_ticks)), 117528f39d55SJerome Marchand jiffies_to_msecs(part_stat_read(hd, time_in_queue)) 117628f39d55SJerome Marchand ); 11771da177e4SLinus Torvalds } 1178e71bf0d0STejun Heo disk_part_iter_exit(&piter); 11791da177e4SLinus Torvalds 11801da177e4SLinus Torvalds return 0; 11811da177e4SLinus Torvalds } 11821da177e4SLinus Torvalds 118331d85ab2SAlexey Dobriyan static const struct seq_operations diskstats_op = { 1184def4e38dSTejun Heo .start = disk_seqf_start, 1185def4e38dSTejun Heo .next = disk_seqf_next, 1186def4e38dSTejun Heo .stop = disk_seqf_stop, 11871da177e4SLinus Torvalds .show = diskstats_show 11881da177e4SLinus Torvalds }; 1189f500975aSAlexey Dobriyan 119031d85ab2SAlexey Dobriyan static int diskstats_open(struct inode *inode, struct file *file) 119131d85ab2SAlexey Dobriyan { 119231d85ab2SAlexey Dobriyan return seq_open(file, &diskstats_op); 119331d85ab2SAlexey Dobriyan } 119431d85ab2SAlexey Dobriyan 119531d85ab2SAlexey Dobriyan static const struct file_operations proc_diskstats_operations = { 119631d85ab2SAlexey Dobriyan .open = diskstats_open, 119731d85ab2SAlexey Dobriyan .read = seq_read, 119831d85ab2SAlexey Dobriyan .llseek = seq_lseek, 119931d85ab2SAlexey Dobriyan .release = seq_release, 120031d85ab2SAlexey Dobriyan }; 120131d85ab2SAlexey Dobriyan 1202f500975aSAlexey Dobriyan static int __init proc_genhd_init(void) 1203f500975aSAlexey Dobriyan { 120431d85ab2SAlexey Dobriyan proc_create("diskstats", 0, NULL, &proc_diskstats_operations); 1205f500975aSAlexey Dobriyan proc_create("partitions", 0, NULL, &proc_partitions_operations); 1206f500975aSAlexey Dobriyan return 0; 1207f500975aSAlexey Dobriyan } 1208f500975aSAlexey Dobriyan module_init(proc_genhd_init); 1209a6e2ba88SRandy Dunlap #endif /* CONFIG_PROC_FS */ 12101da177e4SLinus Torvalds 1211cf771cb5STejun Heo dev_t blk_lookup_devt(const char *name, int partno) 1212edfaa7c3SKay Sievers { 1213edfaa7c3SKay Sievers dev_t devt = MKDEV(0, 0); 1214def4e38dSTejun Heo struct class_dev_iter iter; 1215def4e38dSTejun Heo struct device *dev; 1216edfaa7c3SKay Sievers 1217def4e38dSTejun Heo class_dev_iter_init(&iter, &block_class, NULL, &disk_type); 1218def4e38dSTejun Heo while ((dev = class_dev_iter_next(&iter))) { 1219def4e38dSTejun Heo struct gendisk *disk = dev_to_disk(dev); 1220548b10ebSTejun Heo struct hd_struct *part; 1221def4e38dSTejun Heo 12223ada8b7eSKay Sievers if (strcmp(dev_name(dev), name)) 1223f331c029STejun Heo continue; 1224f331c029STejun Heo 122541b8c853SNeil Brown if (partno < disk->minors) { 122641b8c853SNeil Brown /* We need to return the right devno, even 122741b8c853SNeil Brown * if the partition doesn't exist yet. 122841b8c853SNeil Brown */ 122941b8c853SNeil Brown devt = MKDEV(MAJOR(dev->devt), 123041b8c853SNeil Brown MINOR(dev->devt) + partno); 123141b8c853SNeil Brown break; 123241b8c853SNeil Brown } 1233e71bf0d0STejun Heo part = disk_get_part(disk, partno); 12342bbedcb4STejun Heo if (part) { 1235f331c029STejun Heo devt = part_devt(part); 1236e71bf0d0STejun Heo disk_put_part(part); 1237f331c029STejun Heo break; 1238def4e38dSTejun Heo } 1239548b10ebSTejun Heo disk_put_part(part); 1240548b10ebSTejun Heo } 1241def4e38dSTejun Heo class_dev_iter_exit(&iter); 1242edfaa7c3SKay Sievers return devt; 1243edfaa7c3SKay Sievers } 1244edfaa7c3SKay Sievers EXPORT_SYMBOL(blk_lookup_devt); 1245edfaa7c3SKay Sievers 12461da177e4SLinus Torvalds struct gendisk *alloc_disk(int minors) 12471da177e4SLinus Torvalds { 1248*c304a51bSEzequiel Garcia return alloc_disk_node(minors, NUMA_NO_NODE); 12491946089aSChristoph Lameter } 1250689d6facSTejun Heo EXPORT_SYMBOL(alloc_disk); 12511946089aSChristoph Lameter 12521946089aSChristoph Lameter struct gendisk *alloc_disk_node(int minors, int node_id) 12531946089aSChristoph Lameter { 12541946089aSChristoph Lameter struct gendisk *disk; 12551946089aSChristoph Lameter 125694f6030cSChristoph Lameter disk = kmalloc_node(sizeof(struct gendisk), 125794f6030cSChristoph Lameter GFP_KERNEL | __GFP_ZERO, node_id); 12581da177e4SLinus Torvalds if (disk) { 1259074a7acaSTejun Heo if (!init_part_stats(&disk->part0)) { 12601da177e4SLinus Torvalds kfree(disk); 12611da177e4SLinus Torvalds return NULL; 12621da177e4SLinus Torvalds } 1263bf91db18SCheng Renquan disk->node_id = node_id; 1264540eed56STejun Heo if (disk_expand_part_tbl(disk, 0)) { 1265074a7acaSTejun Heo free_part_stats(&disk->part0); 12661da177e4SLinus Torvalds kfree(disk); 12671da177e4SLinus Torvalds return NULL; 12681da177e4SLinus Torvalds } 1269540eed56STejun Heo disk->part_tbl->part[0] = &disk->part0; 12706c23a968SJens Axboe 1271c83f6bf9SVivek Goyal /* 1272c83f6bf9SVivek Goyal * set_capacity() and get_capacity() currently don't use 1273c83f6bf9SVivek Goyal * seqcounter to read/update the part0->nr_sects. Still init 1274c83f6bf9SVivek Goyal * the counter as we can read the sectors in IO submission 1275c83f6bf9SVivek Goyal * patch using seqence counters. 1276c83f6bf9SVivek Goyal * 1277c83f6bf9SVivek Goyal * TODO: Ideally set_capacity() and get_capacity() should be 1278c83f6bf9SVivek Goyal * converted to make use of bd_mutex and sequence counters. 1279c83f6bf9SVivek Goyal */ 1280c83f6bf9SVivek Goyal seqcount_init(&disk->part0.nr_sects_seq); 12816c23a968SJens Axboe hd_ref_init(&disk->part0); 1282b5d0b9dfSTejun Heo 12831da177e4SLinus Torvalds disk->minors = minors; 12841da177e4SLinus Torvalds rand_initialize_disk(disk); 1285ed9e1982STejun Heo disk_to_dev(disk)->class = &block_class; 1286ed9e1982STejun Heo disk_to_dev(disk)->type = &disk_type; 1287ed9e1982STejun Heo device_initialize(disk_to_dev(disk)); 12881da177e4SLinus Torvalds } 12891da177e4SLinus Torvalds return disk; 12901da177e4SLinus Torvalds } 12911946089aSChristoph Lameter EXPORT_SYMBOL(alloc_disk_node); 12921da177e4SLinus Torvalds 12931da177e4SLinus Torvalds struct kobject *get_disk(struct gendisk *disk) 12941da177e4SLinus Torvalds { 12951da177e4SLinus Torvalds struct module *owner; 12961da177e4SLinus Torvalds struct kobject *kobj; 12971da177e4SLinus Torvalds 12981da177e4SLinus Torvalds if (!disk->fops) 12991da177e4SLinus Torvalds return NULL; 13001da177e4SLinus Torvalds owner = disk->fops->owner; 13011da177e4SLinus Torvalds if (owner && !try_module_get(owner)) 13021da177e4SLinus Torvalds return NULL; 1303ed9e1982STejun Heo kobj = kobject_get(&disk_to_dev(disk)->kobj); 13041da177e4SLinus Torvalds if (kobj == NULL) { 13051da177e4SLinus Torvalds module_put(owner); 13061da177e4SLinus Torvalds return NULL; 13071da177e4SLinus Torvalds } 13081da177e4SLinus Torvalds return kobj; 13091da177e4SLinus Torvalds 13101da177e4SLinus Torvalds } 13111da177e4SLinus Torvalds 13121da177e4SLinus Torvalds EXPORT_SYMBOL(get_disk); 13131da177e4SLinus Torvalds 13141da177e4SLinus Torvalds void put_disk(struct gendisk *disk) 13151da177e4SLinus Torvalds { 13161da177e4SLinus Torvalds if (disk) 1317ed9e1982STejun Heo kobject_put(&disk_to_dev(disk)->kobj); 13181da177e4SLinus Torvalds } 13191da177e4SLinus Torvalds 13201da177e4SLinus Torvalds EXPORT_SYMBOL(put_disk); 13211da177e4SLinus Torvalds 1322e3264a4dSHannes Reinecke static void set_disk_ro_uevent(struct gendisk *gd, int ro) 1323e3264a4dSHannes Reinecke { 1324e3264a4dSHannes Reinecke char event[] = "DISK_RO=1"; 1325e3264a4dSHannes Reinecke char *envp[] = { event, NULL }; 1326e3264a4dSHannes Reinecke 1327e3264a4dSHannes Reinecke if (!ro) 1328e3264a4dSHannes Reinecke event[8] = '0'; 1329e3264a4dSHannes Reinecke kobject_uevent_env(&disk_to_dev(gd)->kobj, KOBJ_CHANGE, envp); 1330e3264a4dSHannes Reinecke } 1331e3264a4dSHannes Reinecke 13321da177e4SLinus Torvalds void set_device_ro(struct block_device *bdev, int flag) 13331da177e4SLinus Torvalds { 13341da177e4SLinus Torvalds bdev->bd_part->policy = flag; 13351da177e4SLinus Torvalds } 13361da177e4SLinus Torvalds 13371da177e4SLinus Torvalds EXPORT_SYMBOL(set_device_ro); 13381da177e4SLinus Torvalds 13391da177e4SLinus Torvalds void set_disk_ro(struct gendisk *disk, int flag) 13401da177e4SLinus Torvalds { 1341e71bf0d0STejun Heo struct disk_part_iter piter; 1342e71bf0d0STejun Heo struct hd_struct *part; 1343e71bf0d0STejun Heo 1344e3264a4dSHannes Reinecke if (disk->part0.policy != flag) { 1345e3264a4dSHannes Reinecke set_disk_ro_uevent(disk, flag); 1346e3264a4dSHannes Reinecke disk->part0.policy = flag; 1347e3264a4dSHannes Reinecke } 1348e3264a4dSHannes Reinecke 1349e3264a4dSHannes Reinecke disk_part_iter_init(&piter, disk, DISK_PITER_INCL_EMPTY); 1350e71bf0d0STejun Heo while ((part = disk_part_iter_next(&piter))) 1351e71bf0d0STejun Heo part->policy = flag; 1352e71bf0d0STejun Heo disk_part_iter_exit(&piter); 13531da177e4SLinus Torvalds } 13541da177e4SLinus Torvalds 13551da177e4SLinus Torvalds EXPORT_SYMBOL(set_disk_ro); 13561da177e4SLinus Torvalds 13571da177e4SLinus Torvalds int bdev_read_only(struct block_device *bdev) 13581da177e4SLinus Torvalds { 13591da177e4SLinus Torvalds if (!bdev) 13601da177e4SLinus Torvalds return 0; 13611da177e4SLinus Torvalds return bdev->bd_part->policy; 13621da177e4SLinus Torvalds } 13631da177e4SLinus Torvalds 13641da177e4SLinus Torvalds EXPORT_SYMBOL(bdev_read_only); 13651da177e4SLinus Torvalds 1366cf771cb5STejun Heo int invalidate_partition(struct gendisk *disk, int partno) 13671da177e4SLinus Torvalds { 13681da177e4SLinus Torvalds int res = 0; 1369cf771cb5STejun Heo struct block_device *bdev = bdget_disk(disk, partno); 13701da177e4SLinus Torvalds if (bdev) { 13712ef41634SChristoph Hellwig fsync_bdev(bdev); 137293b270f7SNeilBrown res = __invalidate_device(bdev, true); 13731da177e4SLinus Torvalds bdput(bdev); 13741da177e4SLinus Torvalds } 13751da177e4SLinus Torvalds return res; 13761da177e4SLinus Torvalds } 13771da177e4SLinus Torvalds 13781da177e4SLinus Torvalds EXPORT_SYMBOL(invalidate_partition); 137977ea887eSTejun Heo 138077ea887eSTejun Heo /* 138177ea887eSTejun Heo * Disk events - monitor disk events like media change and eject request. 138277ea887eSTejun Heo */ 138377ea887eSTejun Heo struct disk_events { 138477ea887eSTejun Heo struct list_head node; /* all disk_event's */ 138577ea887eSTejun Heo struct gendisk *disk; /* the associated disk */ 138677ea887eSTejun Heo spinlock_t lock; 138777ea887eSTejun Heo 1388fdd514e1STejun Heo struct mutex block_mutex; /* protects blocking */ 138977ea887eSTejun Heo int block; /* event blocking depth */ 139077ea887eSTejun Heo unsigned int pending; /* events already sent out */ 139177ea887eSTejun Heo unsigned int clearing; /* events being cleared */ 139277ea887eSTejun Heo 139377ea887eSTejun Heo long poll_msecs; /* interval, -1 for default */ 139477ea887eSTejun Heo struct delayed_work dwork; 139577ea887eSTejun Heo }; 139677ea887eSTejun Heo 139777ea887eSTejun Heo static const char *disk_events_strs[] = { 139877ea887eSTejun Heo [ilog2(DISK_EVENT_MEDIA_CHANGE)] = "media_change", 139977ea887eSTejun Heo [ilog2(DISK_EVENT_EJECT_REQUEST)] = "eject_request", 140077ea887eSTejun Heo }; 140177ea887eSTejun Heo 140277ea887eSTejun Heo static char *disk_uevents[] = { 140377ea887eSTejun Heo [ilog2(DISK_EVENT_MEDIA_CHANGE)] = "DISK_MEDIA_CHANGE=1", 140477ea887eSTejun Heo [ilog2(DISK_EVENT_EJECT_REQUEST)] = "DISK_EJECT_REQUEST=1", 140577ea887eSTejun Heo }; 140677ea887eSTejun Heo 140777ea887eSTejun Heo /* list of all disk_events */ 140877ea887eSTejun Heo static DEFINE_MUTEX(disk_events_mutex); 140977ea887eSTejun Heo static LIST_HEAD(disk_events); 141077ea887eSTejun Heo 141177ea887eSTejun Heo /* disable in-kernel polling by default */ 141277ea887eSTejun Heo static unsigned long disk_events_dfl_poll_msecs = 0; 141377ea887eSTejun Heo 141477ea887eSTejun Heo static unsigned long disk_events_poll_jiffies(struct gendisk *disk) 141577ea887eSTejun Heo { 141677ea887eSTejun Heo struct disk_events *ev = disk->ev; 141777ea887eSTejun Heo long intv_msecs = 0; 141877ea887eSTejun Heo 141977ea887eSTejun Heo /* 142077ea887eSTejun Heo * If device-specific poll interval is set, always use it. If 142177ea887eSTejun Heo * the default is being used, poll iff there are events which 142277ea887eSTejun Heo * can't be monitored asynchronously. 142377ea887eSTejun Heo */ 142477ea887eSTejun Heo if (ev->poll_msecs >= 0) 142577ea887eSTejun Heo intv_msecs = ev->poll_msecs; 142677ea887eSTejun Heo else if (disk->events & ~disk->async_events) 142777ea887eSTejun Heo intv_msecs = disk_events_dfl_poll_msecs; 142877ea887eSTejun Heo 142977ea887eSTejun Heo return msecs_to_jiffies(intv_msecs); 143077ea887eSTejun Heo } 143177ea887eSTejun Heo 1432c3af54afSTejun Heo /** 1433c3af54afSTejun Heo * disk_block_events - block and flush disk event checking 1434c3af54afSTejun Heo * @disk: disk to block events for 1435c3af54afSTejun Heo * 1436c3af54afSTejun Heo * On return from this function, it is guaranteed that event checking 1437c3af54afSTejun Heo * isn't in progress and won't happen until unblocked by 1438c3af54afSTejun Heo * disk_unblock_events(). Events blocking is counted and the actual 1439c3af54afSTejun Heo * unblocking happens after the matching number of unblocks are done. 1440c3af54afSTejun Heo * 1441c3af54afSTejun Heo * Note that this intentionally does not block event checking from 1442c3af54afSTejun Heo * disk_clear_events(). 1443c3af54afSTejun Heo * 1444c3af54afSTejun Heo * CONTEXT: 1445c3af54afSTejun Heo * Might sleep. 1446c3af54afSTejun Heo */ 1447c3af54afSTejun Heo void disk_block_events(struct gendisk *disk) 144877ea887eSTejun Heo { 144977ea887eSTejun Heo struct disk_events *ev = disk->ev; 145077ea887eSTejun Heo unsigned long flags; 145177ea887eSTejun Heo bool cancel; 145277ea887eSTejun Heo 1453c3af54afSTejun Heo if (!ev) 1454c3af54afSTejun Heo return; 1455c3af54afSTejun Heo 1456fdd514e1STejun Heo /* 1457fdd514e1STejun Heo * Outer mutex ensures that the first blocker completes canceling 1458fdd514e1STejun Heo * the event work before further blockers are allowed to finish. 1459fdd514e1STejun Heo */ 1460fdd514e1STejun Heo mutex_lock(&ev->block_mutex); 1461fdd514e1STejun Heo 146277ea887eSTejun Heo spin_lock_irqsave(&ev->lock, flags); 146377ea887eSTejun Heo cancel = !ev->block++; 146477ea887eSTejun Heo spin_unlock_irqrestore(&ev->lock, flags); 146577ea887eSTejun Heo 1466c3af54afSTejun Heo if (cancel) 146777ea887eSTejun Heo cancel_delayed_work_sync(&disk->ev->dwork); 1468fdd514e1STejun Heo 1469fdd514e1STejun Heo mutex_unlock(&ev->block_mutex); 147077ea887eSTejun Heo } 147177ea887eSTejun Heo 147277ea887eSTejun Heo static void __disk_unblock_events(struct gendisk *disk, bool check_now) 147377ea887eSTejun Heo { 147477ea887eSTejun Heo struct disk_events *ev = disk->ev; 147577ea887eSTejun Heo unsigned long intv; 147677ea887eSTejun Heo unsigned long flags; 147777ea887eSTejun Heo 147877ea887eSTejun Heo spin_lock_irqsave(&ev->lock, flags); 147977ea887eSTejun Heo 148077ea887eSTejun Heo if (WARN_ON_ONCE(ev->block <= 0)) 148177ea887eSTejun Heo goto out_unlock; 148277ea887eSTejun Heo 148377ea887eSTejun Heo if (--ev->block) 148477ea887eSTejun Heo goto out_unlock; 148577ea887eSTejun Heo 148677ea887eSTejun Heo /* 148777ea887eSTejun Heo * Not exactly a latency critical operation, set poll timer 148877ea887eSTejun Heo * slack to 25% and kick event check. 148977ea887eSTejun Heo */ 149077ea887eSTejun Heo intv = disk_events_poll_jiffies(disk); 149177ea887eSTejun Heo set_timer_slack(&ev->dwork.timer, intv / 4); 149277ea887eSTejun Heo if (check_now) 14933b07e9caSTejun Heo queue_delayed_work(system_freezable_wq, &ev->dwork, 0); 149477ea887eSTejun Heo else if (intv) 14953b07e9caSTejun Heo queue_delayed_work(system_freezable_wq, &ev->dwork, intv); 149677ea887eSTejun Heo out_unlock: 149777ea887eSTejun Heo spin_unlock_irqrestore(&ev->lock, flags); 149877ea887eSTejun Heo } 149977ea887eSTejun Heo 150077ea887eSTejun Heo /** 150177ea887eSTejun Heo * disk_unblock_events - unblock disk event checking 150277ea887eSTejun Heo * @disk: disk to unblock events for 150377ea887eSTejun Heo * 150477ea887eSTejun Heo * Undo disk_block_events(). When the block count reaches zero, it 150577ea887eSTejun Heo * starts events polling if configured. 150677ea887eSTejun Heo * 150777ea887eSTejun Heo * CONTEXT: 150877ea887eSTejun Heo * Don't care. Safe to call from irq context. 150977ea887eSTejun Heo */ 151077ea887eSTejun Heo void disk_unblock_events(struct gendisk *disk) 151177ea887eSTejun Heo { 151277ea887eSTejun Heo if (disk->ev) 1513facc31ddSTejun Heo __disk_unblock_events(disk, false); 151477ea887eSTejun Heo } 151577ea887eSTejun Heo 151677ea887eSTejun Heo /** 151785ef06d1STejun Heo * disk_flush_events - schedule immediate event checking and flushing 151885ef06d1STejun Heo * @disk: disk to check and flush events for 151985ef06d1STejun Heo * @mask: events to flush 152077ea887eSTejun Heo * 152185ef06d1STejun Heo * Schedule immediate event checking on @disk if not blocked. Events in 152285ef06d1STejun Heo * @mask are scheduled to be cleared from the driver. Note that this 152385ef06d1STejun Heo * doesn't clear the events from @disk->ev. 152477ea887eSTejun Heo * 152577ea887eSTejun Heo * CONTEXT: 152685ef06d1STejun Heo * If @mask is non-zero must be called with bdev->bd_mutex held. 152777ea887eSTejun Heo */ 152885ef06d1STejun Heo void disk_flush_events(struct gendisk *disk, unsigned int mask) 152977ea887eSTejun Heo { 1530a9dce2a3STejun Heo struct disk_events *ev = disk->ev; 1531a9dce2a3STejun Heo 1532a9dce2a3STejun Heo if (!ev) 1533a9dce2a3STejun Heo return; 1534a9dce2a3STejun Heo 153585ef06d1STejun Heo spin_lock_irq(&ev->lock); 153685ef06d1STejun Heo ev->clearing |= mask; 153741f63c53STejun Heo if (!ev->block) 15383b07e9caSTejun Heo mod_delayed_work(system_freezable_wq, &ev->dwork, 0); 153985ef06d1STejun Heo spin_unlock_irq(&ev->lock); 154077ea887eSTejun Heo } 154177ea887eSTejun Heo 154277ea887eSTejun Heo /** 154377ea887eSTejun Heo * disk_clear_events - synchronously check, clear and return pending events 154477ea887eSTejun Heo * @disk: disk to fetch and clear events from 154577ea887eSTejun Heo * @mask: mask of events to be fetched and clearted 154677ea887eSTejun Heo * 154777ea887eSTejun Heo * Disk events are synchronously checked and pending events in @mask 154877ea887eSTejun Heo * are cleared and returned. This ignores the block count. 154977ea887eSTejun Heo * 155077ea887eSTejun Heo * CONTEXT: 155177ea887eSTejun Heo * Might sleep. 155277ea887eSTejun Heo */ 155377ea887eSTejun Heo unsigned int disk_clear_events(struct gendisk *disk, unsigned int mask) 155477ea887eSTejun Heo { 155577ea887eSTejun Heo const struct block_device_operations *bdops = disk->fops; 155677ea887eSTejun Heo struct disk_events *ev = disk->ev; 155777ea887eSTejun Heo unsigned int pending; 155877ea887eSTejun Heo 155977ea887eSTejun Heo if (!ev) { 156077ea887eSTejun Heo /* for drivers still using the old ->media_changed method */ 156177ea887eSTejun Heo if ((mask & DISK_EVENT_MEDIA_CHANGE) && 156277ea887eSTejun Heo bdops->media_changed && bdops->media_changed(disk)) 156377ea887eSTejun Heo return DISK_EVENT_MEDIA_CHANGE; 156477ea887eSTejun Heo return 0; 156577ea887eSTejun Heo } 156677ea887eSTejun Heo 156777ea887eSTejun Heo /* tell the workfn about the events being cleared */ 156877ea887eSTejun Heo spin_lock_irq(&ev->lock); 156977ea887eSTejun Heo ev->clearing |= mask; 157077ea887eSTejun Heo spin_unlock_irq(&ev->lock); 157177ea887eSTejun Heo 157277ea887eSTejun Heo /* uncondtionally schedule event check and wait for it to finish */ 1573c3af54afSTejun Heo disk_block_events(disk); 15743b07e9caSTejun Heo queue_delayed_work(system_freezable_wq, &ev->dwork, 0); 157577ea887eSTejun Heo flush_delayed_work(&ev->dwork); 157677ea887eSTejun Heo __disk_unblock_events(disk, false); 157777ea887eSTejun Heo 157877ea887eSTejun Heo /* then, fetch and clear pending events */ 157977ea887eSTejun Heo spin_lock_irq(&ev->lock); 158077ea887eSTejun Heo WARN_ON_ONCE(ev->clearing & mask); /* cleared by workfn */ 158177ea887eSTejun Heo pending = ev->pending & mask; 158277ea887eSTejun Heo ev->pending &= ~mask; 158377ea887eSTejun Heo spin_unlock_irq(&ev->lock); 158477ea887eSTejun Heo 158577ea887eSTejun Heo return pending; 158677ea887eSTejun Heo } 158777ea887eSTejun Heo 158877ea887eSTejun Heo static void disk_events_workfn(struct work_struct *work) 158977ea887eSTejun Heo { 159077ea887eSTejun Heo struct delayed_work *dwork = to_delayed_work(work); 159177ea887eSTejun Heo struct disk_events *ev = container_of(dwork, struct disk_events, dwork); 159277ea887eSTejun Heo struct gendisk *disk = ev->disk; 159377ea887eSTejun Heo char *envp[ARRAY_SIZE(disk_uevents) + 1] = { }; 159477ea887eSTejun Heo unsigned int clearing = ev->clearing; 159577ea887eSTejun Heo unsigned int events; 159677ea887eSTejun Heo unsigned long intv; 159777ea887eSTejun Heo int nr_events = 0, i; 159877ea887eSTejun Heo 159977ea887eSTejun Heo /* check events */ 160077ea887eSTejun Heo events = disk->fops->check_events(disk, clearing); 160177ea887eSTejun Heo 160277ea887eSTejun Heo /* accumulate pending events and schedule next poll if necessary */ 160377ea887eSTejun Heo spin_lock_irq(&ev->lock); 160477ea887eSTejun Heo 160577ea887eSTejun Heo events &= ~ev->pending; 160677ea887eSTejun Heo ev->pending |= events; 160777ea887eSTejun Heo ev->clearing &= ~clearing; 160877ea887eSTejun Heo 160977ea887eSTejun Heo intv = disk_events_poll_jiffies(disk); 161077ea887eSTejun Heo if (!ev->block && intv) 16113b07e9caSTejun Heo queue_delayed_work(system_freezable_wq, &ev->dwork, intv); 161277ea887eSTejun Heo 161377ea887eSTejun Heo spin_unlock_irq(&ev->lock); 161477ea887eSTejun Heo 16157c88a168STejun Heo /* 16167c88a168STejun Heo * Tell userland about new events. Only the events listed in 16177c88a168STejun Heo * @disk->events are reported. Unlisted events are processed the 16187c88a168STejun Heo * same internally but never get reported to userland. 16197c88a168STejun Heo */ 162077ea887eSTejun Heo for (i = 0; i < ARRAY_SIZE(disk_uevents); i++) 16217c88a168STejun Heo if (events & disk->events & (1 << i)) 162277ea887eSTejun Heo envp[nr_events++] = disk_uevents[i]; 162377ea887eSTejun Heo 162477ea887eSTejun Heo if (nr_events) 162577ea887eSTejun Heo kobject_uevent_env(&disk_to_dev(disk)->kobj, KOBJ_CHANGE, envp); 162677ea887eSTejun Heo } 162777ea887eSTejun Heo 162877ea887eSTejun Heo /* 162977ea887eSTejun Heo * A disk events enabled device has the following sysfs nodes under 163077ea887eSTejun Heo * its /sys/block/X/ directory. 163177ea887eSTejun Heo * 163277ea887eSTejun Heo * events : list of all supported events 163377ea887eSTejun Heo * events_async : list of events which can be detected w/o polling 163477ea887eSTejun Heo * events_poll_msecs : polling interval, 0: disable, -1: system default 163577ea887eSTejun Heo */ 163677ea887eSTejun Heo static ssize_t __disk_events_show(unsigned int events, char *buf) 163777ea887eSTejun Heo { 163877ea887eSTejun Heo const char *delim = ""; 163977ea887eSTejun Heo ssize_t pos = 0; 164077ea887eSTejun Heo int i; 164177ea887eSTejun Heo 164277ea887eSTejun Heo for (i = 0; i < ARRAY_SIZE(disk_events_strs); i++) 164377ea887eSTejun Heo if (events & (1 << i)) { 164477ea887eSTejun Heo pos += sprintf(buf + pos, "%s%s", 164577ea887eSTejun Heo delim, disk_events_strs[i]); 164677ea887eSTejun Heo delim = " "; 164777ea887eSTejun Heo } 164877ea887eSTejun Heo if (pos) 164977ea887eSTejun Heo pos += sprintf(buf + pos, "\n"); 165077ea887eSTejun Heo return pos; 165177ea887eSTejun Heo } 165277ea887eSTejun Heo 165377ea887eSTejun Heo static ssize_t disk_events_show(struct device *dev, 165477ea887eSTejun Heo struct device_attribute *attr, char *buf) 165577ea887eSTejun Heo { 165677ea887eSTejun Heo struct gendisk *disk = dev_to_disk(dev); 165777ea887eSTejun Heo 165877ea887eSTejun Heo return __disk_events_show(disk->events, buf); 165977ea887eSTejun Heo } 166077ea887eSTejun Heo 166177ea887eSTejun Heo static ssize_t disk_events_async_show(struct device *dev, 166277ea887eSTejun Heo struct device_attribute *attr, char *buf) 166377ea887eSTejun Heo { 166477ea887eSTejun Heo struct gendisk *disk = dev_to_disk(dev); 166577ea887eSTejun Heo 166677ea887eSTejun Heo return __disk_events_show(disk->async_events, buf); 166777ea887eSTejun Heo } 166877ea887eSTejun Heo 166977ea887eSTejun Heo static ssize_t disk_events_poll_msecs_show(struct device *dev, 167077ea887eSTejun Heo struct device_attribute *attr, 167177ea887eSTejun Heo char *buf) 167277ea887eSTejun Heo { 167377ea887eSTejun Heo struct gendisk *disk = dev_to_disk(dev); 167477ea887eSTejun Heo 167577ea887eSTejun Heo return sprintf(buf, "%ld\n", disk->ev->poll_msecs); 167677ea887eSTejun Heo } 167777ea887eSTejun Heo 167877ea887eSTejun Heo static ssize_t disk_events_poll_msecs_store(struct device *dev, 167977ea887eSTejun Heo struct device_attribute *attr, 168077ea887eSTejun Heo const char *buf, size_t count) 168177ea887eSTejun Heo { 168277ea887eSTejun Heo struct gendisk *disk = dev_to_disk(dev); 168377ea887eSTejun Heo long intv; 168477ea887eSTejun Heo 168577ea887eSTejun Heo if (!count || !sscanf(buf, "%ld", &intv)) 168677ea887eSTejun Heo return -EINVAL; 168777ea887eSTejun Heo 168877ea887eSTejun Heo if (intv < 0 && intv != -1) 168977ea887eSTejun Heo return -EINVAL; 169077ea887eSTejun Heo 1691c3af54afSTejun Heo disk_block_events(disk); 169277ea887eSTejun Heo disk->ev->poll_msecs = intv; 169377ea887eSTejun Heo __disk_unblock_events(disk, true); 169477ea887eSTejun Heo 169577ea887eSTejun Heo return count; 169677ea887eSTejun Heo } 169777ea887eSTejun Heo 169877ea887eSTejun Heo static const DEVICE_ATTR(events, S_IRUGO, disk_events_show, NULL); 169977ea887eSTejun Heo static const DEVICE_ATTR(events_async, S_IRUGO, disk_events_async_show, NULL); 170077ea887eSTejun Heo static const DEVICE_ATTR(events_poll_msecs, S_IRUGO|S_IWUSR, 170177ea887eSTejun Heo disk_events_poll_msecs_show, 170277ea887eSTejun Heo disk_events_poll_msecs_store); 170377ea887eSTejun Heo 170477ea887eSTejun Heo static const struct attribute *disk_events_attrs[] = { 170577ea887eSTejun Heo &dev_attr_events.attr, 170677ea887eSTejun Heo &dev_attr_events_async.attr, 170777ea887eSTejun Heo &dev_attr_events_poll_msecs.attr, 170877ea887eSTejun Heo NULL, 170977ea887eSTejun Heo }; 171077ea887eSTejun Heo 171177ea887eSTejun Heo /* 171277ea887eSTejun Heo * The default polling interval can be specified by the kernel 171377ea887eSTejun Heo * parameter block.events_dfl_poll_msecs which defaults to 0 171477ea887eSTejun Heo * (disable). This can also be modified runtime by writing to 171577ea887eSTejun Heo * /sys/module/block/events_dfl_poll_msecs. 171677ea887eSTejun Heo */ 171777ea887eSTejun Heo static int disk_events_set_dfl_poll_msecs(const char *val, 171877ea887eSTejun Heo const struct kernel_param *kp) 171977ea887eSTejun Heo { 172077ea887eSTejun Heo struct disk_events *ev; 172177ea887eSTejun Heo int ret; 172277ea887eSTejun Heo 172377ea887eSTejun Heo ret = param_set_ulong(val, kp); 172477ea887eSTejun Heo if (ret < 0) 172577ea887eSTejun Heo return ret; 172677ea887eSTejun Heo 172777ea887eSTejun Heo mutex_lock(&disk_events_mutex); 172877ea887eSTejun Heo 172977ea887eSTejun Heo list_for_each_entry(ev, &disk_events, node) 173085ef06d1STejun Heo disk_flush_events(ev->disk, 0); 173177ea887eSTejun Heo 173277ea887eSTejun Heo mutex_unlock(&disk_events_mutex); 173377ea887eSTejun Heo 173477ea887eSTejun Heo return 0; 173577ea887eSTejun Heo } 173677ea887eSTejun Heo 173777ea887eSTejun Heo static const struct kernel_param_ops disk_events_dfl_poll_msecs_param_ops = { 173877ea887eSTejun Heo .set = disk_events_set_dfl_poll_msecs, 173977ea887eSTejun Heo .get = param_get_ulong, 174077ea887eSTejun Heo }; 174177ea887eSTejun Heo 174277ea887eSTejun Heo #undef MODULE_PARAM_PREFIX 174377ea887eSTejun Heo #define MODULE_PARAM_PREFIX "block." 174477ea887eSTejun Heo 174577ea887eSTejun Heo module_param_cb(events_dfl_poll_msecs, &disk_events_dfl_poll_msecs_param_ops, 174677ea887eSTejun Heo &disk_events_dfl_poll_msecs, 0644); 174777ea887eSTejun Heo 174877ea887eSTejun Heo /* 17499f53d2feSStanislaw Gruszka * disk_{alloc|add|del|release}_events - initialize and destroy disk_events. 175077ea887eSTejun Heo */ 17519f53d2feSStanislaw Gruszka static void disk_alloc_events(struct gendisk *disk) 175277ea887eSTejun Heo { 175377ea887eSTejun Heo struct disk_events *ev; 175477ea887eSTejun Heo 175575e3f3eeSTejun Heo if (!disk->fops->check_events) 175677ea887eSTejun Heo return; 175777ea887eSTejun Heo 175877ea887eSTejun Heo ev = kzalloc(sizeof(*ev), GFP_KERNEL); 175977ea887eSTejun Heo if (!ev) { 176077ea887eSTejun Heo pr_warn("%s: failed to initialize events\n", disk->disk_name); 176177ea887eSTejun Heo return; 176277ea887eSTejun Heo } 176377ea887eSTejun Heo 176477ea887eSTejun Heo INIT_LIST_HEAD(&ev->node); 176577ea887eSTejun Heo ev->disk = disk; 176677ea887eSTejun Heo spin_lock_init(&ev->lock); 1767fdd514e1STejun Heo mutex_init(&ev->block_mutex); 176877ea887eSTejun Heo ev->block = 1; 176977ea887eSTejun Heo ev->poll_msecs = -1; 177077ea887eSTejun Heo INIT_DELAYED_WORK(&ev->dwork, disk_events_workfn); 177177ea887eSTejun Heo 17729f53d2feSStanislaw Gruszka disk->ev = ev; 17739f53d2feSStanislaw Gruszka } 17749f53d2feSStanislaw Gruszka 17759f53d2feSStanislaw Gruszka static void disk_add_events(struct gendisk *disk) 17769f53d2feSStanislaw Gruszka { 17779f53d2feSStanislaw Gruszka if (!disk->ev) 17789f53d2feSStanislaw Gruszka return; 17799f53d2feSStanislaw Gruszka 17809f53d2feSStanislaw Gruszka /* FIXME: error handling */ 17819f53d2feSStanislaw Gruszka if (sysfs_create_files(&disk_to_dev(disk)->kobj, disk_events_attrs) < 0) 17829f53d2feSStanislaw Gruszka pr_warn("%s: failed to create sysfs files for events\n", 17839f53d2feSStanislaw Gruszka disk->disk_name); 17849f53d2feSStanislaw Gruszka 178577ea887eSTejun Heo mutex_lock(&disk_events_mutex); 17869f53d2feSStanislaw Gruszka list_add_tail(&disk->ev->node, &disk_events); 178777ea887eSTejun Heo mutex_unlock(&disk_events_mutex); 178877ea887eSTejun Heo 178977ea887eSTejun Heo /* 179077ea887eSTejun Heo * Block count is initialized to 1 and the following initial 179177ea887eSTejun Heo * unblock kicks it into action. 179277ea887eSTejun Heo */ 179377ea887eSTejun Heo __disk_unblock_events(disk, true); 179477ea887eSTejun Heo } 179577ea887eSTejun Heo 179677ea887eSTejun Heo static void disk_del_events(struct gendisk *disk) 179777ea887eSTejun Heo { 179877ea887eSTejun Heo if (!disk->ev) 179977ea887eSTejun Heo return; 180077ea887eSTejun Heo 1801c3af54afSTejun Heo disk_block_events(disk); 180277ea887eSTejun Heo 180377ea887eSTejun Heo mutex_lock(&disk_events_mutex); 180477ea887eSTejun Heo list_del_init(&disk->ev->node); 180577ea887eSTejun Heo mutex_unlock(&disk_events_mutex); 180677ea887eSTejun Heo 180777ea887eSTejun Heo sysfs_remove_files(&disk_to_dev(disk)->kobj, disk_events_attrs); 180877ea887eSTejun Heo } 180977ea887eSTejun Heo 181077ea887eSTejun Heo static void disk_release_events(struct gendisk *disk) 181177ea887eSTejun Heo { 181277ea887eSTejun Heo /* the block count should be 1 from disk_del_events() */ 181377ea887eSTejun Heo WARN_ON_ONCE(disk->ev && disk->ev->block != 1); 181477ea887eSTejun Heo kfree(disk->ev); 181577ea887eSTejun Heo } 1816