Blame - block/blk-settings.c - kernel/msm-4.9

blob: cd9b7302dfc18d5056f1f308c7c4b70aeac9ab64 [file] [log] [blame]

Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	1	/*
				2	* Functions related to setting various queue properties from drivers
				3	*/
				4	#include <linux/kernel.h>
				5	#include <linux/module.h>
				6	#include <linux/init.h>
				7	#include <linux/bio.h>
				8	#include <linux/blkdev.h>
				9	#include <linux/bootmem.h> /* for max_pfn/max_low_pfn */
Martin K. Petersen	70dd5bf	2009-07-31 11:49:12 -0400	[diff] [blame]	10	#include <linux/gcd.h>
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	11
				12	#include "blk.h"
				13
Jens Axboe	6728cb0	2008-01-31 13:03:55 +0100	[diff] [blame]	14	unsigned long blk_max_low_pfn;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	15	EXPORT_SYMBOL(blk_max_low_pfn);
Jens Axboe	6728cb0	2008-01-31 13:03:55 +0100	[diff] [blame]	16
				17	unsigned long blk_max_pfn;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	18
				19	/**
				20	* blk_queue_prep_rq - set a prepare_request function for queue
				21	* @q: queue
				22	* @pfn: prepare_request function
				23	*
				24	* It's possible for a queue to register a prepare_request callback which
				25	* is invoked before the request is handed to the request_fn. The goal of
				26	* the function is to prepare a request for I/O, it can be used to build a
				27	* cdb from the request data for instance.
				28	*
				29	*/
				30	void blk_queue_prep_rq(struct request_queue q, prep_rq_fn pfn)
				31	{
				32	q->prep_rq_fn = pfn;
				33	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	34	EXPORT_SYMBOL(blk_queue_prep_rq);
				35
				36	/**
David Woodhouse	fb2dce8	2008-08-05 18:01:53 +0100	[diff] [blame]	37	* blk_queue_set_discard - set a discard_sectors function for queue
				38	* @q: queue
				39	* @dfn: prepare_discard function
				40	*
				41	* It's possible for a queue to register a discard callback which is used
				42	* to transform a discard request into the appropriate type for the
				43	* hardware. If none is registered, then discard requests are failed
				44	* with %EOPNOTSUPP.
				45	*
				46	*/
				47	void blk_queue_set_discard(struct request_queue q, prepare_discard_fn dfn)
				48	{
				49	q->prepare_discard_fn = dfn;
				50	}
				51	EXPORT_SYMBOL(blk_queue_set_discard);
				52
				53	/**
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	54	* blk_queue_merge_bvec - set a merge_bvec function for queue
				55	* @q: queue
				56	* @mbfn: merge_bvec_fn
				57	*
				58	* Usually queues have static limitations on the max sectors or segments that
				59	* we can put in a request. Stacking drivers may have some settings that
				60	* are dynamic, and thus we have to query the queue whether it is ok to
				61	* add a new bio_vec to a bio at a given offset or not. If the block device
				62	* has such limitations, it needs to register a merge_bvec_fn to control
				63	* the size of bio's sent to it. Note that a block device must allow a
				64	* single page to be added to an empty bio. The block device driver may want
				65	* to use the bio_split() function to deal with these bio's. By default
				66	* no merge_bvec_fn is defined for a queue, and only the fixed limits are
				67	* honored.
				68	*/
				69	void blk_queue_merge_bvec(struct request_queue q, merge_bvec_fn mbfn)
				70	{
				71	q->merge_bvec_fn = mbfn;
				72	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	73	EXPORT_SYMBOL(blk_queue_merge_bvec);
				74
				75	void blk_queue_softirq_done(struct request_queue q, softirq_done_fn fn)
				76	{
				77	q->softirq_done_fn = fn;
				78	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	79	EXPORT_SYMBOL(blk_queue_softirq_done);
				80
Jens Axboe	242f9dc	2008-09-14 05:55:09 -0700	[diff] [blame]	81	void blk_queue_rq_timeout(struct request_queue *q, unsigned int timeout)
				82	{
				83	q->rq_timeout = timeout;
				84	}
				85	EXPORT_SYMBOL_GPL(blk_queue_rq_timeout);
				86
				87	void blk_queue_rq_timed_out(struct request_queue q, rq_timed_out_fn fn)
				88	{
				89	q->rq_timed_out_fn = fn;
				90	}
				91	EXPORT_SYMBOL_GPL(blk_queue_rq_timed_out);
				92
Kiyoshi Ueda	ef9e3fa	2008-10-01 16:12:15 +0200	[diff] [blame]	93	void blk_queue_lld_busy(struct request_queue q, lld_busy_fn fn)
				94	{
				95	q->lld_busy_fn = fn;
				96	}
				97	EXPORT_SYMBOL_GPL(blk_queue_lld_busy);
				98
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	99	/**
Martin K. Petersen	e475bba	2009-06-16 08:23:52 +0200	[diff] [blame]	100	* blk_set_default_limits - reset limits to default values
Randy Dunlap	f740f5ca	2009-06-19 09:18:32 +0200	[diff] [blame]	101	* @lim: the queue_limits structure to reset
Martin K. Petersen	e475bba	2009-06-16 08:23:52 +0200	[diff] [blame]	102	*
				103	* Description:
				104	* Returns a queue_limit struct to its default state. Can be used by
				105	* stacking drivers like DM that stage table swaps and reuse an
				106	* existing device queue.
				107	*/
				108	void blk_set_default_limits(struct queue_limits *lim)
				109	{
				110	lim->max_phys_segments = MAX_PHYS_SEGMENTS;
				111	lim->max_hw_segments = MAX_HW_SEGMENTS;
				112	lim->seg_boundary_mask = BLK_SEG_BOUNDARY_MASK;
				113	lim->max_segment_size = MAX_SEGMENT_SIZE;
Martin K. Petersen	80ddf24	2009-09-18 22:54:37 +0200	[diff] [blame^]	114	lim->max_sectors = lim->max_hw_sectors = BLK_DEF_MAX_SECTORS;
Martin K. Petersen	e475bba	2009-06-16 08:23:52 +0200	[diff] [blame]	115	lim->logical_block_size = lim->physical_block_size = lim->io_min = 512;
Martin K. Petersen	3a02c8e	2009-06-18 09:56:03 +0200	[diff] [blame]	116	lim->bounce_pfn = (unsigned long)(BLK_BOUNCE_ANY >> PAGE_SHIFT);
Martin K. Petersen	e475bba	2009-06-16 08:23:52 +0200	[diff] [blame]	117	lim->alignment_offset = 0;
				118	lim->io_opt = 0;
				119	lim->misaligned = 0;
				120	lim->no_cluster = 0;
				121	}
				122	EXPORT_SYMBOL(blk_set_default_limits);
				123
				124	/**
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	125	* blk_queue_make_request - define an alternate make_request function for a device
				126	* @q: the request queue for the device to be affected
				127	* @mfn: the alternate make_request function
				128	*
				129	* Description:
				130	* The normal way for &struct bios to be passed to a device
				131	* driver is for them to be collected into requests on a request
				132	* queue, and then to allow the device driver to select requests
				133	* off that queue when it is ready. This works well for many block
				134	* devices. However some block devices (typically virtual devices
				135	* such as md or lvm) do not benefit from the processing on the
				136	* request queue, and are served best by having the requests passed
				137	* directly to them. This can be achieved by providing a function
				138	* to blk_queue_make_request().
				139	*
				140	* Caveat:
				141	* The driver that does this must be able to deal appropriately
				142	* with buffers in "highmemory". This can be accomplished by either calling
				143	* __bio_kmap_atomic() to get a temporary kernel mapping, or by calling
				144	* blk_queue_bounce() to create a buffer in normal memory.
				145	**/
Jens Axboe	6728cb0	2008-01-31 13:03:55 +0100	[diff] [blame]	146	void blk_queue_make_request(struct request_queue q, make_request_fn mfn)
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	147	{
				148	/*
				149	* set defaults
				150	*/
				151	q->nr_requests = BLKDEV_MAX_RQ;
Milan Broz	0e435ac	2008-12-03 12:55:08 +0100	[diff] [blame]	152
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	153	q->make_request_fn = mfn;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	154	blk_queue_dma_alignment(q, 511);
				155	blk_queue_congestion_threshold(q);
				156	q->nr_batching = BLK_BATCH_REQ;
				157
				158	q->unplug_thresh = 4; /* hmm */
				159	q->unplug_delay = (3 * HZ) / 1000; /* 3 milliseconds */
				160	if (q->unplug_delay == 0)
				161	q->unplug_delay = 1;
				162
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	163	q->unplug_timer.function = blk_unplug_timeout;
				164	q->unplug_timer.data = (unsigned long)q;
				165
Martin K. Petersen	e475bba	2009-06-16 08:23:52 +0200	[diff] [blame]	166	blk_set_default_limits(&q->limits);
Martin K. Petersen	80ddf24	2009-09-18 22:54:37 +0200	[diff] [blame^]	167	blk_queue_max_sectors(q, SAFE_MAX_SECTORS);
Martin K. Petersen	e475bba	2009-06-16 08:23:52 +0200	[diff] [blame]	168
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	169	/*
Jens Axboe	a4e7d46	2009-07-28 09:07:29 +0200	[diff] [blame]	170	* If the caller didn't supply a lock, fall back to our embedded
				171	* per-queue locks
				172	*/
				173	if (!q->queue_lock)
				174	q->queue_lock = &q->__queue_lock;
				175
				176	/*
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	177	* by default assume old behaviour and bounce for any highmem page
				178	*/
				179	blk_queue_bounce_limit(q, BLK_BOUNCE_HIGH);
				180	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	181	EXPORT_SYMBOL(blk_queue_make_request);
				182
				183	/**
				184	* blk_queue_bounce_limit - set bounce buffer limit for queue
Tejun Heo	cd0aca2	2009-04-15 22:10:25 +0900	[diff] [blame]	185	* @q: the request queue for the device
				186	* @dma_mask: the maximum address the device can handle
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	187	*
				188	* Description:
				189	* Different hardware can have different requirements as to what pages
				190	* it can do I/O directly to. A low level driver can call
				191	* blk_queue_bounce_limit to have lower memory pages allocated as bounce
Tejun Heo	cd0aca2	2009-04-15 22:10:25 +0900	[diff] [blame]	192	* buffers for doing I/O to pages residing above @dma_mask.
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	193	**/
Tejun Heo	cd0aca2	2009-04-15 22:10:25 +0900	[diff] [blame]	194	void blk_queue_bounce_limit(struct request_queue *q, u64 dma_mask)
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	195	{
Tejun Heo	cd0aca2	2009-04-15 22:10:25 +0900	[diff] [blame]	196	unsigned long b_pfn = dma_mask >> PAGE_SHIFT;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	197	int dma = 0;
				198
				199	q->bounce_gfp = GFP_NOIO;
				200	#if BITS_PER_LONG == 64
Tejun Heo	cd0aca2	2009-04-15 22:10:25 +0900	[diff] [blame]	201	/*
				202	* Assume anything <= 4GB can be handled by IOMMU. Actually
				203	* some IOMMUs can handle everything, but I don't know of a
				204	* way to test this here.
				205	*/
				206	if (b_pfn < (min_t(u64, 0xffffffffUL, BLK_BOUNCE_HIGH) >> PAGE_SHIFT))
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	207	dma = 1;
Martin K. Petersen	025146e	2009-05-22 17:17:51 -0400	[diff] [blame]	208	q->limits.bounce_pfn = max_low_pfn;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	209	#else
Jens Axboe	6728cb0	2008-01-31 13:03:55 +0100	[diff] [blame]	210	if (b_pfn < blk_max_low_pfn)
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	211	dma = 1;
Martin K. Petersen	025146e	2009-05-22 17:17:51 -0400	[diff] [blame]	212	q->limits.bounce_pfn = b_pfn;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	213	#endif
				214	if (dma) {
				215	init_emergency_isa_pool();
				216	q->bounce_gfp = GFP_NOIO \| GFP_DMA;
Martin K. Petersen	025146e	2009-05-22 17:17:51 -0400	[diff] [blame]	217	q->limits.bounce_pfn = b_pfn;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	218	}
				219	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	220	EXPORT_SYMBOL(blk_queue_bounce_limit);
				221
				222	/**
				223	* blk_queue_max_sectors - set max sectors for a request for this queue
				224	* @q: the request queue for the device
				225	* @max_sectors: max sectors in the usual 512b unit
				226	*
				227	* Description:
				228	* Enables a low level driver to set an upper limit on the size of
				229	* received requests.
				230	**/
				231	void blk_queue_max_sectors(struct request_queue *q, unsigned int max_sectors)
				232	{
				233	if ((max_sectors << 9) < PAGE_CACHE_SIZE) {
				234	max_sectors = 1 << (PAGE_CACHE_SHIFT - 9);
Harvey Harrison	24c03d4	2008-05-01 04:35:17 -0700	[diff] [blame]	235	printk(KERN_INFO "%s: set to minimum %d\n",
				236	__func__, max_sectors);
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	237	}
				238
				239	if (BLK_DEF_MAX_SECTORS > max_sectors)
Martin K. Petersen	025146e	2009-05-22 17:17:51 -0400	[diff] [blame]	240	q->limits.max_hw_sectors = q->limits.max_sectors = max_sectors;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	241	else {
Martin K. Petersen	025146e	2009-05-22 17:17:51 -0400	[diff] [blame]	242	q->limits.max_sectors = BLK_DEF_MAX_SECTORS;
				243	q->limits.max_hw_sectors = max_sectors;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	244	}
				245	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	246	EXPORT_SYMBOL(blk_queue_max_sectors);
				247
Martin K. Petersen	ae03bf6	2009-05-22 17:17:50 -0400	[diff] [blame]	248	void blk_queue_max_hw_sectors(struct request_queue *q, unsigned int max_sectors)
				249	{
				250	if (BLK_DEF_MAX_SECTORS > max_sectors)
Martin K. Petersen	025146e	2009-05-22 17:17:51 -0400	[diff] [blame]	251	q->limits.max_hw_sectors = BLK_DEF_MAX_SECTORS;
Martin K. Petersen	ae03bf6	2009-05-22 17:17:50 -0400	[diff] [blame]	252	else
Martin K. Petersen	025146e	2009-05-22 17:17:51 -0400	[diff] [blame]	253	q->limits.max_hw_sectors = max_sectors;
Martin K. Petersen	ae03bf6	2009-05-22 17:17:50 -0400	[diff] [blame]	254	}
				255	EXPORT_SYMBOL(blk_queue_max_hw_sectors);
				256
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	257	/**
				258	* blk_queue_max_phys_segments - set max phys segments for a request for this queue
				259	* @q: the request queue for the device
				260	* @max_segments: max number of segments
				261	*
				262	* Description:
				263	* Enables a low level driver to set an upper limit on the number of
				264	* physical data segments in a request. This would be the largest sized
				265	* scatter list the driver could handle.
				266	**/
				267	void blk_queue_max_phys_segments(struct request_queue *q,
				268	unsigned short max_segments)
				269	{
				270	if (!max_segments) {
				271	max_segments = 1;
Harvey Harrison	24c03d4	2008-05-01 04:35:17 -0700	[diff] [blame]	272	printk(KERN_INFO "%s: set to minimum %d\n",
				273	__func__, max_segments);
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	274	}
				275
Martin K. Petersen	025146e	2009-05-22 17:17:51 -0400	[diff] [blame]	276	q->limits.max_phys_segments = max_segments;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	277	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	278	EXPORT_SYMBOL(blk_queue_max_phys_segments);
				279
				280	/**
				281	* blk_queue_max_hw_segments - set max hw segments for a request for this queue
				282	* @q: the request queue for the device
				283	* @max_segments: max number of segments
				284	*
				285	* Description:
				286	* Enables a low level driver to set an upper limit on the number of
				287	* hw data segments in a request. This would be the largest number of
Randy Dunlap	710027a	2008-08-19 20:13:11 +0200	[diff] [blame]	288	* address/length pairs the host adapter can actually give at once
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	289	* to the device.
				290	**/
				291	void blk_queue_max_hw_segments(struct request_queue *q,
				292	unsigned short max_segments)
				293	{
				294	if (!max_segments) {
				295	max_segments = 1;
Harvey Harrison	24c03d4	2008-05-01 04:35:17 -0700	[diff] [blame]	296	printk(KERN_INFO "%s: set to minimum %d\n",
				297	__func__, max_segments);
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	298	}
				299
Martin K. Petersen	025146e	2009-05-22 17:17:51 -0400	[diff] [blame]	300	q->limits.max_hw_segments = max_segments;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	301	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	302	EXPORT_SYMBOL(blk_queue_max_hw_segments);
				303
				304	/**
				305	* blk_queue_max_segment_size - set max segment size for blk_rq_map_sg
				306	* @q: the request queue for the device
				307	* @max_size: max size of segment in bytes
				308	*
				309	* Description:
				310	* Enables a low level driver to set an upper limit on the size of a
				311	* coalesced segment
				312	**/
				313	void blk_queue_max_segment_size(struct request_queue *q, unsigned int max_size)
				314	{
				315	if (max_size < PAGE_CACHE_SIZE) {
				316	max_size = PAGE_CACHE_SIZE;
Harvey Harrison	24c03d4	2008-05-01 04:35:17 -0700	[diff] [blame]	317	printk(KERN_INFO "%s: set to minimum %d\n",
				318	__func__, max_size);
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	319	}
				320
Martin K. Petersen	025146e	2009-05-22 17:17:51 -0400	[diff] [blame]	321	q->limits.max_segment_size = max_size;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	322	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	323	EXPORT_SYMBOL(blk_queue_max_segment_size);
				324
				325	/**
Martin K. Petersen	e1defc4	2009-05-22 17:17:49 -0400	[diff] [blame]	326	* blk_queue_logical_block_size - set logical block size for the queue
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	327	* @q: the request queue for the device
Martin K. Petersen	e1defc4	2009-05-22 17:17:49 -0400	[diff] [blame]	328	* @size: the logical block size, in bytes
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	329	*
				330	* Description:
Martin K. Petersen	e1defc4	2009-05-22 17:17:49 -0400	[diff] [blame]	331	* This should be set to the lowest possible block size that the
				332	* storage device can address. The default of 512 covers most
				333	* hardware.
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	334	**/
Martin K. Petersen	e1defc4	2009-05-22 17:17:49 -0400	[diff] [blame]	335	void blk_queue_logical_block_size(struct request_queue *q, unsigned short size)
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	336	{
Martin K. Petersen	025146e	2009-05-22 17:17:51 -0400	[diff] [blame]	337	q->limits.logical_block_size = size;
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	338
				339	if (q->limits.physical_block_size < size)
				340	q->limits.physical_block_size = size;
				341
				342	if (q->limits.io_min < q->limits.physical_block_size)
				343	q->limits.io_min = q->limits.physical_block_size;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	344	}
Martin K. Petersen	e1defc4	2009-05-22 17:17:49 -0400	[diff] [blame]	345	EXPORT_SYMBOL(blk_queue_logical_block_size);
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	346
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	347	/**
				348	* blk_queue_physical_block_size - set physical block size for the queue
				349	* @q: the request queue for the device
				350	* @size: the physical block size, in bytes
				351	*
				352	* Description:
				353	* This should be set to the lowest possible sector size that the
				354	* hardware can operate on without reverting to read-modify-write
				355	* operations.
				356	*/
				357	void blk_queue_physical_block_size(struct request_queue *q, unsigned short size)
				358	{
				359	q->limits.physical_block_size = size;
				360
				361	if (q->limits.physical_block_size < q->limits.logical_block_size)
				362	q->limits.physical_block_size = q->limits.logical_block_size;
				363
				364	if (q->limits.io_min < q->limits.physical_block_size)
				365	q->limits.io_min = q->limits.physical_block_size;
				366	}
				367	EXPORT_SYMBOL(blk_queue_physical_block_size);
				368
				369	/**
				370	* blk_queue_alignment_offset - set physical block alignment offset
				371	* @q: the request queue for the device
Randy Dunlap	8ebf975	2009-06-11 20:00:41 -0700	[diff] [blame]	372	* @offset: alignment offset in bytes
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	373	*
				374	* Description:
				375	* Some devices are naturally misaligned to compensate for things like
				376	* the legacy DOS partition table 63-sector offset. Low-level drivers
				377	* should call this function for devices whose first sector is not
				378	* naturally aligned.
				379	*/
				380	void blk_queue_alignment_offset(struct request_queue *q, unsigned int offset)
				381	{
				382	q->limits.alignment_offset =
				383	offset & (q->limits.physical_block_size - 1);
				384	q->limits.misaligned = 0;
				385	}
				386	EXPORT_SYMBOL(blk_queue_alignment_offset);
				387
				388	/**
Martin K. Petersen	7c958e3	2009-07-31 11:49:11 -0400	[diff] [blame]	389	* blk_limits_io_min - set minimum request size for a device
				390	* @limits: the queue limits
				391	* @min: smallest I/O size in bytes
				392	*
				393	* Description:
				394	* Some devices have an internal block size bigger than the reported
				395	* hardware sector size. This function can be used to signal the
				396	* smallest I/O the device can perform without incurring a performance
				397	* penalty.
				398	*/
				399	void blk_limits_io_min(struct queue_limits *limits, unsigned int min)
				400	{
				401	limits->io_min = min;
				402
				403	if (limits->io_min < limits->logical_block_size)
				404	limits->io_min = limits->logical_block_size;
				405
				406	if (limits->io_min < limits->physical_block_size)
				407	limits->io_min = limits->physical_block_size;
				408	}
				409	EXPORT_SYMBOL(blk_limits_io_min);
				410
				411	/**
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	412	* blk_queue_io_min - set minimum request size for the queue
				413	* @q: the request queue for the device
Randy Dunlap	8ebf975	2009-06-11 20:00:41 -0700	[diff] [blame]	414	* @min: smallest I/O size in bytes
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	415	*
				416	* Description:
Martin K. Petersen	7e5f5fb	2009-07-31 11:49:13 -0400	[diff] [blame]	417	* Storage devices may report a granularity or preferred minimum I/O
				418	* size which is the smallest request the device can perform without
				419	* incurring a performance penalty. For disk drives this is often the
				420	* physical block size. For RAID arrays it is often the stripe chunk
				421	* size. A properly aligned multiple of minimum_io_size is the
				422	* preferred request size for workloads where a high number of I/O
				423	* operations is desired.
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	424	*/
				425	void blk_queue_io_min(struct request_queue *q, unsigned int min)
				426	{
Martin K. Petersen	7c958e3	2009-07-31 11:49:11 -0400	[diff] [blame]	427	blk_limits_io_min(&q->limits, min);
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	428	}
				429	EXPORT_SYMBOL(blk_queue_io_min);
				430
				431	/**
Martin K. Petersen	3c5820c	2009-09-11 21:54:52 +0200	[diff] [blame]	432	* blk_limits_io_opt - set optimal request size for a device
				433	* @limits: the queue limits
				434	* @opt: smallest I/O size in bytes
				435	*
				436	* Description:
				437	* Storage devices may report an optimal I/O size, which is the
				438	* device's preferred unit for sustained I/O. This is rarely reported
				439	* for disk drives. For RAID arrays it is usually the stripe width or
				440	* the internal track size. A properly aligned multiple of
				441	* optimal_io_size is the preferred request size for workloads where
				442	* sustained throughput is desired.
				443	*/
				444	void blk_limits_io_opt(struct queue_limits *limits, unsigned int opt)
				445	{
				446	limits->io_opt = opt;
				447	}
				448	EXPORT_SYMBOL(blk_limits_io_opt);
				449
				450	/**
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	451	* blk_queue_io_opt - set optimal request size for the queue
				452	* @q: the request queue for the device
Randy Dunlap	8ebf975	2009-06-11 20:00:41 -0700	[diff] [blame]	453	* @opt: optimal request size in bytes
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	454	*
				455	* Description:
Martin K. Petersen	7e5f5fb	2009-07-31 11:49:13 -0400	[diff] [blame]	456	* Storage devices may report an optimal I/O size, which is the
				457	* device's preferred unit for sustained I/O. This is rarely reported
				458	* for disk drives. For RAID arrays it is usually the stripe width or
				459	* the internal track size. A properly aligned multiple of
				460	* optimal_io_size is the preferred request size for workloads where
				461	* sustained throughput is desired.
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	462	*/
				463	void blk_queue_io_opt(struct request_queue *q, unsigned int opt)
				464	{
Martin K. Petersen	3c5820c	2009-09-11 21:54:52 +0200	[diff] [blame]	465	blk_limits_io_opt(&q->limits, opt);
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	466	}
				467	EXPORT_SYMBOL(blk_queue_io_opt);
				468
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	469	/*
				470	* Returns the minimum that is _not_ zero, unless both are zero.
				471	*/
				472	#define min_not_zero(l, r) (l == 0) ? r : ((r == 0) ? l : min(l, r))
				473
				474	/**
				475	* blk_queue_stack_limits - inherit underlying queue limits for stacked drivers
				476	* @t: the stacking driver (top)
				477	* @b: the underlying device (bottom)
				478	**/
				479	void blk_queue_stack_limits(struct request_queue t, struct request_queue b)
				480	{
Martin K. Petersen	fef2466	2009-07-31 11:49:10 -0400	[diff] [blame]	481	blk_stack_limits(&t->limits, &b->limits, 0);
Martin K. Petersen	025146e	2009-05-22 17:17:51 -0400	[diff] [blame]	482
Neil Brown	e7e72bf	2008-05-14 16:05:54 -0700	[diff] [blame]	483	if (!t->queue_lock)
				484	WARN_ON_ONCE(1);
				485	else if (!test_bit(QUEUE_FLAG_CLUSTER, &b->queue_flags)) {
				486	unsigned long flags;
				487	spin_lock_irqsave(t->queue_lock, flags);
Nick Piggin	75ad23b	2008-04-29 14:48:33 +0200	[diff] [blame]	488	queue_flag_clear(QUEUE_FLAG_CLUSTER, t);
Neil Brown	e7e72bf	2008-05-14 16:05:54 -0700	[diff] [blame]	489	spin_unlock_irqrestore(t->queue_lock, flags);
				490	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	491	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	492	EXPORT_SYMBOL(blk_queue_stack_limits);
				493
				494	/**
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	495	* blk_stack_limits - adjust queue_limits for stacked devices
				496	* @t: the stacking driver limits (top)
Martin K. Petersen	77634f3	2009-06-09 06:23:22 +0200	[diff] [blame]	497	* @b: the underlying queue limits (bottom)
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	498	* @offset: offset to beginning of data within component device
				499	*
				500	* Description:
				501	* Merges two queue_limit structs. Returns 0 if alignment didn't
				502	* change. Returns -1 if adding the bottom device caused
				503	* misalignment.
				504	*/
				505	int blk_stack_limits(struct queue_limits t, struct queue_limits b,
				506	sector_t offset)
				507	{
				508	t->max_sectors = min_not_zero(t->max_sectors, b->max_sectors);
				509	t->max_hw_sectors = min_not_zero(t->max_hw_sectors, b->max_hw_sectors);
Martin K. Petersen	77634f3	2009-06-09 06:23:22 +0200	[diff] [blame]	510	t->bounce_pfn = min_not_zero(t->bounce_pfn, b->bounce_pfn);
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	511
				512	t->seg_boundary_mask = min_not_zero(t->seg_boundary_mask,
				513	b->seg_boundary_mask);
				514
				515	t->max_phys_segments = min_not_zero(t->max_phys_segments,
				516	b->max_phys_segments);
				517
				518	t->max_hw_segments = min_not_zero(t->max_hw_segments,
				519	b->max_hw_segments);
				520
				521	t->max_segment_size = min_not_zero(t->max_segment_size,
				522	b->max_segment_size);
				523
				524	t->logical_block_size = max(t->logical_block_size,
				525	b->logical_block_size);
				526
				527	t->physical_block_size = max(t->physical_block_size,
				528	b->physical_block_size);
				529
				530	t->io_min = max(t->io_min, b->io_min);
				531	t->no_cluster \|= b->no_cluster;
				532
				533	/* Bottom device offset aligned? */
				534	if (offset &&
				535	(offset & (b->physical_block_size - 1)) != b->alignment_offset) {
				536	t->misaligned = 1;
				537	return -1;
				538	}
				539
				540	/* If top has no alignment offset, inherit from bottom */
				541	if (!t->alignment_offset)
				542	t->alignment_offset =
				543	b->alignment_offset & (b->physical_block_size - 1);
				544
				545	/* Top device aligned on logical block boundary? */
				546	if (t->alignment_offset & (t->logical_block_size - 1)) {
				547	t->misaligned = 1;
				548	return -1;
				549	}
				550
Martin K. Petersen	70dd5bf	2009-07-31 11:49:12 -0400	[diff] [blame]	551	/* Find lcm() of optimal I/O size */
				552	if (t->io_opt && b->io_opt)
				553	t->io_opt = (t->io_opt * b->io_opt) / gcd(t->io_opt, b->io_opt);
				554	else if (b->io_opt)
				555	t->io_opt = b->io_opt;
				556
				557	/* Verify that optimal I/O size is a multiple of io_min */
				558	if (t->io_min && t->io_opt % t->io_min)
				559	return -1;
				560
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	561	return 0;
				562	}
Mike Snitzer	5d85d32	2009-05-28 11:04:53 +0200	[diff] [blame]	563	EXPORT_SYMBOL(blk_stack_limits);
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	564
				565	/**
				566	* disk_stack_limits - adjust queue limits for stacked drivers
Martin K. Petersen	77634f3	2009-06-09 06:23:22 +0200	[diff] [blame]	567	* @disk: MD/DM gendisk (top)
Martin K. Petersen	c72758f	2009-05-22 17:17:53 -0400	[diff] [blame]	568	* @bdev: the underlying block device (bottom)
				569	* @offset: offset to beginning of data within component device
				570	*
				571	* Description:
				572	* Merges the limits for two queues. Returns 0 if alignment
				573	* didn't change. Returns -1 if adding the bottom device caused
				574	* misalignment.
				575	*/
				576	void disk_stack_limits(struct gendisk disk, struct block_device bdev,
				577	sector_t offset)
				578	{
				579	struct request_queue *t = disk->queue;
				580	struct request_queue *b = bdev_get_queue(bdev);
				581
				582	offset += get_start_sect(bdev) << 9;
				583
				584	if (blk_stack_limits(&t->limits, &b->limits, offset) < 0) {
				585	char top[BDEVNAME_SIZE], bottom[BDEVNAME_SIZE];
				586
				587	disk_name(disk, 0, top);
				588	bdevname(bdev, bottom);
				589
				590	printk(KERN_NOTICE "%s: Warning: Device %s is misaligned\n",
				591	top, bottom);
				592	}
				593
				594	if (!t->queue_lock)
				595	WARN_ON_ONCE(1);
				596	else if (!test_bit(QUEUE_FLAG_CLUSTER, &b->queue_flags)) {
				597	unsigned long flags;
				598
				599	spin_lock_irqsave(t->queue_lock, flags);
				600	if (!test_bit(QUEUE_FLAG_CLUSTER, &b->queue_flags))
				601	queue_flag_clear(QUEUE_FLAG_CLUSTER, t);
				602	spin_unlock_irqrestore(t->queue_lock, flags);
				603	}
				604	}
				605	EXPORT_SYMBOL(disk_stack_limits);
				606
				607	/**
Tejun Heo	e3790c7	2008-03-04 11:18:17 +0100	[diff] [blame]	608	* blk_queue_dma_pad - set pad mask
				609	* @q: the request queue for the device
				610	* @mask: pad mask
				611	*
FUJITA Tomonori	27f8221	2008-07-04 09:30:03 +0200	[diff] [blame]	612	* Set dma pad mask.
Tejun Heo	e3790c7	2008-03-04 11:18:17 +0100	[diff] [blame]	613	*
FUJITA Tomonori	27f8221	2008-07-04 09:30:03 +0200	[diff] [blame]	614	* Appending pad buffer to a request modifies the last entry of a
				615	* scatter list such that it includes the pad buffer.
Tejun Heo	e3790c7	2008-03-04 11:18:17 +0100	[diff] [blame]	616	**/
				617	void blk_queue_dma_pad(struct request_queue *q, unsigned int mask)
				618	{
				619	q->dma_pad_mask = mask;
				620	}
				621	EXPORT_SYMBOL(blk_queue_dma_pad);
				622
				623	/**
FUJITA Tomonori	27f8221	2008-07-04 09:30:03 +0200	[diff] [blame]	624	* blk_queue_update_dma_pad - update pad mask
				625	* @q: the request queue for the device
				626	* @mask: pad mask
				627	*
				628	* Update dma pad mask.
				629	*
				630	* Appending pad buffer to a request modifies the last entry of a
				631	* scatter list such that it includes the pad buffer.
				632	**/
				633	void blk_queue_update_dma_pad(struct request_queue *q, unsigned int mask)
				634	{
				635	if (mask > q->dma_pad_mask)
				636	q->dma_pad_mask = mask;
				637	}
				638	EXPORT_SYMBOL(blk_queue_update_dma_pad);
				639
				640	/**
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	641	* blk_queue_dma_drain - Set up a drain buffer for excess dma.
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	642	* @q: the request queue for the device
Tejun Heo	2fb98e8	2008-02-19 11:36:53 +0100	[diff] [blame]	643	* @dma_drain_needed: fn which returns non-zero if drain is necessary
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	644	* @buf: physically contiguous buffer
				645	* @size: size of the buffer in bytes
				646	*
				647	* Some devices have excess DMA problems and can't simply discard (or
				648	* zero fill) the unwanted piece of the transfer. They have to have a
				649	* real area of memory to transfer it into. The use case for this is
				650	* ATAPI devices in DMA mode. If the packet command causes a transfer
				651	* bigger than the transfer size some HBAs will lock up if there
				652	* aren't DMA elements to contain the excess transfer. What this API
				653	* does is adjust the queue so that the buf is always appended
				654	* silently to the scatterlist.
				655	*
				656	* Note: This routine adjusts max_hw_segments to make room for
				657	* appending the drain buffer. If you call
				658	* blk_queue_max_hw_segments() or blk_queue_max_phys_segments() after
				659	* calling this routine, you must set the limit to one fewer than your
				660	* device can support otherwise there won't be room for the drain
				661	* buffer.
				662	*/
Harvey Harrison	448da4d	2008-03-04 11:30:18 +0100	[diff] [blame]	663	int blk_queue_dma_drain(struct request_queue *q,
Tejun Heo	2fb98e8	2008-02-19 11:36:53 +0100	[diff] [blame]	664	dma_drain_needed_fn *dma_drain_needed,
				665	void *buf, unsigned int size)
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	666	{
Martin K. Petersen	ae03bf6	2009-05-22 17:17:50 -0400	[diff] [blame]	667	if (queue_max_hw_segments(q) < 2 \|\| queue_max_phys_segments(q) < 2)
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	668	return -EINVAL;
				669	/* make room for appending the drain */
Martin K. Petersen	ae03bf6	2009-05-22 17:17:50 -0400	[diff] [blame]	670	blk_queue_max_hw_segments(q, queue_max_hw_segments(q) - 1);
				671	blk_queue_max_phys_segments(q, queue_max_phys_segments(q) - 1);
Tejun Heo	2fb98e8	2008-02-19 11:36:53 +0100	[diff] [blame]	672	q->dma_drain_needed = dma_drain_needed;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	673	q->dma_drain_buffer = buf;
				674	q->dma_drain_size = size;
				675
				676	return 0;
				677	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	678	EXPORT_SYMBOL_GPL(blk_queue_dma_drain);
				679
				680	/**
				681	* blk_queue_segment_boundary - set boundary rules for segment merging
				682	* @q: the request queue for the device
				683	* @mask: the memory boundary mask
				684	**/
				685	void blk_queue_segment_boundary(struct request_queue *q, unsigned long mask)
				686	{
				687	if (mask < PAGE_CACHE_SIZE - 1) {
				688	mask = PAGE_CACHE_SIZE - 1;
Harvey Harrison	24c03d4	2008-05-01 04:35:17 -0700	[diff] [blame]	689	printk(KERN_INFO "%s: set to minimum %lx\n",
				690	__func__, mask);
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	691	}
				692
Martin K. Petersen	025146e	2009-05-22 17:17:51 -0400	[diff] [blame]	693	q->limits.seg_boundary_mask = mask;
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	694	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	695	EXPORT_SYMBOL(blk_queue_segment_boundary);
				696
				697	/**
				698	* blk_queue_dma_alignment - set dma length and memory alignment
				699	* @q: the request queue for the device
				700	* @mask: alignment mask
				701	*
				702	* description:
Randy Dunlap	710027a	2008-08-19 20:13:11 +0200	[diff] [blame]	703	* set required memory and length alignment for direct dma transactions.
Alan Cox	8feb4d2	2009-04-01 15:01:39 +0100	[diff] [blame]	704	* this is used when building direct io requests for the queue.
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	705	*
				706	**/
				707	void blk_queue_dma_alignment(struct request_queue *q, int mask)
				708	{
				709	q->dma_alignment = mask;
				710	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	711	EXPORT_SYMBOL(blk_queue_dma_alignment);
				712
				713	/**
				714	* blk_queue_update_dma_alignment - update dma length and memory alignment
				715	* @q: the request queue for the device
				716	* @mask: alignment mask
				717	*
				718	* description:
Randy Dunlap	710027a	2008-08-19 20:13:11 +0200	[diff] [blame]	719	* update required memory and length alignment for direct dma transactions.
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	720	* If the requested alignment is larger than the current alignment, then
				721	* the current queue alignment is updated to the new value, otherwise it
				722	* is left alone. The design of this is to allow multiple objects
				723	* (driver, device, transport etc) to set their respective
				724	* alignments without having them interfere.
				725	*
				726	**/
				727	void blk_queue_update_dma_alignment(struct request_queue *q, int mask)
				728	{
				729	BUG_ON(mask > PAGE_SIZE);
				730
				731	if (mask > q->dma_alignment)
				732	q->dma_alignment = mask;
				733	}
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	734	EXPORT_SYMBOL(blk_queue_update_dma_alignment);
				735
Harvey Harrison	aeb3d3a	2008-08-28 09:27:42 +0200	[diff] [blame]	736	static int __init blk_settings_init(void)
Jens Axboe	86db1e2	2008-01-29 14:53:40 +0100	[diff] [blame]	737	{
				738	blk_max_low_pfn = max_low_pfn - 1;
				739	blk_max_pfn = max_pfn - 1;
				740	return 0;
				741	}
				742	subsys_initcall(blk_settings_init);