lib/sbitmap: convert shallow_depth from one word to the whole sbitmap (42e6c6ce) · Commits · git / linux-net

block/bfq-iosched.c

+16 −19

Original line number	Diff line number	Diff line
		@@ -694,17 +694,13 @@ static void bfq_limit_depth(blk_opf_t opf, struct blk_mq_alloc_data *data)
		{
		struct bfq_data *bfqd = data->q->elevator->elevator_data;
		struct bfq_io_cq *bic = bfq_bic_lookup(data->q);
		int depth;
		unsigned limit = data->q->nr_requests;
		unsigned int act_idx;
		unsigned int limit, act_idx;

		/* Sync reads have full depth available */
		if (op_is_sync(opf) && !op_is_write(opf)) {
		depth = 0;
		} else {
		depth = bfqd->word_depths[!!bfqd->wr_busy_queues][op_is_sync(opf)];
		limit = (limit * depth) >> bfqd->full_depth_shift;
		}
		if (op_is_sync(opf) && !op_is_write(opf))
		limit = data->q->nr_requests;
		else
		limit = bfqd->async_depths[!!bfqd->wr_busy_queues][op_is_sync(opf)];

		for (act_idx = 0; bic && act_idx < bfqd->num_actuators; act_idx++) {
		/* Fast path to check if bfqq is already allocated. */
		@@ -718,14 +714,16 @@ static void bfq_limit_depth(blk_opf_t opf, struct blk_mq_alloc_data *data)
		* available requests and thus starve other entities.
		*/
		if (bfqq_request_over_limit(bfqd, bic, opf, act_idx, limit)) {
		depth = 1;
		limit = 1;
		break;
		}
		}

		bfq_log(bfqd, "[%s] wr_busy %d sync %d depth %u",
		__func__, bfqd->wr_busy_queues, op_is_sync(opf), depth);
		if (depth)
		data->shallow_depth = depth;
		__func__, bfqd->wr_busy_queues, op_is_sync(opf), limit);

		if (limit < data->q->nr_requests)
		data->shallow_depth = limit;
		}

		static struct bfq_queue *
		@@ -7114,9 +7112,8 @@ void bfq_put_async_queues(struct bfq_data *bfqd, struct bfq_group *bfqg)
		*/
		static void bfq_update_depths(struct bfq_data *bfqd, struct sbitmap_queue *bt)
		{
		unsigned int depth = 1U << bt->sb.shift;
		unsigned int nr_requests = bfqd->queue->nr_requests;

		bfqd->full_depth_shift = bt->sb.shift;
		/*
		* In-word depths if no bfq_queue is being weight-raised:
		* leaving 25% of tags only for sync reads.
		@@ -7128,13 +7125,13 @@ static void bfq_update_depths(struct bfq_data *bfqd, struct sbitmap_queue *bt)
		* limit 'something'.
		*/
		/* no more than 50% of tags for async I/O */
		bfqd->word_depths[0][0] = max(depth >> 1, 1U);
		bfqd->async_depths[0][0] = max(nr_requests >> 1, 1U);
		/*
		* no more than 75% of tags for sync writes (25% extra tags
		* w.r.t. async I/O, to prevent async I/O from starving sync
		* writes)
		*/
		bfqd->word_depths[0][1] = max((depth * 3) >> 2, 1U);
		bfqd->async_depths[0][1] = max((nr_requests * 3) >> 2, 1U);

		/*
		* In-word depths in case some bfq_queue is being weight-
		@@ -7144,9 +7141,9 @@ static void bfq_update_depths(struct bfq_data *bfqd, struct sbitmap_queue *bt)
		* shortage.
		*/
		/* no more than ~18% of tags for async I/O */
		bfqd->word_depths[1][0] = max((depth * 3) >> 4, 1U);
		bfqd->async_depths[1][0] = max((nr_requests * 3) >> 4, 1U);
		/* no more than ~37% of tags for sync writes (~20% extra tags) */
		bfqd->word_depths[1][1] = max((depth * 6) >> 4, 1U);
		bfqd->async_depths[1][1] = max((nr_requests * 6) >> 4, 1U);
		}

		static void bfq_depth_updated(struct blk_mq_hw_ctx *hctx)

block/bfq-iosched.h

+1 −2

Original line number	Diff line number	Diff line
		@@ -813,8 +813,7 @@ struct bfq_data {
		* Depth limits used in bfq_limit_depth (see comments on the
		* function)
		*/
		unsigned int word_depths[2][2];
		unsigned int full_depth_shift;
		unsigned int async_depths[2][2];

		/*
		* Number of independent actuators. This is equal to 1 in

block/kyber-iosched.c

+2 −7

Original line number	Diff line number	Diff line
		@@ -157,10 +157,7 @@ struct kyber_queue_data {
		*/
		struct sbitmap_queue domain_tokens[KYBER_NUM_DOMAINS];

		/*
		* Async request percentage, converted to per-word depth for
		* sbitmap_get_shallow().
		*/
		/* Number of allowed async requests. */
		unsigned int async_depth;

		struct kyber_cpu_latency __percpu *cpu_latency;
		@@ -447,10 +444,8 @@ static void kyber_depth_updated(struct blk_mq_hw_ctx *hctx)
		{
		struct kyber_queue_data *kqd = hctx->queue->elevator->elevator_data;
		struct blk_mq_tags *tags = hctx->sched_tags;
		unsigned int shift = tags->bitmap_tags.sb.shift;

		kqd->async_depth = (1U << shift) * KYBER_ASYNC_PERCENT / 100U;

		kqd->async_depth = hctx->queue->nr_requests * KYBER_ASYNC_PERCENT / 100U;
		sbitmap_queue_min_shallow_depth(&tags->bitmap_tags, kqd->async_depth);
		}

block/mq-deadline.c

+1 −15

Original line number	Diff line number	Diff line
		@@ -487,20 +487,6 @@ static struct request *dd_dispatch_request(struct blk_mq_hw_ctx *hctx)
		return rq;
		}

		/*
		* 'depth' is a number in the range 1..INT_MAX representing a number of
		* requests. Scale it with a factor (1 << bt->sb.shift) / q->nr_requests since
		* 1..(1 << bt->sb.shift) is the range expected by sbitmap_get_shallow().
		* Values larger than q->nr_requests have the same effect as q->nr_requests.
		*/
		static int dd_to_word_depth(struct blk_mq_hw_ctx *hctx, unsigned int qdepth)
		{
		struct sbitmap_queue *bt = &hctx->sched_tags->bitmap_tags;
		const unsigned int nrr = hctx->queue->nr_requests;

		return ((qdepth << bt->sb.shift) + nrr - 1) / nrr;
		}

		/*
		* Called by __blk_mq_alloc_request(). The shallow_depth value set by this
		* function is used by __blk_mq_get_tag().
		@@ -517,7 +503,7 @@ static void dd_limit_depth(blk_opf_t opf, struct blk_mq_alloc_data *data)
		* Throttle asynchronous requests and writes such that these requests
		* do not block the allocation of synchronous requests.
		*/
		data->shallow_depth = dd_to_word_depth(data->hctx, dd->async_depth);
		data->shallow_depth = dd->async_depth;
		}

		/* Called by blk_mq_update_nr_requests(). */

include/linux/sbitmap.h

+3 −3

Original line number	Diff line number	Diff line
		@@ -213,12 +213,12 @@ int sbitmap_get(struct sbitmap *sb);
		* sbitmap_get_shallow() - Try to allocate a free bit from a &struct sbitmap,
		* limiting the depth used from each word.
		* @sb: Bitmap to allocate from.
		* @shallow_depth: The maximum number of bits to allocate from a single word.
		* @shallow_depth: The maximum number of bits to allocate from the bitmap.
		*
		* This rather specific operation allows for having multiple users with
		* different allocation limits. E.g., there can be a high-priority class that
		* uses sbitmap_get() and a low-priority class that uses sbitmap_get_shallow()
		* with a @shallow_depth of (1 << (@sb->shift - 1)). Then, the low-priority
		* with a @shallow_depth of (sb->depth >> 1). Then, the low-priority
		* class can only allocate half of the total bits in the bitmap, preventing it
		* from starving out the high-priority class.
		*
		@@ -478,7 +478,7 @@ unsigned long __sbitmap_queue_get_batch(struct sbitmap_queue *sbq, int nr_tags,
		* sbitmap_queue, limiting the depth used from each word, with preemption
		* already disabled.
		* @sbq: Bitmap queue to allocate from.
		* @shallow_depth: The maximum number of bits to allocate from a single word.
		* @shallow_depth: The maximum number of bits to allocate from the queue.
		* See sbitmap_get_shallow().
		*
		* If you call this, make sure to call sbitmap_queue_min_shallow_depth() after