On 05/25/2017 11:24 AM, Bart Van Assche wrote:
> On Thu, 2017-05-25 at 17:09 +0800, Ming Lei wrote:
>> Another big issue is that 'srcu_struct' is very big, which shouldn't
>> be embedded into hctx, since we only have one real user of
>> BLK_MQ_F_BLOCKING.
>>
>> So I will fix that too.
> 
> Hello Ming,
> 
> Is something like the (untested) patch below perhaps what you had in mind?
> 
> Subject: [PATCH] blk-mq: Reduce blk_mq_hw_ctx size
> 
> Since the srcu structure is rather large (184 bytes on an x86-64
> system), only allocate it if needed.
> 
> Reported-by: Ming Lei <[email protected]>
> ---
>  block/blk-mq.c         | 13 ++++++++++++-
>  include/linux/blk-mq.h |  5 +++--
>  2 files changed, 15 insertions(+), 3 deletions(-)
> 
> diff --git a/block/blk-mq.c b/block/blk-mq.c
> index 1e330de4e3c5..15b7d4077638 100644
> --- a/block/blk-mq.c
> +++ b/block/blk-mq.c
> @@ -2233,6 +2233,17 @@ struct request_queue *blk_mq_init_queue(struct blk_mq_tag_set *set)
>  }
>  EXPORT_SYMBOL(blk_mq_init_queue);
>  
> +static int blk_mq_hw_ctx_size(struct request_queue *q)
> +{
> +     BUILD_BUG_ON(ALIGN(offsetof(struct blk_mq_hw_ctx, queue_rq_srcu) +
> +             sizeof(((struct blk_mq_hw_ctx *)NULL)->queue_rq_srcu), 64) !=
> +             sizeof(struct blk_mq_hw_ctx));
> +
> +     return q->tag_set->flags & BLK_MQ_F_BLOCKING ?
> +             sizeof(struct blk_mq_hw_ctx) :
> +             offsetof(struct blk_mq_hw_ctx, queue_rq_srcu);
> +}
> +
>  static void blk_mq_realloc_hw_ctxs(struct blk_mq_tag_set *set,
>                                               struct request_queue *q)
>  {
> @@ -2247,7 +2258,7 @@ static void blk_mq_realloc_hw_ctxs(struct blk_mq_tag_set *set,
>                       continue;
>  
>               node = blk_mq_hw_queue_to_node(q->mq_map, i);
> -             hctxs[i] = kzalloc_node(sizeof(struct blk_mq_hw_ctx),
> +             hctxs[i] = kzalloc_node(blk_mq_hw_ctx_size(q),
>                                       GFP_KERNEL, node);
>               if (!hctxs[i])
>                       break;
> diff --git a/include/linux/blk-mq.h b/include/linux/blk-mq.h
> index c0d59330b5e0..8467e1f83524 100644
> --- a/include/linux/blk-mq.h
> +++ b/include/linux/blk-mq.h
> @@ -39,8 +39,6 @@ struct blk_mq_hw_ctx {
>       struct blk_mq_tags      *tags;
>       struct blk_mq_tags      *sched_tags;
>  
> -     struct srcu_struct      queue_rq_srcu;
> -
>       unsigned long           queued;
>       unsigned long           run;
>  #define BLK_MQ_MAX_DISPATCH_ORDER    7
> @@ -62,6 +60,9 @@ struct blk_mq_hw_ctx {
>       struct dentry           *debugfs_dir;
>       struct dentry           *sched_debugfs_dir;
>  #endif
> +
> +     /* Must be the last member - see also blk_mq_hw_ctx_size(). */
> +     struct srcu_struct      queue_rq_srcu;
>  };

Why not make it

        /* Must be the last member - see also blk_mq_hw_ctx_size(). */
        struct srcu_struct      queue_rq_srcu[0];

and fix up blk_mq_hw_ctx_size() to match:

/*
 * Return the number of bytes to allocate for one blk_mq_hw_ctx of @q.
 *
 * The base size is sizeof(struct blk_mq_hw_ctx).  When the queue's tag set
 * has BLK_MQ_F_BLOCKING set, room for one struct srcu_struct is added on
 * top of that.
 */
static int blk_mq_hw_ctx_size(struct request_queue *q)
{
        const int base = sizeof(struct blk_mq_hw_ctx);

        /* Without BLK_MQ_F_BLOCKING no extra srcu_struct space is needed. */
        if (!(q->tag_set->flags & BLK_MQ_F_BLOCKING))
                return base;

        return base + sizeof(struct srcu_struct);
}

I think that'd be cleaner. Keep the end-of-struct checking, just to be
on the safe side.

Neither one is super pretty, though, and neither fixes the fact that
the srcu_struct makes up _half_ of the blk_mq_hw_ctx in total.

-- 
Jens Axboe

Reply via email to