Re: [PATCH v6 5/9] drm/amdgpu: create context space for usermode queue
On Fri, Sep 29, 2023 at 1:50 PM Shashank Sharma wrote: > > > On 20/09/2023 17:21, Alex Deucher wrote: > > On Fri, Sep 8, 2023 at 12:45 PM Shashank Sharma > > wrote: > >> The FW expects us to allocate at least one page as context > >> space to process gang, process, GDS and FW related work. > >> This patch creates a joint object for the same, and calculates > >> GPU space offsets of these spaces. > >> > >> V1: Addressed review comments on RFC patch: > >> Alex: Make this function IP specific > >> > >> V2: Addressed review comments from Christian > >> - Allocate only one object for total FW space, and calculate > >>offsets for each of these objects. > >> > >> V3: Integration with doorbell manager > >> > >> V4: Review comments: > >> - Remove shadow from FW space list from cover letter (Alex) > >> - Alignment of macro (Luben) > >> > >> V5: Merged patches 5 and 6 into this single patch > >> Addressed review comments: > >> - Use lower_32_bits instead of mask (Christian) > >> - gfx_v11_0 instead of gfx_v11 in function names (Alex) > >> - Shadow and GDS objects are now coming from userspace (Christian, > >>Alex) > >> > >> V6: > >> - Add a comment to replace amdgpu_bo_create_kernel() with > >>amdgpu_bo_create() during fw_ctx object creation (Christian). > >> - Move proc_ctx_gpu_addr, gang_ctx_gpu_addr and fw_ctx_gpu_addr out > >>of generic queue structure and make it gen11 specific (Alex). > >> > >> Cc: Alex Deucher > >> Cc: Christian Koenig > >> Signed-off-by: Shashank Sharma > >> Signed-off-by: Arvind Yadav > >> --- > >> drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c| 61 +++ > >> .../gpu/drm/amd/include/amdgpu_userqueue.h| 1 + > >> 2 files changed, 62 insertions(+) > >> > >> diff --git a/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c > >> b/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c > >> index 6760abda08df..8ffb5dee72a9 100644 > >> --- a/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c > >> +++ b/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c > >> @@ -61,6 +61,9 @@ > >> #define regCGTT_WD_CLK_CTRL_BASE_IDX 1 > >> #define regRLC_RLCS_BOOTLOAD_STATUS_gc_11_0_1 0x4e7e > >> #define regRLC_RLCS_BOOTLOAD_STATUS_gc_11_0_1_BASE_IDX 1 > >> +#define AMDGPU_USERQ_PROC_CTX_SZ PAGE_SIZE > >> +#define AMDGPU_USERQ_GANG_CTX_SZ PAGE_SIZE > >> +#define AMDGPU_USERQ_FW_CTX_SZ PAGE_SIZE > >> > >> MODULE_FIRMWARE("amdgpu/gc_11_0_0_pfp.bin"); > >> MODULE_FIRMWARE("amdgpu/gc_11_0_0_me.bin"); > >> @@ -6424,6 +6427,56 @@ const struct amdgpu_ip_block_version > >> gfx_v11_0_ip_block = > >> .funcs = _v11_0_ip_funcs, > >> }; > >> > >> +static void gfx_v11_0_userq_destroy_ctx_space(struct amdgpu_userq_mgr > >> *uq_mgr, > >> + struct amdgpu_usermode_queue > >> *queue) > >> +{ > >> + struct amdgpu_userq_obj *ctx = >fw_obj; > >> + > >> + amdgpu_bo_free_kernel(>obj, >gpu_addr, >cpu_ptr); > >> +} > >> + > >> +static int gfx_v11_0_userq_create_ctx_space(struct amdgpu_userq_mgr > >> *uq_mgr, > >> + struct amdgpu_usermode_queue > >> *queue, > >> + struct > >> drm_amdgpu_userq_mqd_gfx_v11_0 *mqd_user) > >> +{ > >> + struct amdgpu_device *adev = uq_mgr->adev; > >> + struct amdgpu_userq_obj *ctx = >fw_obj; > >> + struct v11_gfx_mqd *mqd = queue->mqd.cpu_ptr; > >> + uint64_t fw_ctx_gpu_addr; > >> + int r, size; > >> + > >> + /* > >> +* The FW expects at least one page space allocated for > >> +* process ctx, gang ctx and fw ctx each. Create an object > >> +* for the same. > >> +*/ > >> + size = AMDGPU_USERQ_PROC_CTX_SZ + AMDGPU_USERQ_FW_CTX_SZ + > >> + AMDGPU_USERQ_GANG_CTX_SZ; > >> + r = amdgpu_bo_create_kernel(adev, size, PAGE_SIZE, > >> + AMDGPU_GEM_DOMAIN_GTT, > >> + >obj, > >> + >gpu_addr, > >> + >cpu_ptr); > >> + if (r) { > >> + DRM_ERROR("Failed to allocate ctx space bo for userqueue, > >> err:%d\n", r); > >> + return r; > >> + } > >> + > >> + fw_ctx_gpu_addr = ctx->gpu_addr + AMDGPU_USERQ_PROC_CTX_SZ + > >> + AMDGPU_USERQ_GANG_CTX_SZ; > >> + mqd->fw_work_area_base_lo = lower_32_bits(fw_ctx_gpu_addr); > >> + mqd->fw_work_area_base_lo = upper_32_bits(fw_ctx_gpu_addr); > >> + > >> + /* Shadow and GDS objects come directly from userspace */ > >> + mqd->shadow_base_lo = lower_32_bits(mqd_user->shadow_va); > >> + mqd->shadow_base_hi = upper_32_bits(mqd_user->shadow_va); > >> + > >> + mqd->gds_bkup_base_lo = lower_32_bits(mqd_user->gds_va); > >> + mqd->gds_bkup_base_hi = upper_32_bits(mqd_user->gds_va); > >> + > >> + return 0; > >> +} > >> + > >>
Re: [PATCH v6 5/9] drm/amdgpu: create context space for usermode queue
On 20/09/2023 17:21, Alex Deucher wrote: On Fri, Sep 8, 2023 at 12:45 PM Shashank Sharma wrote: The FW expects us to allocate at least one page as context space to process gang, process, GDS and FW related work. This patch creates a joint object for the same, and calculates GPU space offsets of these spaces. V1: Addressed review comments on RFC patch: Alex: Make this function IP specific V2: Addressed review comments from Christian - Allocate only one object for total FW space, and calculate offsets for each of these objects. V3: Integration with doorbell manager V4: Review comments: - Remove shadow from FW space list from cover letter (Alex) - Alignment of macro (Luben) V5: Merged patches 5 and 6 into this single patch Addressed review comments: - Use lower_32_bits instead of mask (Christian) - gfx_v11_0 instead of gfx_v11 in function names (Alex) - Shadow and GDS objects are now coming from userspace (Christian, Alex) V6: - Add a comment to replace amdgpu_bo_create_kernel() with amdgpu_bo_create() during fw_ctx object creation (Christian). - Move proc_ctx_gpu_addr, gang_ctx_gpu_addr and fw_ctx_gpu_addr out of generic queue structure and make it gen11 specific (Alex). Cc: Alex Deucher Cc: Christian Koenig Signed-off-by: Shashank Sharma Signed-off-by: Arvind Yadav --- drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c| 61 +++ .../gpu/drm/amd/include/amdgpu_userqueue.h| 1 + 2 files changed, 62 insertions(+) diff --git a/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c b/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c index 6760abda08df..8ffb5dee72a9 100644 --- a/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c +++ b/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c @@ -61,6 +61,9 @@ #define regCGTT_WD_CLK_CTRL_BASE_IDX 1 #define regRLC_RLCS_BOOTLOAD_STATUS_gc_11_0_1 0x4e7e #define regRLC_RLCS_BOOTLOAD_STATUS_gc_11_0_1_BASE_IDX 1 +#define AMDGPU_USERQ_PROC_CTX_SZ PAGE_SIZE +#define AMDGPU_USERQ_GANG_CTX_SZ PAGE_SIZE +#define AMDGPU_USERQ_FW_CTX_SZ PAGE_SIZE MODULE_FIRMWARE("amdgpu/gc_11_0_0_pfp.bin"); MODULE_FIRMWARE("amdgpu/gc_11_0_0_me.bin"); @@ -6424,6 +6427,56 @@ const struct amdgpu_ip_block_version gfx_v11_0_ip_block = .funcs = _v11_0_ip_funcs, }; +static void gfx_v11_0_userq_destroy_ctx_space(struct amdgpu_userq_mgr *uq_mgr, + struct amdgpu_usermode_queue *queue) +{ + struct amdgpu_userq_obj *ctx = >fw_obj; + + amdgpu_bo_free_kernel(>obj, >gpu_addr, >cpu_ptr); +} + +static int gfx_v11_0_userq_create_ctx_space(struct amdgpu_userq_mgr *uq_mgr, + struct amdgpu_usermode_queue *queue, + struct drm_amdgpu_userq_mqd_gfx_v11_0 *mqd_user) +{ + struct amdgpu_device *adev = uq_mgr->adev; + struct amdgpu_userq_obj *ctx = >fw_obj; + struct v11_gfx_mqd *mqd = queue->mqd.cpu_ptr; + uint64_t fw_ctx_gpu_addr; + int r, size; + + /* +* The FW expects at least one page space allocated for +* process ctx, gang ctx and fw ctx each. Create an object +* for the same. +*/ + size = AMDGPU_USERQ_PROC_CTX_SZ + AMDGPU_USERQ_FW_CTX_SZ + + AMDGPU_USERQ_GANG_CTX_SZ; + r = amdgpu_bo_create_kernel(adev, size, PAGE_SIZE, + AMDGPU_GEM_DOMAIN_GTT, + >obj, + >gpu_addr, + >cpu_ptr); + if (r) { + DRM_ERROR("Failed to allocate ctx space bo for userqueue, err:%d\n", r); + return r; + } + + fw_ctx_gpu_addr = ctx->gpu_addr + AMDGPU_USERQ_PROC_CTX_SZ + + AMDGPU_USERQ_GANG_CTX_SZ; + mqd->fw_work_area_base_lo = lower_32_bits(fw_ctx_gpu_addr); + mqd->fw_work_area_base_lo = upper_32_bits(fw_ctx_gpu_addr); + + /* Shadow and GDS objects come directly from userspace */ + mqd->shadow_base_lo = lower_32_bits(mqd_user->shadow_va); + mqd->shadow_base_hi = upper_32_bits(mqd_user->shadow_va); + + mqd->gds_bkup_base_lo = lower_32_bits(mqd_user->gds_va); + mqd->gds_bkup_base_hi = upper_32_bits(mqd_user->gds_va); + + return 0; +} + static int gfx_v11_0_userq_mqd_create(struct amdgpu_userq_mgr *uq_mgr, struct drm_amdgpu_userq_in *args_in, struct amdgpu_usermode_queue *queue) @@ -6480,6 +6533,13 @@ static int gfx_v11_0_userq_mqd_create(struct amdgpu_userq_mgr *uq_mgr, goto free_mqd; } + /* Create BO for FW operations */ + r = gfx_v11_0_userq_create_ctx_space(uq_mgr, queue, _user); + if (r) { + DRM_ERROR("Failed to allocate BO for userqueue (%d)", r); + goto free_mqd; + } + return 0; free_mqd: @@
Re: [PATCH v6 5/9] drm/amdgpu: create context space for usermode queue
On Fri, Sep 8, 2023 at 12:45 PM Shashank Sharma wrote: > > The FW expects us to allocate at least one page as context > space to process gang, process, GDS and FW related work. > This patch creates a joint object for the same, and calculates > GPU space offsets of these spaces. > > V1: Addressed review comments on RFC patch: > Alex: Make this function IP specific > > V2: Addressed review comments from Christian > - Allocate only one object for total FW space, and calculate > offsets for each of these objects. > > V3: Integration with doorbell manager > > V4: Review comments: > - Remove shadow from FW space list from cover letter (Alex) > - Alignment of macro (Luben) > > V5: Merged patches 5 and 6 into this single patch > Addressed review comments: > - Use lower_32_bits instead of mask (Christian) > - gfx_v11_0 instead of gfx_v11 in function names (Alex) > - Shadow and GDS objects are now coming from userspace (Christian, > Alex) > > V6: > - Add a comment to replace amdgpu_bo_create_kernel() with > amdgpu_bo_create() during fw_ctx object creation (Christian). > - Move proc_ctx_gpu_addr, gang_ctx_gpu_addr and fw_ctx_gpu_addr out > of generic queue structure and make it gen11 specific (Alex). > > Cc: Alex Deucher > Cc: Christian Koenig > Signed-off-by: Shashank Sharma > Signed-off-by: Arvind Yadav > --- > drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c| 61 +++ > .../gpu/drm/amd/include/amdgpu_userqueue.h| 1 + > 2 files changed, 62 insertions(+) > > diff --git a/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c > b/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c > index 6760abda08df..8ffb5dee72a9 100644 > --- a/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c > +++ b/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c > @@ -61,6 +61,9 @@ > #define regCGTT_WD_CLK_CTRL_BASE_IDX 1 > #define regRLC_RLCS_BOOTLOAD_STATUS_gc_11_0_1 0x4e7e > #define regRLC_RLCS_BOOTLOAD_STATUS_gc_11_0_1_BASE_IDX 1 > +#define AMDGPU_USERQ_PROC_CTX_SZ PAGE_SIZE > +#define AMDGPU_USERQ_GANG_CTX_SZ PAGE_SIZE > +#define AMDGPU_USERQ_FW_CTX_SZ PAGE_SIZE > > MODULE_FIRMWARE("amdgpu/gc_11_0_0_pfp.bin"); > MODULE_FIRMWARE("amdgpu/gc_11_0_0_me.bin"); > @@ -6424,6 +6427,56 @@ const struct amdgpu_ip_block_version > gfx_v11_0_ip_block = > .funcs = _v11_0_ip_funcs, > }; > > +static void gfx_v11_0_userq_destroy_ctx_space(struct amdgpu_userq_mgr > *uq_mgr, > + struct amdgpu_usermode_queue > *queue) > +{ > + struct amdgpu_userq_obj *ctx = >fw_obj; > + > + amdgpu_bo_free_kernel(>obj, >gpu_addr, >cpu_ptr); > +} > + > +static int gfx_v11_0_userq_create_ctx_space(struct amdgpu_userq_mgr *uq_mgr, > + struct amdgpu_usermode_queue > *queue, > + struct > drm_amdgpu_userq_mqd_gfx_v11_0 *mqd_user) > +{ > + struct amdgpu_device *adev = uq_mgr->adev; > + struct amdgpu_userq_obj *ctx = >fw_obj; > + struct v11_gfx_mqd *mqd = queue->mqd.cpu_ptr; > + uint64_t fw_ctx_gpu_addr; > + int r, size; > + > + /* > +* The FW expects at least one page space allocated for > +* process ctx, gang ctx and fw ctx each. Create an object > +* for the same. > +*/ > + size = AMDGPU_USERQ_PROC_CTX_SZ + AMDGPU_USERQ_FW_CTX_SZ + > + AMDGPU_USERQ_GANG_CTX_SZ; > + r = amdgpu_bo_create_kernel(adev, size, PAGE_SIZE, > + AMDGPU_GEM_DOMAIN_GTT, > + >obj, > + >gpu_addr, > + >cpu_ptr); > + if (r) { > + DRM_ERROR("Failed to allocate ctx space bo for userqueue, > err:%d\n", r); > + return r; > + } > + > + fw_ctx_gpu_addr = ctx->gpu_addr + AMDGPU_USERQ_PROC_CTX_SZ + > + AMDGPU_USERQ_GANG_CTX_SZ; > + mqd->fw_work_area_base_lo = lower_32_bits(fw_ctx_gpu_addr); > + mqd->fw_work_area_base_lo = upper_32_bits(fw_ctx_gpu_addr); > + > + /* Shadow and GDS objects come directly from userspace */ > + mqd->shadow_base_lo = lower_32_bits(mqd_user->shadow_va); > + mqd->shadow_base_hi = upper_32_bits(mqd_user->shadow_va); > + > + mqd->gds_bkup_base_lo = lower_32_bits(mqd_user->gds_va); > + mqd->gds_bkup_base_hi = upper_32_bits(mqd_user->gds_va); > + > + return 0; > +} > + > static int gfx_v11_0_userq_mqd_create(struct amdgpu_userq_mgr *uq_mgr, > struct drm_amdgpu_userq_in *args_in, > struct amdgpu_usermode_queue *queue) > @@ -6480,6 +6533,13 @@ static int gfx_v11_0_userq_mqd_create(struct > amdgpu_userq_mgr *uq_mgr, > goto free_mqd; > } > > + /* Create BO for FW operations */ > + r = gfx_v11_0_userq_create_ctx_space(uq_mgr, queue, _user); > +