Re: [PATCH 1/4] drm/amdgpu/gmc9: rework stolen vga memory handling

2018-09-02 Thread Alex Deucher
On Fri, Aug 31, 2018 at 4:20 AM Christian König
 wrote:
>
> Am 30.08.2018 um 16:53 schrieb Alex Deucher:
> > No functional change, just rework it in order to adjust the
> > behavior on a per asic level.  The problem is that on vega10,
> > something corrupts the lower 8 MB of vram on the second
> > resume from S3.
>
> Is that tested with engineering samples or production level hardware?
> Maybe it is just a leftover from BIOS bringup?

It happens reliably across a bunch of internal boards.  Not sure if
anyone has tried with OEM boards.

Alex

>
> > This does not seem to affect Raven, other
> > gmc9 based asics need testing.
> >
> > Signed-off-by: Alex Deucher 
>
> Acked-by: Christian König  for the series.
>
> > ---
> >   drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c | 48 
> > +--
> >   1 file changed, 29 insertions(+), 19 deletions(-)
> >
> > diff --git a/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c 
> > b/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
> > index 04d50893a6f2..46cff7d8b375 100644
> > --- a/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
> > +++ b/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
> > @@ -692,6 +692,28 @@ static int gmc_v9_0_ecc_available(struct amdgpu_device 
> > *adev)
> >   return lost_sheep == 0;
> >   }
> >
> > +static bool gmc_v9_0_keep_stolen_memory(struct amdgpu_device *adev)
> > +{
> > +
> > + /*
> > +  * TODO:
> > +  * Currently there is a bug where some memory client outside
> > +  * of the driver writes to first 8M of VRAM on S3 resume,
> > +  * this overrides GART which by default gets placed in first 8M and
> > +  * causes VM_FAULTS once GTT is accessed.
> > +  * Keep the stolen memory reservation until the while this is not 
> > solved.
> > +  * Also check code in gmc_v9_0_get_vbios_fb_size and 
> > gmc_v9_0_late_init
> > +  */
> > + switch (adev->asic_type) {
> > + case CHIP_RAVEN:
> > + case CHIP_VEGA10:
> > + case CHIP_VEGA12:
> > + case CHIP_VEGA20:
> > + default:
> > + return true;
> > + }
> > +}
> > +
> >   static int gmc_v9_0_late_init(void *handle)
> >   {
> >   struct amdgpu_device *adev = (struct amdgpu_device *)handle;
> > @@ -708,10 +730,8 @@ static int gmc_v9_0_late_init(void *handle)
> >   unsigned i;
> >   int r;
> >
> > - /*
> > -  * TODO - Uncomment once GART corruption issue is fixed.
> > -  */
> > - /* amdgpu_bo_late_init(adev); */
> > + if (!gmc_v9_0_keep_stolen_memory(adev))
> > + amdgpu_bo_late_init(adev);
> >
> >   for(i = 0; i < adev->num_rings; ++i) {
> >   struct amdgpu_ring *ring = adev->rings[i];
> > @@ -848,18 +868,16 @@ static int gmc_v9_0_gart_init(struct amdgpu_device 
> > *adev)
> >
> >   static unsigned gmc_v9_0_get_vbios_fb_size(struct amdgpu_device *adev)
> >   {
> > -#if 0
> >   u32 d1vga_control = RREG32_SOC15(DCE, 0, mmD1VGA_CONTROL);
> > -#endif
> >   unsigned size;
> >
> >   /*
> >* TODO Remove once GART corruption is resolved
> >* Check related code in gmc_v9_0_sw_fini
> >* */
> > - size = 9 * 1024 * 1024;
> > + if (gmc_v9_0_keep_stolen_memory(adev))
> > + return 9 * 1024 * 1024;
> >
> > -#if 0
> >   if (REG_GET_FIELD(d1vga_control, D1VGA_CONTROL, D1VGA_MODE_ENABLE)) {
> >   size = 9 * 1024 * 1024; /* reserve 8MB for vga emulator and 1 
> > MB for FB */
> >   } else {
> > @@ -876,6 +894,7 @@ static unsigned gmc_v9_0_get_vbios_fb_size(struct 
> > amdgpu_device *adev)
> >   break;
> >   case CHIP_VEGA10:
> >   case CHIP_VEGA12:
> > + case CHIP_VEGA20:
> >   default:
> >   viewport = RREG32_SOC15(DCE, 0, mmSCL0_VIEWPORT_SIZE);
> >   size = (REG_GET_FIELD(viewport, SCL0_VIEWPORT_SIZE, 
> > VIEWPORT_HEIGHT) *
> > @@ -888,7 +907,6 @@ static unsigned gmc_v9_0_get_vbios_fb_size(struct 
> > amdgpu_device *adev)
> >   if ((adev->gmc.real_vram_size - size) < (8 * 1024 * 1024))
> >   return 0;
> >
> > -#endif
> >   return size;
> >   }
> >
> > @@ -1000,16 +1018,8 @@ static int gmc_v9_0_sw_fini(void *handle)
> >   amdgpu_gem_force_release(adev);
> >   amdgpu_vm_manager_fini(adev);
> >
> > - /*
> > - * TODO:
> > - * Currently there is a bug where some memory client outside
> > - * of the driver writes to first 8M of VRAM on S3 resume,
> > - * this overrides GART which by default gets placed in first 8M and
> > - * causes VM_FAULTS once GTT is accessed.
> > - * Keep the stolen memory reservation until the while this is not 
> > solved.
> > - * Also check code in gmc_v9_0_get_vbios_fb_size and gmc_v9_0_late_init
> > - */
> > - amdgpu_bo_free_kernel(&adev->stolen_vga_memory, NULL, NULL);
> > + if (gmc_v9_0_keep_stolen_memory(adev))
> > + amdgpu_bo_free_kernel(&adev->stolen_vga_memory, NULL, NULL);
> >
> >   amdgpu_gart_table_vram_free(adev);
> >   

Re: [PATCH 1/4] drm/amdgpu/gmc9: rework stolen vga memory handling

2018-08-31 Thread Christian König

Am 30.08.2018 um 16:53 schrieb Alex Deucher:

No functional change, just rework it in order to adjust the
behavior on a per asic level.  The problem is that on vega10,
something corrupts the lower 8 MB of vram on the second
resume from S3.


Is that tested with engineering samples or production level hardware? 
Maybe it is just a leftover from BIOS bringup?



This does not seem to affect Raven, other
gmc9 based asics need testing.

Signed-off-by: Alex Deucher 


Acked-by: Christian König  for the series.


---
  drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c | 48 +--
  1 file changed, 29 insertions(+), 19 deletions(-)

diff --git a/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c 
b/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
index 04d50893a6f2..46cff7d8b375 100644
--- a/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
+++ b/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
@@ -692,6 +692,28 @@ static int gmc_v9_0_ecc_available(struct amdgpu_device 
*adev)
return lost_sheep == 0;
  }
  
+static bool gmc_v9_0_keep_stolen_memory(struct amdgpu_device *adev)

+{
+
+   /*
+* TODO:
+* Currently there is a bug where some memory client outside
+* of the driver writes to first 8M of VRAM on S3 resume,
+* this overrides GART which by default gets placed in first 8M and
+* causes VM_FAULTS once GTT is accessed.
+* Keep the stolen memory reservation until the while this is not 
solved.
+* Also check code in gmc_v9_0_get_vbios_fb_size and gmc_v9_0_late_init
+*/
+   switch (adev->asic_type) {
+   case CHIP_RAVEN:
+   case CHIP_VEGA10:
+   case CHIP_VEGA12:
+   case CHIP_VEGA20:
+   default:
+   return true;
+   }
+}
+
  static int gmc_v9_0_late_init(void *handle)
  {
struct amdgpu_device *adev = (struct amdgpu_device *)handle;
@@ -708,10 +730,8 @@ static int gmc_v9_0_late_init(void *handle)
unsigned i;
int r;
  
-	/*

-* TODO - Uncomment once GART corruption issue is fixed.
-*/
-   /* amdgpu_bo_late_init(adev); */
+   if (!gmc_v9_0_keep_stolen_memory(adev))
+   amdgpu_bo_late_init(adev);
  
  	for(i = 0; i < adev->num_rings; ++i) {

struct amdgpu_ring *ring = adev->rings[i];
@@ -848,18 +868,16 @@ static int gmc_v9_0_gart_init(struct amdgpu_device *adev)
  
  static unsigned gmc_v9_0_get_vbios_fb_size(struct amdgpu_device *adev)

  {
-#if 0
u32 d1vga_control = RREG32_SOC15(DCE, 0, mmD1VGA_CONTROL);
-#endif
unsigned size;
  
  	/*

 * TODO Remove once GART corruption is resolved
 * Check related code in gmc_v9_0_sw_fini
 * */
-   size = 9 * 1024 * 1024;
+   if (gmc_v9_0_keep_stolen_memory(adev))
+   return 9 * 1024 * 1024;
  
-#if 0

if (REG_GET_FIELD(d1vga_control, D1VGA_CONTROL, D1VGA_MODE_ENABLE)) {
size = 9 * 1024 * 1024; /* reserve 8MB for vga emulator and 1 
MB for FB */
} else {
@@ -876,6 +894,7 @@ static unsigned gmc_v9_0_get_vbios_fb_size(struct 
amdgpu_device *adev)
break;
case CHIP_VEGA10:
case CHIP_VEGA12:
+   case CHIP_VEGA20:
default:
viewport = RREG32_SOC15(DCE, 0, mmSCL0_VIEWPORT_SIZE);
size = (REG_GET_FIELD(viewport, SCL0_VIEWPORT_SIZE, 
VIEWPORT_HEIGHT) *
@@ -888,7 +907,6 @@ static unsigned gmc_v9_0_get_vbios_fb_size(struct 
amdgpu_device *adev)
if ((adev->gmc.real_vram_size - size) < (8 * 1024 * 1024))
return 0;
  
-#endif

return size;
  }
  
@@ -1000,16 +1018,8 @@ static int gmc_v9_0_sw_fini(void *handle)

amdgpu_gem_force_release(adev);
amdgpu_vm_manager_fini(adev);
  
-	/*

-   * TODO:
-   * Currently there is a bug where some memory client outside
-   * of the driver writes to first 8M of VRAM on S3 resume,
-   * this overrides GART which by default gets placed in first 8M and
-   * causes VM_FAULTS once GTT is accessed.
-   * Keep the stolen memory reservation until the while this is not solved.
-   * Also check code in gmc_v9_0_get_vbios_fb_size and gmc_v9_0_late_init
-   */
-   amdgpu_bo_free_kernel(&adev->stolen_vga_memory, NULL, NULL);
+   if (gmc_v9_0_keep_stolen_memory(adev))
+   amdgpu_bo_free_kernel(&adev->stolen_vga_memory, NULL, NULL);
  
  	amdgpu_gart_table_vram_free(adev);

amdgpu_bo_fini(adev);


___
amd-gfx mailing list
amd-gfx@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/amd-gfx


Re: [PATCH 1/4] drm/amdgpu/gmc9: rework stolen vga memory handling

2018-08-30 Thread Zhang, Jerry (Junwei)

On 08/30/2018 10:53 PM, Alex Deucher wrote:

No functional change, just rework it in order to adjust the
behavior on a per asic level.  The problem is that on vega10,
something corrupts the lower 8 MB of vram on the second
resume from S3.  This does not seem to affect Raven, other
gmc9 based asics need testing.

Signed-off-by: Alex Deucher 


Reviewed-by: Junwei Zhang 


---
  drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c | 48 +--
  1 file changed, 29 insertions(+), 19 deletions(-)

diff --git a/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c 
b/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
index 04d50893a6f2..46cff7d8b375 100644
--- a/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
+++ b/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
@@ -692,6 +692,28 @@ static int gmc_v9_0_ecc_available(struct amdgpu_device 
*adev)
return lost_sheep == 0;
  }

+static bool gmc_v9_0_keep_stolen_memory(struct amdgpu_device *adev)
+{
+
+   /*
+* TODO:
+* Currently there is a bug where some memory client outside
+* of the driver writes to first 8M of VRAM on S3 resume,
+* this overrides GART which by default gets placed in first 8M and
+* causes VM_FAULTS once GTT is accessed.
+* Keep the stolen memory reservation until the while this is not 
solved.
+* Also check code in gmc_v9_0_get_vbios_fb_size and gmc_v9_0_late_init
+*/
+   switch (adev->asic_type) {
+   case CHIP_RAVEN:
+   case CHIP_VEGA10:
+   case CHIP_VEGA12:
+   case CHIP_VEGA20:
+   default:
+   return true;
+   }
+}
+
  static int gmc_v9_0_late_init(void *handle)
  {
struct amdgpu_device *adev = (struct amdgpu_device *)handle;
@@ -708,10 +730,8 @@ static int gmc_v9_0_late_init(void *handle)
unsigned i;
int r;

-   /*
-* TODO - Uncomment once GART corruption issue is fixed.
-*/
-   /* amdgpu_bo_late_init(adev); */
+   if (!gmc_v9_0_keep_stolen_memory(adev))
+   amdgpu_bo_late_init(adev);

for(i = 0; i < adev->num_rings; ++i) {
struct amdgpu_ring *ring = adev->rings[i];
@@ -848,18 +868,16 @@ static int gmc_v9_0_gart_init(struct amdgpu_device *adev)

  static unsigned gmc_v9_0_get_vbios_fb_size(struct amdgpu_device *adev)
  {
-#if 0
u32 d1vga_control = RREG32_SOC15(DCE, 0, mmD1VGA_CONTROL);
-#endif
unsigned size;

/*
 * TODO Remove once GART corruption is resolved
 * Check related code in gmc_v9_0_sw_fini
 * */
-   size = 9 * 1024 * 1024;
+   if (gmc_v9_0_keep_stolen_memory(adev))
+   return 9 * 1024 * 1024;

-#if 0
if (REG_GET_FIELD(d1vga_control, D1VGA_CONTROL, D1VGA_MODE_ENABLE)) {
size = 9 * 1024 * 1024; /* reserve 8MB for vga emulator and 1 
MB for FB */
} else {
@@ -876,6 +894,7 @@ static unsigned gmc_v9_0_get_vbios_fb_size(struct 
amdgpu_device *adev)
break;
case CHIP_VEGA10:
case CHIP_VEGA12:
+   case CHIP_VEGA20:
default:
viewport = RREG32_SOC15(DCE, 0, mmSCL0_VIEWPORT_SIZE);
size = (REG_GET_FIELD(viewport, SCL0_VIEWPORT_SIZE, 
VIEWPORT_HEIGHT) *
@@ -888,7 +907,6 @@ static unsigned gmc_v9_0_get_vbios_fb_size(struct 
amdgpu_device *adev)
if ((adev->gmc.real_vram_size - size) < (8 * 1024 * 1024))
return 0;

-#endif
return size;
  }

@@ -1000,16 +1018,8 @@ static int gmc_v9_0_sw_fini(void *handle)
amdgpu_gem_force_release(adev);
amdgpu_vm_manager_fini(adev);

-   /*
-   * TODO:
-   * Currently there is a bug where some memory client outside
-   * of the driver writes to first 8M of VRAM on S3 resume,
-   * this overrides GART which by default gets placed in first 8M and
-   * causes VM_FAULTS once GTT is accessed.
-   * Keep the stolen memory reservation until the while this is not solved.
-   * Also check code in gmc_v9_0_get_vbios_fb_size and gmc_v9_0_late_init
-   */
-   amdgpu_bo_free_kernel(&adev->stolen_vga_memory, NULL, NULL);
+   if (gmc_v9_0_keep_stolen_memory(adev))
+   amdgpu_bo_free_kernel(&adev->stolen_vga_memory, NULL, NULL);

amdgpu_gart_table_vram_free(adev);
amdgpu_bo_fini(adev);


___
amd-gfx mailing list
amd-gfx@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/amd-gfx


[PATCH 1/4] drm/amdgpu/gmc9: rework stolen vga memory handling

2018-08-30 Thread Alex Deucher
No functional change, just rework it in order to adjust the
behavior on a per asic level.  The problem is that on vega10,
something corrupts the lower 8 MB of vram on the second
resume from S3.  This does not seem to affect Raven, other
gmc9 based asics need testing.

Signed-off-by: Alex Deucher 
---
 drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c | 48 +--
 1 file changed, 29 insertions(+), 19 deletions(-)

diff --git a/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c 
b/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
index 04d50893a6f2..46cff7d8b375 100644
--- a/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
+++ b/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
@@ -692,6 +692,28 @@ static int gmc_v9_0_ecc_available(struct amdgpu_device 
*adev)
return lost_sheep == 0;
 }
 
+static bool gmc_v9_0_keep_stolen_memory(struct amdgpu_device *adev)
+{
+
+   /*
+* TODO:
+* Currently there is a bug where some memory client outside
+* of the driver writes to first 8M of VRAM on S3 resume,
+* this overrides GART which by default gets placed in first 8M and
+* causes VM_FAULTS once GTT is accessed.
+* Keep the stolen memory reservation until the while this is not 
solved.
+* Also check code in gmc_v9_0_get_vbios_fb_size and gmc_v9_0_late_init
+*/
+   switch (adev->asic_type) {
+   case CHIP_RAVEN:
+   case CHIP_VEGA10:
+   case CHIP_VEGA12:
+   case CHIP_VEGA20:
+   default:
+   return true;
+   }
+}
+
 static int gmc_v9_0_late_init(void *handle)
 {
struct amdgpu_device *adev = (struct amdgpu_device *)handle;
@@ -708,10 +730,8 @@ static int gmc_v9_0_late_init(void *handle)
unsigned i;
int r;
 
-   /*
-* TODO - Uncomment once GART corruption issue is fixed.
-*/
-   /* amdgpu_bo_late_init(adev); */
+   if (!gmc_v9_0_keep_stolen_memory(adev))
+   amdgpu_bo_late_init(adev);
 
for(i = 0; i < adev->num_rings; ++i) {
struct amdgpu_ring *ring = adev->rings[i];
@@ -848,18 +868,16 @@ static int gmc_v9_0_gart_init(struct amdgpu_device *adev)
 
 static unsigned gmc_v9_0_get_vbios_fb_size(struct amdgpu_device *adev)
 {
-#if 0
u32 d1vga_control = RREG32_SOC15(DCE, 0, mmD1VGA_CONTROL);
-#endif
unsigned size;
 
/*
 * TODO Remove once GART corruption is resolved
 * Check related code in gmc_v9_0_sw_fini
 * */
-   size = 9 * 1024 * 1024;
+   if (gmc_v9_0_keep_stolen_memory(adev))
+   return 9 * 1024 * 1024;
 
-#if 0
if (REG_GET_FIELD(d1vga_control, D1VGA_CONTROL, D1VGA_MODE_ENABLE)) {
size = 9 * 1024 * 1024; /* reserve 8MB for vga emulator and 1 
MB for FB */
} else {
@@ -876,6 +894,7 @@ static unsigned gmc_v9_0_get_vbios_fb_size(struct 
amdgpu_device *adev)
break;
case CHIP_VEGA10:
case CHIP_VEGA12:
+   case CHIP_VEGA20:
default:
viewport = RREG32_SOC15(DCE, 0, mmSCL0_VIEWPORT_SIZE);
size = (REG_GET_FIELD(viewport, SCL0_VIEWPORT_SIZE, 
VIEWPORT_HEIGHT) *
@@ -888,7 +907,6 @@ static unsigned gmc_v9_0_get_vbios_fb_size(struct 
amdgpu_device *adev)
if ((adev->gmc.real_vram_size - size) < (8 * 1024 * 1024))
return 0;
 
-#endif
return size;
 }
 
@@ -1000,16 +1018,8 @@ static int gmc_v9_0_sw_fini(void *handle)
amdgpu_gem_force_release(adev);
amdgpu_vm_manager_fini(adev);
 
-   /*
-   * TODO:
-   * Currently there is a bug where some memory client outside
-   * of the driver writes to first 8M of VRAM on S3 resume,
-   * this overrides GART which by default gets placed in first 8M and
-   * causes VM_FAULTS once GTT is accessed.
-   * Keep the stolen memory reservation until the while this is not solved.
-   * Also check code in gmc_v9_0_get_vbios_fb_size and gmc_v9_0_late_init
-   */
-   amdgpu_bo_free_kernel(&adev->stolen_vga_memory, NULL, NULL);
+   if (gmc_v9_0_keep_stolen_memory(adev))
+   amdgpu_bo_free_kernel(&adev->stolen_vga_memory, NULL, NULL);
 
amdgpu_gart_table_vram_free(adev);
amdgpu_bo_fini(adev);
-- 
2.13.6

___
amd-gfx mailing list
amd-gfx@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/amd-gfx