提交 9fadb352 编写于 作者: M Marek Olšák 提交者: Alex Deucher

drm/radeon: fix render backend setup for SI and CIK

Only the render backends of the first shader engine were enabled. The others
were erroneously disabled. Enabling the other render backends improves
performance a lot.

Unigine Sanctuary on Bonaire:
  Before: 15 fps
  After:  90 fps

Judging from the fan noise, the GPU was also underclocked when the other
render backends were disabled, resulting in horrible performance. The fan is
a lot noisy under load now.
Signed-off-by: NMarek Olšák <marek.olsak@amd.com>
Signed-off-by: NAlex Deucher <alexander.deucher@amd.com>
Cc: stable@vger.kernel.org
上级 d00adcc8
...@@ -3057,7 +3057,7 @@ static u32 cik_create_bitmask(u32 bit_width) ...@@ -3057,7 +3057,7 @@ static u32 cik_create_bitmask(u32 bit_width)
* Returns the disabled RB bitmask. * Returns the disabled RB bitmask.
*/ */
static u32 cik_get_rb_disabled(struct radeon_device *rdev, static u32 cik_get_rb_disabled(struct radeon_device *rdev,
u32 max_rb_num, u32 se_num, u32 max_rb_num_per_se,
u32 sh_per_se) u32 sh_per_se)
{ {
u32 data, mask; u32 data, mask;
...@@ -3071,7 +3071,7 @@ static u32 cik_get_rb_disabled(struct radeon_device *rdev, ...@@ -3071,7 +3071,7 @@ static u32 cik_get_rb_disabled(struct radeon_device *rdev,
data >>= BACKEND_DISABLE_SHIFT; data >>= BACKEND_DISABLE_SHIFT;
mask = cik_create_bitmask(max_rb_num / se_num / sh_per_se); mask = cik_create_bitmask(max_rb_num_per_se / sh_per_se);
return data & mask; return data & mask;
} }
...@@ -3088,7 +3088,7 @@ static u32 cik_get_rb_disabled(struct radeon_device *rdev, ...@@ -3088,7 +3088,7 @@ static u32 cik_get_rb_disabled(struct radeon_device *rdev,
*/ */
static void cik_setup_rb(struct radeon_device *rdev, static void cik_setup_rb(struct radeon_device *rdev,
u32 se_num, u32 sh_per_se, u32 se_num, u32 sh_per_se,
u32 max_rb_num) u32 max_rb_num_per_se)
{ {
int i, j; int i, j;
u32 data, mask; u32 data, mask;
...@@ -3098,7 +3098,7 @@ static void cik_setup_rb(struct radeon_device *rdev, ...@@ -3098,7 +3098,7 @@ static void cik_setup_rb(struct radeon_device *rdev,
for (i = 0; i < se_num; i++) { for (i = 0; i < se_num; i++) {
for (j = 0; j < sh_per_se; j++) { for (j = 0; j < sh_per_se; j++) {
cik_select_se_sh(rdev, i, j); cik_select_se_sh(rdev, i, j);
data = cik_get_rb_disabled(rdev, max_rb_num, se_num, sh_per_se); data = cik_get_rb_disabled(rdev, max_rb_num_per_se, sh_per_se);
if (rdev->family == CHIP_HAWAII) if (rdev->family == CHIP_HAWAII)
disabled_rbs |= data << ((i * sh_per_se + j) * HAWAII_RB_BITMAP_WIDTH_PER_SH); disabled_rbs |= data << ((i * sh_per_se + j) * HAWAII_RB_BITMAP_WIDTH_PER_SH);
else else
...@@ -3108,7 +3108,7 @@ static void cik_setup_rb(struct radeon_device *rdev, ...@@ -3108,7 +3108,7 @@ static void cik_setup_rb(struct radeon_device *rdev,
cik_select_se_sh(rdev, 0xffffffff, 0xffffffff); cik_select_se_sh(rdev, 0xffffffff, 0xffffffff);
mask = 1; mask = 1;
for (i = 0; i < max_rb_num; i++) { for (i = 0; i < max_rb_num_per_se * se_num; i++) {
if (!(disabled_rbs & mask)) if (!(disabled_rbs & mask))
enabled_rbs |= mask; enabled_rbs |= mask;
mask <<= 1; mask <<= 1;
......
...@@ -2811,7 +2811,7 @@ static void si_setup_spi(struct radeon_device *rdev, ...@@ -2811,7 +2811,7 @@ static void si_setup_spi(struct radeon_device *rdev,
} }
static u32 si_get_rb_disabled(struct radeon_device *rdev, static u32 si_get_rb_disabled(struct radeon_device *rdev,
u32 max_rb_num, u32 se_num, u32 max_rb_num_per_se,
u32 sh_per_se) u32 sh_per_se)
{ {
u32 data, mask; u32 data, mask;
...@@ -2825,14 +2825,14 @@ static u32 si_get_rb_disabled(struct radeon_device *rdev, ...@@ -2825,14 +2825,14 @@ static u32 si_get_rb_disabled(struct radeon_device *rdev,
data >>= BACKEND_DISABLE_SHIFT; data >>= BACKEND_DISABLE_SHIFT;
mask = si_create_bitmask(max_rb_num / se_num / sh_per_se); mask = si_create_bitmask(max_rb_num_per_se / sh_per_se);
return data & mask; return data & mask;
} }
static void si_setup_rb(struct radeon_device *rdev, static void si_setup_rb(struct radeon_device *rdev,
u32 se_num, u32 sh_per_se, u32 se_num, u32 sh_per_se,
u32 max_rb_num) u32 max_rb_num_per_se)
{ {
int i, j; int i, j;
u32 data, mask; u32 data, mask;
...@@ -2842,14 +2842,14 @@ static void si_setup_rb(struct radeon_device *rdev, ...@@ -2842,14 +2842,14 @@ static void si_setup_rb(struct radeon_device *rdev,
for (i = 0; i < se_num; i++) { for (i = 0; i < se_num; i++) {
for (j = 0; j < sh_per_se; j++) { for (j = 0; j < sh_per_se; j++) {
si_select_se_sh(rdev, i, j); si_select_se_sh(rdev, i, j);
data = si_get_rb_disabled(rdev, max_rb_num, se_num, sh_per_se); data = si_get_rb_disabled(rdev, max_rb_num_per_se, sh_per_se);
disabled_rbs |= data << ((i * sh_per_se + j) * TAHITI_RB_BITMAP_WIDTH_PER_SH); disabled_rbs |= data << ((i * sh_per_se + j) * TAHITI_RB_BITMAP_WIDTH_PER_SH);
} }
} }
si_select_se_sh(rdev, 0xffffffff, 0xffffffff); si_select_se_sh(rdev, 0xffffffff, 0xffffffff);
mask = 1; mask = 1;
for (i = 0; i < max_rb_num; i++) { for (i = 0; i < max_rb_num_per_se * se_num; i++) {
if (!(disabled_rbs & mask)) if (!(disabled_rbs & mask))
enabled_rbs |= mask; enabled_rbs |= mask;
mask <<= 1; mask <<= 1;
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册