Linux kernel mirror (for testing) git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
kernel os linux

drm/amdgpu: add ih 6.1 support

Add initial support for IH 6.1.

v2: Fix copyright date (Alex)

Signed-off-by: Ben Li <ben.li@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>

authored by

Ben Li and committed by
Alex Deucher
0ba96fd3 85c391ab

+799 -1
+2 -1
drivers/gpu/drm/amd/amdgpu/Makefile
··· 129 129 vega10_ih.o \ 130 130 vega20_ih.o \ 131 131 navi10_ih.o \ 132 - ih_v6_0.o 132 + ih_v6_0.o \ 133 + ih_v6_1.o 133 134 134 135 # add PSP block 135 136 amdgpu-y += \
+769
drivers/gpu/drm/amd/amdgpu/ih_v6_1.c
··· 1 + /* 2 + * Copyright 2023 Advanced Micro Devices, Inc. 3 + * 4 + * Permission is hereby granted, free of charge, to any person obtaining a 5 + * copy of this software and associated documentation files (the "Software"), 6 + * to deal in the Software without restriction, including without limitation 7 + * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8 + * and/or sell copies of the Software, and to permit persons to whom the 9 + * Software is furnished to do so, subject to the following conditions: 10 + * 11 + * The above copyright notice and this permission notice shall be included in 12 + * all copies or substantial portions of the Software. 13 + * 14 + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 15 + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 16 + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 17 + * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 18 + * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 19 + * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 20 + * OTHER DEALINGS IN THE SOFTWARE. 21 + * 22 + */ 23 + 24 + #include <linux/pci.h> 25 + 26 + #include "amdgpu.h" 27 + #include "amdgpu_ih.h" 28 + 29 + #include "oss/osssys_6_1_0_offset.h" 30 + #include "oss/osssys_6_1_0_sh_mask.h" 31 + 32 + #include "soc15_common.h" 33 + #include "ih_v6_1.h" 34 + 35 + #define MAX_REARM_RETRY 10 36 + 37 + static void ih_v6_1_set_interrupt_funcs(struct amdgpu_device *adev); 38 + 39 + /** 40 + * ih_v6_1_init_register_offset - Initialize register offset for ih rings 41 + * 42 + * @adev: amdgpu_device pointer 43 + * 44 + * Initialize register offset ih rings (IH_V6_0). 45 + */ 46 + static void ih_v6_1_init_register_offset(struct amdgpu_device *adev) 47 + { 48 + struct amdgpu_ih_regs *ih_regs; 49 + 50 + /* ih ring 2 is removed 51 + * ih ring and ih ring 1 are available */ 52 + if (adev->irq.ih.ring_size) { 53 + ih_regs = &adev->irq.ih.ih_regs; 54 + ih_regs->ih_rb_base = SOC15_REG_OFFSET(OSSSYS, 0, regIH_RB_BASE); 55 + ih_regs->ih_rb_base_hi = SOC15_REG_OFFSET(OSSSYS, 0, regIH_RB_BASE_HI); 56 + ih_regs->ih_rb_cntl = SOC15_REG_OFFSET(OSSSYS, 0, regIH_RB_CNTL); 57 + ih_regs->ih_rb_wptr = SOC15_REG_OFFSET(OSSSYS, 0, regIH_RB_WPTR); 58 + ih_regs->ih_rb_rptr = SOC15_REG_OFFSET(OSSSYS, 0, regIH_RB_RPTR); 59 + ih_regs->ih_doorbell_rptr = SOC15_REG_OFFSET(OSSSYS, 0, regIH_DOORBELL_RPTR); 60 + ih_regs->ih_rb_wptr_addr_lo = SOC15_REG_OFFSET(OSSSYS, 0, regIH_RB_WPTR_ADDR_LO); 61 + ih_regs->ih_rb_wptr_addr_hi = SOC15_REG_OFFSET(OSSSYS, 0, regIH_RB_WPTR_ADDR_HI); 62 + ih_regs->psp_reg_id = PSP_REG_IH_RB_CNTL; 63 + } 64 + 65 + if (adev->irq.ih1.ring_size) { 66 + ih_regs = &adev->irq.ih1.ih_regs; 67 + ih_regs->ih_rb_base = SOC15_REG_OFFSET(OSSSYS, 0, regIH_RB_BASE_RING1); 68 + ih_regs->ih_rb_base_hi = SOC15_REG_OFFSET(OSSSYS, 0, regIH_RB_BASE_HI_RING1); 69 + ih_regs->ih_rb_cntl = SOC15_REG_OFFSET(OSSSYS, 0, regIH_RB_CNTL_RING1); 70 + ih_regs->ih_rb_wptr = SOC15_REG_OFFSET(OSSSYS, 0, regIH_RB_WPTR_RING1); 71 + ih_regs->ih_rb_rptr = SOC15_REG_OFFSET(OSSSYS, 0, regIH_RB_RPTR_RING1); 72 + ih_regs->ih_doorbell_rptr = SOC15_REG_OFFSET(OSSSYS, 0, regIH_DOORBELL_RPTR_RING1); 73 + ih_regs->psp_reg_id = PSP_REG_IH_RB_CNTL_RING1; 74 + } 75 + } 76 + 77 + /** 78 + * force_update_wptr_for_self_int - Force update the wptr for self interrupt 79 + * 80 + * @adev: amdgpu_device pointer 81 + * @threshold: threshold to trigger the wptr reporting 82 + * @timeout: timeout to trigger the wptr reporting 83 + * @enabled: Enable/disable timeout flush mechanism 84 + * 85 + * threshold input range: 0 ~ 15, default 0, 86 + * real_threshold = 2^threshold 87 + * timeout input range: 0 ~ 20, default 8, 88 + * real_timeout = (2^timeout) * 1024 / (socclk_freq) 89 + * 90 + * Force update wptr for self interrupt ( >= SIENNA_CICHLID). 91 + */ 92 + static void 93 + force_update_wptr_for_self_int(struct amdgpu_device *adev, 94 + u32 threshold, u32 timeout, bool enabled) 95 + { 96 + u32 ih_cntl, ih_rb_cntl; 97 + 98 + ih_cntl = RREG32_SOC15(OSSSYS, 0, regIH_CNTL2); 99 + ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, regIH_RB_CNTL_RING1); 100 + 101 + ih_cntl = REG_SET_FIELD(ih_cntl, IH_CNTL2, 102 + SELF_IV_FORCE_WPTR_UPDATE_TIMEOUT, timeout); 103 + ih_cntl = REG_SET_FIELD(ih_cntl, IH_CNTL2, 104 + SELF_IV_FORCE_WPTR_UPDATE_ENABLE, enabled); 105 + ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL_RING1, 106 + RB_USED_INT_THRESHOLD, threshold); 107 + 108 + if (amdgpu_sriov_vf(adev) && amdgpu_sriov_reg_indirect_ih(adev)) { 109 + if (psp_reg_program(&adev->psp, PSP_REG_IH_RB_CNTL_RING1, ih_rb_cntl)) 110 + return; 111 + } else { 112 + WREG32_SOC15(OSSSYS, 0, regIH_RB_CNTL_RING1, ih_rb_cntl); 113 + } 114 + 115 + WREG32_SOC15(OSSSYS, 0, regIH_CNTL2, ih_cntl); 116 + } 117 + 118 + /** 119 + * ih_v6_1_toggle_ring_interrupts - toggle the interrupt ring buffer 120 + * 121 + * @adev: amdgpu_device pointer 122 + * @ih: amdgpu_ih_ring pointer 123 + * @enable: true - enable the interrupts, false - disable the interrupts 124 + * 125 + * Toggle the interrupt ring buffer (IH_V6_0) 126 + */ 127 + static int ih_v6_1_toggle_ring_interrupts(struct amdgpu_device *adev, 128 + struct amdgpu_ih_ring *ih, 129 + bool enable) 130 + { 131 + struct amdgpu_ih_regs *ih_regs; 132 + uint32_t tmp; 133 + 134 + ih_regs = &ih->ih_regs; 135 + 136 + tmp = RREG32(ih_regs->ih_rb_cntl); 137 + tmp = REG_SET_FIELD(tmp, IH_RB_CNTL, RB_ENABLE, (enable ? 1 : 0)); 138 + /* enable_intr field is only valid in ring0 */ 139 + if (ih == &adev->irq.ih) 140 + tmp = REG_SET_FIELD(tmp, IH_RB_CNTL, ENABLE_INTR, (enable ? 1 : 0)); 141 + 142 + if (amdgpu_sriov_vf(adev) && amdgpu_sriov_reg_indirect_ih(adev)) { 143 + if (psp_reg_program(&adev->psp, ih_regs->psp_reg_id, tmp)) 144 + return -ETIMEDOUT; 145 + } else { 146 + WREG32(ih_regs->ih_rb_cntl, tmp); 147 + } 148 + 149 + if (enable) { 150 + ih->enabled = true; 151 + } else { 152 + /* set rptr, wptr to 0 */ 153 + WREG32(ih_regs->ih_rb_rptr, 0); 154 + WREG32(ih_regs->ih_rb_wptr, 0); 155 + ih->enabled = false; 156 + ih->rptr = 0; 157 + } 158 + 159 + return 0; 160 + } 161 + 162 + /** 163 + * ih_v6_1_toggle_interrupts - Toggle all the available interrupt ring buffers 164 + * 165 + * @adev: amdgpu_device pointer 166 + * @enable: enable or disable interrupt ring buffers 167 + * 168 + * Toggle all the available interrupt ring buffers (IH_V6_0). 169 + */ 170 + static int ih_v6_1_toggle_interrupts(struct amdgpu_device *adev, bool enable) 171 + { 172 + struct amdgpu_ih_ring *ih[] = {&adev->irq.ih, &adev->irq.ih1}; 173 + int i; 174 + int r; 175 + 176 + for (i = 0; i < ARRAY_SIZE(ih); i++) { 177 + if (ih[i]->ring_size) { 178 + r = ih_v6_1_toggle_ring_interrupts(adev, ih[i], enable); 179 + if (r) 180 + return r; 181 + } 182 + } 183 + 184 + return 0; 185 + } 186 + 187 + static uint32_t ih_v6_1_rb_cntl(struct amdgpu_ih_ring *ih, uint32_t ih_rb_cntl) 188 + { 189 + int rb_bufsz = order_base_2(ih->ring_size / 4); 190 + 191 + ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, 192 + MC_SPACE, ih->use_bus_addr ? 2 : 4); 193 + ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, 194 + WPTR_OVERFLOW_CLEAR, 1); 195 + ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, 196 + WPTR_OVERFLOW_ENABLE, 1); 197 + ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RB_SIZE, rb_bufsz); 198 + /* Ring Buffer write pointer writeback. If enabled, IH_RB_WPTR register 199 + * value is written to memory 200 + */ 201 + ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, 202 + WPTR_WRITEBACK_ENABLE, 1); 203 + ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_SNOOP, 1); 204 + ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_RO, 0); 205 + ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_VMID, 0); 206 + 207 + return ih_rb_cntl; 208 + } 209 + 210 + static uint32_t ih_v6_1_doorbell_rptr(struct amdgpu_ih_ring *ih) 211 + { 212 + u32 ih_doorbell_rtpr = 0; 213 + 214 + if (ih->use_doorbell) { 215 + ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr, 216 + IH_DOORBELL_RPTR, OFFSET, 217 + ih->doorbell_index); 218 + ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr, 219 + IH_DOORBELL_RPTR, 220 + ENABLE, 1); 221 + } else { 222 + ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr, 223 + IH_DOORBELL_RPTR, 224 + ENABLE, 0); 225 + } 226 + return ih_doorbell_rtpr; 227 + } 228 + 229 + /** 230 + * ih_v6_1_enable_ring - enable an ih ring buffer 231 + * 232 + * @adev: amdgpu_device pointer 233 + * @ih: amdgpu_ih_ring pointer 234 + * 235 + * Enable an ih ring buffer (IH_V6_0) 236 + */ 237 + static int ih_v6_1_enable_ring(struct amdgpu_device *adev, 238 + struct amdgpu_ih_ring *ih) 239 + { 240 + struct amdgpu_ih_regs *ih_regs; 241 + uint32_t tmp; 242 + 243 + ih_regs = &ih->ih_regs; 244 + 245 + /* Ring Buffer base. [39:8] of 40-bit address of the beginning of the ring buffer*/ 246 + WREG32(ih_regs->ih_rb_base, ih->gpu_addr >> 8); 247 + WREG32(ih_regs->ih_rb_base_hi, (ih->gpu_addr >> 40) & 0xff); 248 + 249 + tmp = RREG32(ih_regs->ih_rb_cntl); 250 + tmp = ih_v6_1_rb_cntl(ih, tmp); 251 + if (ih == &adev->irq.ih) 252 + tmp = REG_SET_FIELD(tmp, IH_RB_CNTL, RPTR_REARM, !!adev->irq.msi_enabled); 253 + if (ih == &adev->irq.ih1) { 254 + tmp = REG_SET_FIELD(tmp, IH_RB_CNTL, WPTR_OVERFLOW_ENABLE, 0); 255 + tmp = REG_SET_FIELD(tmp, IH_RB_CNTL, RB_FULL_DRAIN_ENABLE, 1); 256 + } 257 + 258 + if (amdgpu_sriov_vf(adev) && amdgpu_sriov_reg_indirect_ih(adev)) { 259 + if (psp_reg_program(&adev->psp, ih_regs->psp_reg_id, tmp)) { 260 + DRM_ERROR("PSP program IH_RB_CNTL failed!\n"); 261 + return -ETIMEDOUT; 262 + } 263 + } else { 264 + WREG32(ih_regs->ih_rb_cntl, tmp); 265 + } 266 + 267 + if (ih == &adev->irq.ih) { 268 + /* set the ih ring 0 writeback address whether it's enabled or not */ 269 + WREG32(ih_regs->ih_rb_wptr_addr_lo, lower_32_bits(ih->wptr_addr)); 270 + WREG32(ih_regs->ih_rb_wptr_addr_hi, upper_32_bits(ih->wptr_addr) & 0xFFFF); 271 + } 272 + 273 + /* set rptr, wptr to 0 */ 274 + WREG32(ih_regs->ih_rb_wptr, 0); 275 + WREG32(ih_regs->ih_rb_rptr, 0); 276 + 277 + WREG32(ih_regs->ih_doorbell_rptr, ih_v6_1_doorbell_rptr(ih)); 278 + 279 + return 0; 280 + } 281 + 282 + /** 283 + * ih_v6_1_irq_init - init and enable the interrupt ring 284 + * 285 + * @adev: amdgpu_device pointer 286 + * 287 + * Allocate a ring buffer for the interrupt controller, 288 + * enable the RLC, disable interrupts, enable the IH 289 + * ring buffer and enable it. 290 + * Called at device load and reume. 291 + * Returns 0 for success, errors for failure. 292 + */ 293 + static int ih_v6_1_irq_init(struct amdgpu_device *adev) 294 + { 295 + struct amdgpu_ih_ring *ih[] = {&adev->irq.ih, &adev->irq.ih1}; 296 + u32 ih_chicken; 297 + u32 tmp; 298 + int ret; 299 + int i; 300 + 301 + /* disable irqs */ 302 + ret = ih_v6_1_toggle_interrupts(adev, false); 303 + if (ret) 304 + return ret; 305 + 306 + adev->nbio.funcs->ih_control(adev); 307 + 308 + if (unlikely((adev->firmware.load_type == AMDGPU_FW_LOAD_DIRECT) || 309 + (adev->firmware.load_type == AMDGPU_FW_LOAD_RLC_BACKDOOR_AUTO))) { 310 + if (ih[0]->use_bus_addr) { 311 + ih_chicken = RREG32_SOC15(OSSSYS, 0, regIH_CHICKEN); 312 + ih_chicken = REG_SET_FIELD(ih_chicken, 313 + IH_CHICKEN, MC_SPACE_GPA_ENABLE, 1); 314 + WREG32_SOC15(OSSSYS, 0, regIH_CHICKEN, ih_chicken); 315 + } 316 + } 317 + 318 + for (i = 0; i < ARRAY_SIZE(ih); i++) { 319 + if (ih[i]->ring_size) { 320 + ret = ih_v6_1_enable_ring(adev, ih[i]); 321 + if (ret) 322 + return ret; 323 + } 324 + } 325 + 326 + /* update doorbell range for ih ring 0 */ 327 + adev->nbio.funcs->ih_doorbell_range(adev, ih[0]->use_doorbell, 328 + ih[0]->doorbell_index); 329 + 330 + tmp = RREG32_SOC15(OSSSYS, 0, regIH_STORM_CLIENT_LIST_CNTL); 331 + tmp = REG_SET_FIELD(tmp, IH_STORM_CLIENT_LIST_CNTL, 332 + CLIENT18_IS_STORM_CLIENT, 1); 333 + WREG32_SOC15(OSSSYS, 0, regIH_STORM_CLIENT_LIST_CNTL, tmp); 334 + 335 + tmp = RREG32_SOC15(OSSSYS, 0, regIH_INT_FLOOD_CNTL); 336 + tmp = REG_SET_FIELD(tmp, IH_INT_FLOOD_CNTL, FLOOD_CNTL_ENABLE, 1); 337 + WREG32_SOC15(OSSSYS, 0, regIH_INT_FLOOD_CNTL, tmp); 338 + 339 + /* GC/MMHUB UTCL2 page fault interrupts are configured as 340 + * MSI storm capable interrupts by deafult. The delay is 341 + * used to avoid ISR being called too frequently 342 + * when page fault happens on several continuous page 343 + * and thus avoid MSI storm */ 344 + tmp = RREG32_SOC15(OSSSYS, 0, regIH_MSI_STORM_CTRL); 345 + tmp = REG_SET_FIELD(tmp, IH_MSI_STORM_CTRL, 346 + DELAY, 3); 347 + WREG32_SOC15(OSSSYS, 0, regIH_MSI_STORM_CTRL, tmp); 348 + 349 + pci_set_master(adev->pdev); 350 + 351 + /* enable interrupts */ 352 + ret = ih_v6_1_toggle_interrupts(adev, true); 353 + if (ret) 354 + return ret; 355 + /* enable wptr force update for self int */ 356 + force_update_wptr_for_self_int(adev, 0, 8, true); 357 + 358 + if (adev->irq.ih_soft.ring_size) 359 + adev->irq.ih_soft.enabled = true; 360 + 361 + return 0; 362 + } 363 + 364 + /** 365 + * ih_v6_1_irq_disable - disable interrupts 366 + * 367 + * @adev: amdgpu_device pointer 368 + * 369 + * Disable interrupts on the hw. 370 + */ 371 + static void ih_v6_1_irq_disable(struct amdgpu_device *adev) 372 + { 373 + force_update_wptr_for_self_int(adev, 0, 8, false); 374 + ih_v6_1_toggle_interrupts(adev, false); 375 + 376 + /* Wait and acknowledge irq */ 377 + mdelay(1); 378 + } 379 + 380 + /** 381 + * ih_v6_1_get_wptr - get the IH ring buffer wptr 382 + * 383 + * @adev: amdgpu_device pointer 384 + * @ih: amdgpu_ih_ring pointer 385 + * 386 + * Get the IH ring buffer wptr from either the register 387 + * or the writeback memory buffer. Also check for 388 + * ring buffer overflow and deal with it. 389 + * Returns the value of the wptr. 390 + */ 391 + static u32 ih_v6_1_get_wptr(struct amdgpu_device *adev, 392 + struct amdgpu_ih_ring *ih) 393 + { 394 + u32 wptr, tmp; 395 + struct amdgpu_ih_regs *ih_regs; 396 + 397 + wptr = le32_to_cpu(*ih->wptr_cpu); 398 + ih_regs = &ih->ih_regs; 399 + 400 + if (!REG_GET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW)) 401 + goto out; 402 + 403 + wptr = RREG32_NO_KIQ(ih_regs->ih_rb_wptr); 404 + if (!REG_GET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW)) 405 + goto out; 406 + wptr = REG_SET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW, 0); 407 + 408 + /* When a ring buffer overflow happen start parsing interrupt 409 + * from the last not overwritten vector (wptr + 32). Hopefully 410 + * this should allow us to catch up. 411 + */ 412 + tmp = (wptr + 32) & ih->ptr_mask; 413 + dev_warn(adev->dev, "IH ring buffer overflow " 414 + "(0x%08X, 0x%08X, 0x%08X)\n", 415 + wptr, ih->rptr, tmp); 416 + ih->rptr = tmp; 417 + 418 + tmp = RREG32_NO_KIQ(ih_regs->ih_rb_cntl); 419 + tmp = REG_SET_FIELD(tmp, IH_RB_CNTL, WPTR_OVERFLOW_CLEAR, 1); 420 + WREG32_NO_KIQ(ih_regs->ih_rb_cntl, tmp); 421 + out: 422 + return (wptr & ih->ptr_mask); 423 + } 424 + 425 + /** 426 + * ih_v6_1_irq_rearm - rearm IRQ if lost 427 + * 428 + * @adev: amdgpu_device pointer 429 + * @ih: amdgpu_ih_ring pointer 430 + * 431 + */ 432 + static void ih_v6_1_irq_rearm(struct amdgpu_device *adev, 433 + struct amdgpu_ih_ring *ih) 434 + { 435 + uint32_t v = 0; 436 + uint32_t i = 0; 437 + struct amdgpu_ih_regs *ih_regs; 438 + 439 + ih_regs = &ih->ih_regs; 440 + 441 + /* Rearm IRQ / re-write doorbell if doorbell write is lost */ 442 + for (i = 0; i < MAX_REARM_RETRY; i++) { 443 + v = RREG32_NO_KIQ(ih_regs->ih_rb_rptr); 444 + if ((v < ih->ring_size) && (v != ih->rptr)) 445 + WDOORBELL32(ih->doorbell_index, ih->rptr); 446 + else 447 + break; 448 + } 449 + } 450 + 451 + /** 452 + * ih_v6_1_set_rptr - set the IH ring buffer rptr 453 + * 454 + * @adev: amdgpu_device pointer 455 + * @ih: amdgpu_ih_ring pointer 456 + * 457 + * Set the IH ring buffer rptr. 458 + */ 459 + static void ih_v6_1_set_rptr(struct amdgpu_device *adev, 460 + struct amdgpu_ih_ring *ih) 461 + { 462 + struct amdgpu_ih_regs *ih_regs; 463 + 464 + if (ih->use_doorbell) { 465 + /* XXX check if swapping is necessary on BE */ 466 + *ih->rptr_cpu = ih->rptr; 467 + WDOORBELL32(ih->doorbell_index, ih->rptr); 468 + 469 + if (amdgpu_sriov_vf(adev)) 470 + ih_v6_1_irq_rearm(adev, ih); 471 + } else { 472 + ih_regs = &ih->ih_regs; 473 + WREG32(ih_regs->ih_rb_rptr, ih->rptr); 474 + } 475 + } 476 + 477 + /** 478 + * ih_v6_1_self_irq - dispatch work for ring 1 479 + * 480 + * @adev: amdgpu_device pointer 481 + * @source: irq source 482 + * @entry: IV with WPTR update 483 + * 484 + * Update the WPTR from the IV and schedule work to handle the entries. 485 + */ 486 + static int ih_v6_1_self_irq(struct amdgpu_device *adev, 487 + struct amdgpu_irq_src *source, 488 + struct amdgpu_iv_entry *entry) 489 + { 490 + uint32_t wptr = cpu_to_le32(entry->src_data[0]); 491 + 492 + switch (entry->ring_id) { 493 + case 1: 494 + *adev->irq.ih1.wptr_cpu = wptr; 495 + schedule_work(&adev->irq.ih1_work); 496 + break; 497 + default: 498 + break; 499 + } 500 + return 0; 501 + } 502 + 503 + static const struct amdgpu_irq_src_funcs ih_v6_1_self_irq_funcs = { 504 + .process = ih_v6_1_self_irq, 505 + }; 506 + 507 + static void ih_v6_1_set_self_irq_funcs(struct amdgpu_device *adev) 508 + { 509 + adev->irq.self_irq.num_types = 0; 510 + adev->irq.self_irq.funcs = &ih_v6_1_self_irq_funcs; 511 + } 512 + 513 + static int ih_v6_1_early_init(void *handle) 514 + { 515 + struct amdgpu_device *adev = (struct amdgpu_device *)handle; 516 + 517 + ih_v6_1_set_interrupt_funcs(adev); 518 + ih_v6_1_set_self_irq_funcs(adev); 519 + return 0; 520 + } 521 + 522 + static int ih_v6_1_sw_init(void *handle) 523 + { 524 + int r; 525 + struct amdgpu_device *adev = (struct amdgpu_device *)handle; 526 + bool use_bus_addr; 527 + 528 + r = amdgpu_irq_add_id(adev, SOC21_IH_CLIENTID_IH, 0, 529 + &adev->irq.self_irq); 530 + 531 + if (r) 532 + return r; 533 + 534 + /* use gpu virtual address for ih ring 535 + * until ih_checken is programmed to allow 536 + * use bus address for ih ring by psp bl */ 537 + use_bus_addr = 538 + (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) ? false : true; 539 + r = amdgpu_ih_ring_init(adev, &adev->irq.ih, 256 * 1024, use_bus_addr); 540 + if (r) 541 + return r; 542 + 543 + adev->irq.ih.use_doorbell = true; 544 + adev->irq.ih.doorbell_index = adev->doorbell_index.ih << 1; 545 + 546 + adev->irq.ih1.ring_size = 0; 547 + adev->irq.ih2.ring_size = 0; 548 + 549 + /* initialize ih control register offset */ 550 + ih_v6_1_init_register_offset(adev); 551 + 552 + r = amdgpu_ih_ring_init(adev, &adev->irq.ih_soft, PAGE_SIZE, true); 553 + if (r) 554 + return r; 555 + 556 + r = amdgpu_irq_init(adev); 557 + 558 + return r; 559 + } 560 + 561 + static int ih_v6_1_sw_fini(void *handle) 562 + { 563 + struct amdgpu_device *adev = (struct amdgpu_device *)handle; 564 + 565 + amdgpu_irq_fini_sw(adev); 566 + 567 + return 0; 568 + } 569 + 570 + static int ih_v6_1_hw_init(void *handle) 571 + { 572 + int r; 573 + struct amdgpu_device *adev = (struct amdgpu_device *)handle; 574 + 575 + r = ih_v6_1_irq_init(adev); 576 + if (r) 577 + return r; 578 + 579 + return 0; 580 + } 581 + 582 + static int ih_v6_1_hw_fini(void *handle) 583 + { 584 + struct amdgpu_device *adev = (struct amdgpu_device *)handle; 585 + 586 + ih_v6_1_irq_disable(adev); 587 + 588 + return 0; 589 + } 590 + 591 + static int ih_v6_1_suspend(void *handle) 592 + { 593 + struct amdgpu_device *adev = (struct amdgpu_device *)handle; 594 + 595 + return ih_v6_1_hw_fini(adev); 596 + } 597 + 598 + static int ih_v6_1_resume(void *handle) 599 + { 600 + struct amdgpu_device *adev = (struct amdgpu_device *)handle; 601 + 602 + return ih_v6_1_hw_init(adev); 603 + } 604 + 605 + static bool ih_v6_1_is_idle(void *handle) 606 + { 607 + /* todo */ 608 + return true; 609 + } 610 + 611 + static int ih_v6_1_wait_for_idle(void *handle) 612 + { 613 + /* todo */ 614 + return -ETIMEDOUT; 615 + } 616 + 617 + static int ih_v6_1_soft_reset(void *handle) 618 + { 619 + /* todo */ 620 + return 0; 621 + } 622 + 623 + static void ih_v6_1_update_clockgating_state(struct amdgpu_device *adev, 624 + bool enable) 625 + { 626 + uint32_t data, def, field_val; 627 + 628 + if (adev->cg_flags & AMD_CG_SUPPORT_IH_CG) { 629 + def = data = RREG32_SOC15(OSSSYS, 0, regIH_CLK_CTRL); 630 + field_val = enable ? 0 : 1; 631 + data = REG_SET_FIELD(data, IH_CLK_CTRL, 632 + DBUS_MUX_CLK_SOFT_OVERRIDE, field_val); 633 + data = REG_SET_FIELD(data, IH_CLK_CTRL, 634 + OSSSYS_SHARE_CLK_SOFT_OVERRIDE, field_val); 635 + data = REG_SET_FIELD(data, IH_CLK_CTRL, 636 + LIMIT_SMN_CLK_SOFT_OVERRIDE, field_val); 637 + data = REG_SET_FIELD(data, IH_CLK_CTRL, 638 + DYN_CLK_SOFT_OVERRIDE, field_val); 639 + data = REG_SET_FIELD(data, IH_CLK_CTRL, 640 + REG_CLK_SOFT_OVERRIDE, field_val); 641 + if (def != data) 642 + WREG32_SOC15(OSSSYS, 0, regIH_CLK_CTRL, data); 643 + } 644 + 645 + return; 646 + } 647 + 648 + static int ih_v6_1_set_clockgating_state(void *handle, 649 + enum amd_clockgating_state state) 650 + { 651 + struct amdgpu_device *adev = (struct amdgpu_device *)handle; 652 + 653 + ih_v6_1_update_clockgating_state(adev, 654 + state == AMD_CG_STATE_GATE); 655 + return 0; 656 + } 657 + 658 + static void ih_v6_1_update_ih_mem_power_gating(struct amdgpu_device *adev, 659 + bool enable) 660 + { 661 + uint32_t ih_mem_pwr_cntl; 662 + 663 + /* Disable ih sram power cntl before switch powergating mode */ 664 + ih_mem_pwr_cntl = RREG32_SOC15(OSSSYS, 0, regIH_MEM_POWER_CTRL); 665 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 666 + IH_BUFFER_MEM_POWER_CTRL_EN, 0); 667 + WREG32_SOC15(OSSSYS, 0, regIH_MEM_POWER_CTRL, ih_mem_pwr_cntl); 668 + 669 + /* It is recommended to set mem powergating mode to DS mode */ 670 + if (enable) { 671 + /* mem power mode */ 672 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 673 + IH_BUFFER_MEM_POWER_LS_EN, 0); 674 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 675 + IH_BUFFER_MEM_POWER_DS_EN, 1); 676 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 677 + IH_BUFFER_MEM_POWER_SD_EN, 0); 678 + /* cam mem power mode */ 679 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 680 + IH_RETRY_INT_CAM_MEM_POWER_LS_EN, 0); 681 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 682 + IH_RETRY_INT_CAM_MEM_POWER_DS_EN, 1); 683 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 684 + IH_RETRY_INT_CAM_MEM_POWER_SD_EN, 0); 685 + /* re-enable power cntl */ 686 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 687 + IH_BUFFER_MEM_POWER_CTRL_EN, 1); 688 + } else { 689 + /* mem power mode */ 690 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 691 + IH_BUFFER_MEM_POWER_LS_EN, 0); 692 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 693 + IH_BUFFER_MEM_POWER_DS_EN, 0); 694 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 695 + IH_BUFFER_MEM_POWER_SD_EN, 0); 696 + /* cam mem power mode */ 697 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 698 + IH_RETRY_INT_CAM_MEM_POWER_LS_EN, 0); 699 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 700 + IH_RETRY_INT_CAM_MEM_POWER_DS_EN, 0); 701 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 702 + IH_RETRY_INT_CAM_MEM_POWER_SD_EN, 0); 703 + /* re-enable power cntl*/ 704 + ih_mem_pwr_cntl = REG_SET_FIELD(ih_mem_pwr_cntl, IH_MEM_POWER_CTRL, 705 + IH_BUFFER_MEM_POWER_CTRL_EN, 1); 706 + } 707 + 708 + WREG32_SOC15(OSSSYS, 0, regIH_MEM_POWER_CTRL, ih_mem_pwr_cntl); 709 + } 710 + 711 + static int ih_v6_1_set_powergating_state(void *handle, 712 + enum amd_powergating_state state) 713 + { 714 + struct amdgpu_device *adev = (struct amdgpu_device *)handle; 715 + bool enable = (state == AMD_PG_STATE_GATE); 716 + 717 + if (adev->pg_flags & AMD_PG_SUPPORT_IH_SRAM_PG) 718 + ih_v6_1_update_ih_mem_power_gating(adev, enable); 719 + 720 + return 0; 721 + } 722 + 723 + static void ih_v6_1_get_clockgating_state(void *handle, u64 *flags) 724 + { 725 + struct amdgpu_device *adev = (struct amdgpu_device *)handle; 726 + 727 + if (!RREG32_SOC15(OSSSYS, 0, regIH_CLK_CTRL)) 728 + *flags |= AMD_CG_SUPPORT_IH_CG; 729 + 730 + return; 731 + } 732 + 733 + static const struct amd_ip_funcs ih_v6_1_ip_funcs = { 734 + .name = "ih_v6_1", 735 + .early_init = ih_v6_1_early_init, 736 + .late_init = NULL, 737 + .sw_init = ih_v6_1_sw_init, 738 + .sw_fini = ih_v6_1_sw_fini, 739 + .hw_init = ih_v6_1_hw_init, 740 + .hw_fini = ih_v6_1_hw_fini, 741 + .suspend = ih_v6_1_suspend, 742 + .resume = ih_v6_1_resume, 743 + .is_idle = ih_v6_1_is_idle, 744 + .wait_for_idle = ih_v6_1_wait_for_idle, 745 + .soft_reset = ih_v6_1_soft_reset, 746 + .set_clockgating_state = ih_v6_1_set_clockgating_state, 747 + .set_powergating_state = ih_v6_1_set_powergating_state, 748 + .get_clockgating_state = ih_v6_1_get_clockgating_state, 749 + }; 750 + 751 + static const struct amdgpu_ih_funcs ih_v6_1_funcs = { 752 + .get_wptr = ih_v6_1_get_wptr, 753 + .decode_iv = amdgpu_ih_decode_iv_helper, 754 + .decode_iv_ts = amdgpu_ih_decode_iv_ts_helper, 755 + .set_rptr = ih_v6_1_set_rptr 756 + }; 757 + 758 + static void ih_v6_1_set_interrupt_funcs(struct amdgpu_device *adev) 759 + { 760 + adev->irq.ih_funcs = &ih_v6_1_funcs; 761 + } 762 + 763 + const struct amdgpu_ip_block_version ih_v6_1_ip_block = { 764 + .type = AMD_IP_BLOCK_TYPE_IH, 765 + .major = 6, 766 + .minor = 0, 767 + .rev = 0, 768 + .funcs = &ih_v6_1_ip_funcs, 769 + };
+28
drivers/gpu/drm/amd/amdgpu/ih_v6_1.h
··· 1 + /* 2 + * Copyright 2023 Advanced Micro Devices, Inc. 3 + * 4 + * Permission is hereby granted, free of charge, to any person obtaining a 5 + * copy of this software and associated documentation files (the "Software"), 6 + * to deal in the Software without restriction, including without limitation 7 + * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8 + * and/or sell copies of the Software, and to permit persons to whom the 9 + * Software is furnished to do so, subject to the following conditions: 10 + * 11 + * The above copyright notice and this permission notice shall be included in 12 + * all copies or substantial portions of the Software. 13 + * 14 + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 15 + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 16 + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 17 + * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 18 + * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 19 + * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 20 + * OTHER DEALINGS IN THE SOFTWARE. 21 + * 22 + */ 23 + #ifndef __IH_V6_1_IH_H__ 24 + #define __IH_V6_1_IH_H__ 25 + 26 + extern const struct amdgpu_ip_block_version ih_v6_1_ip_block; 27 + 28 + #endif