Linux kernel mirror (for testing)
git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
kernel
os
linux
1/*
2 * Copyright 2019 Advanced Micro Devices, Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
21 *
22 */
23
24#include <linux/pci.h>
25
26#include "amdgpu.h"
27#include "amdgpu_ih.h"
28
29#include "oss/osssys_5_0_0_offset.h"
30#include "oss/osssys_5_0_0_sh_mask.h"
31
32#include "soc15_common.h"
33#include "navi10_ih.h"
34
35#define MAX_REARM_RETRY 10
36
37static void navi10_ih_set_interrupt_funcs(struct amdgpu_device *adev);
38
39/**
40 * navi10_ih_enable_interrupts - Enable the interrupt ring buffer
41 *
42 * @adev: amdgpu_device pointer
43 *
44 * Enable the interrupt ring buffer (NAVI10).
45 */
46static void navi10_ih_enable_interrupts(struct amdgpu_device *adev)
47{
48 u32 ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL);
49
50 ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RB_ENABLE, 1);
51 ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, ENABLE_INTR, 1);
52 WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL, ih_rb_cntl);
53 adev->irq.ih.enabled = true;
54}
55
56/**
57 * navi10_ih_disable_interrupts - Disable the interrupt ring buffer
58 *
59 * @adev: amdgpu_device pointer
60 *
61 * Disable the interrupt ring buffer (NAVI10).
62 */
63static void navi10_ih_disable_interrupts(struct amdgpu_device *adev)
64{
65 u32 ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL);
66
67 ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RB_ENABLE, 0);
68 ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, ENABLE_INTR, 0);
69 WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL, ih_rb_cntl);
70 /* set rptr, wptr to 0 */
71 WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR, 0);
72 WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR, 0);
73 adev->irq.ih.enabled = false;
74 adev->irq.ih.rptr = 0;
75}
76
77static uint32_t navi10_ih_rb_cntl(struct amdgpu_ih_ring *ih, uint32_t ih_rb_cntl)
78{
79 int rb_bufsz = order_base_2(ih->ring_size / 4);
80
81 ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
82 MC_SPACE, ih->use_bus_addr ? 1 : 4);
83 ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
84 WPTR_OVERFLOW_CLEAR, 1);
85 ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
86 WPTR_OVERFLOW_ENABLE, 1);
87 ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RB_SIZE, rb_bufsz);
88 /* Ring Buffer write pointer writeback. If enabled, IH_RB_WPTR register
89 * value is written to memory
90 */
91 ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
92 WPTR_WRITEBACK_ENABLE, 1);
93 ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_SNOOP, 1);
94 ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_RO, 0);
95 ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_VMID, 0);
96
97 return ih_rb_cntl;
98}
99
100/**
101 * navi10_ih_irq_init - init and enable the interrupt ring
102 *
103 * @adev: amdgpu_device pointer
104 *
105 * Allocate a ring buffer for the interrupt controller,
106 * enable the RLC, disable interrupts, enable the IH
107 * ring buffer and enable it (NAVI).
108 * Called at device load and reume.
109 * Returns 0 for success, errors for failure.
110 */
111static int navi10_ih_irq_init(struct amdgpu_device *adev)
112{
113 struct amdgpu_ih_ring *ih = &adev->irq.ih;
114 u32 ih_rb_cntl, ih_doorbell_rtpr, ih_chicken;
115 u32 tmp;
116
117 /* disable irqs */
118 navi10_ih_disable_interrupts(adev);
119
120 adev->nbio.funcs->ih_control(adev);
121
122 /* Ring Buffer base. [39:8] of 40-bit address of the beginning of the ring buffer*/
123 WREG32_SOC15(OSSSYS, 0, mmIH_RB_BASE, ih->gpu_addr >> 8);
124 WREG32_SOC15(OSSSYS, 0, mmIH_RB_BASE_HI, (ih->gpu_addr >> 40) & 0xff);
125
126 ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL);
127 ih_rb_cntl = navi10_ih_rb_cntl(ih, ih_rb_cntl);
128 ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RPTR_REARM,
129 !!adev->irq.msi_enabled);
130
131 if (unlikely(adev->firmware.load_type == AMDGPU_FW_LOAD_DIRECT)) {
132 if (ih->use_bus_addr) {
133 ih_chicken = RREG32_SOC15(OSSSYS, 0, mmIH_CHICKEN);
134 ih_chicken = REG_SET_FIELD(ih_chicken,
135 IH_CHICKEN, MC_SPACE_GPA_ENABLE, 1);
136 WREG32_SOC15(OSSSYS, 0, mmIH_CHICKEN, ih_chicken);
137 }
138 }
139
140 WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL, ih_rb_cntl);
141
142 /* set the writeback address whether it's enabled or not */
143 WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR_ADDR_LO,
144 lower_32_bits(ih->wptr_addr));
145 WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR_ADDR_HI,
146 upper_32_bits(ih->wptr_addr) & 0xFFFF);
147
148 /* set rptr, wptr to 0 */
149 WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR, 0);
150 WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR, 0);
151
152 ih_doorbell_rtpr = RREG32_SOC15(OSSSYS, 0, mmIH_DOORBELL_RPTR);
153 if (ih->use_doorbell) {
154 ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr,
155 IH_DOORBELL_RPTR, OFFSET,
156 ih->doorbell_index);
157 ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr,
158 IH_DOORBELL_RPTR, ENABLE, 1);
159 } else {
160 ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr,
161 IH_DOORBELL_RPTR, ENABLE, 0);
162 }
163 WREG32_SOC15(OSSSYS, 0, mmIH_DOORBELL_RPTR, ih_doorbell_rtpr);
164
165 adev->nbio.funcs->ih_doorbell_range(adev, ih->use_doorbell,
166 ih->doorbell_index);
167
168 tmp = RREG32_SOC15(OSSSYS, 0, mmIH_STORM_CLIENT_LIST_CNTL);
169 tmp = REG_SET_FIELD(tmp, IH_STORM_CLIENT_LIST_CNTL,
170 CLIENT18_IS_STORM_CLIENT, 1);
171 WREG32_SOC15(OSSSYS, 0, mmIH_STORM_CLIENT_LIST_CNTL, tmp);
172
173 tmp = RREG32_SOC15(OSSSYS, 0, mmIH_INT_FLOOD_CNTL);
174 tmp = REG_SET_FIELD(tmp, IH_INT_FLOOD_CNTL, FLOOD_CNTL_ENABLE, 1);
175 WREG32_SOC15(OSSSYS, 0, mmIH_INT_FLOOD_CNTL, tmp);
176
177 pci_set_master(adev->pdev);
178
179 /* enable interrupts */
180 navi10_ih_enable_interrupts(adev);
181
182 return 0;
183}
184
185/**
186 * navi10_ih_irq_disable - disable interrupts
187 *
188 * @adev: amdgpu_device pointer
189 *
190 * Disable interrupts on the hw (NAVI10).
191 */
192static void navi10_ih_irq_disable(struct amdgpu_device *adev)
193{
194 navi10_ih_disable_interrupts(adev);
195
196 /* Wait and acknowledge irq */
197 mdelay(1);
198}
199
200/**
201 * navi10_ih_get_wptr - get the IH ring buffer wptr
202 *
203 * @adev: amdgpu_device pointer
204 *
205 * Get the IH ring buffer wptr from either the register
206 * or the writeback memory buffer (NAVI10). Also check for
207 * ring buffer overflow and deal with it.
208 * Returns the value of the wptr.
209 */
210static u32 navi10_ih_get_wptr(struct amdgpu_device *adev,
211 struct amdgpu_ih_ring *ih)
212{
213 u32 wptr, reg, tmp;
214
215 wptr = le32_to_cpu(*ih->wptr_cpu);
216
217 if (!REG_GET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW))
218 goto out;
219
220 reg = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_WPTR);
221 wptr = RREG32_NO_KIQ(reg);
222 if (!REG_GET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW))
223 goto out;
224 wptr = REG_SET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW, 0);
225
226 /* When a ring buffer overflow happen start parsing interrupt
227 * from the last not overwritten vector (wptr + 32). Hopefully
228 * this should allow us to catch up.
229 */
230 tmp = (wptr + 32) & ih->ptr_mask;
231 dev_warn(adev->dev, "IH ring buffer overflow "
232 "(0x%08X, 0x%08X, 0x%08X)\n",
233 wptr, ih->rptr, tmp);
234 ih->rptr = tmp;
235
236 reg = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_CNTL);
237 tmp = RREG32_NO_KIQ(reg);
238 tmp = REG_SET_FIELD(tmp, IH_RB_CNTL, WPTR_OVERFLOW_CLEAR, 1);
239 WREG32_NO_KIQ(reg, tmp);
240out:
241 return (wptr & ih->ptr_mask);
242}
243
244/**
245 * navi10_ih_decode_iv - decode an interrupt vector
246 *
247 * @adev: amdgpu_device pointer
248 *
249 * Decodes the interrupt vector at the current rptr
250 * position and also advance the position.
251 */
252static void navi10_ih_decode_iv(struct amdgpu_device *adev,
253 struct amdgpu_ih_ring *ih,
254 struct amdgpu_iv_entry *entry)
255{
256 /* wptr/rptr are in bytes! */
257 u32 ring_index = ih->rptr >> 2;
258 uint32_t dw[8];
259
260 dw[0] = le32_to_cpu(ih->ring[ring_index + 0]);
261 dw[1] = le32_to_cpu(ih->ring[ring_index + 1]);
262 dw[2] = le32_to_cpu(ih->ring[ring_index + 2]);
263 dw[3] = le32_to_cpu(ih->ring[ring_index + 3]);
264 dw[4] = le32_to_cpu(ih->ring[ring_index + 4]);
265 dw[5] = le32_to_cpu(ih->ring[ring_index + 5]);
266 dw[6] = le32_to_cpu(ih->ring[ring_index + 6]);
267 dw[7] = le32_to_cpu(ih->ring[ring_index + 7]);
268
269 entry->client_id = dw[0] & 0xff;
270 entry->src_id = (dw[0] >> 8) & 0xff;
271 entry->ring_id = (dw[0] >> 16) & 0xff;
272 entry->vmid = (dw[0] >> 24) & 0xf;
273 entry->vmid_src = (dw[0] >> 31);
274 entry->timestamp = dw[1] | ((u64)(dw[2] & 0xffff) << 32);
275 entry->timestamp_src = dw[2] >> 31;
276 entry->pasid = dw[3] & 0xffff;
277 entry->pasid_src = dw[3] >> 31;
278 entry->src_data[0] = dw[4];
279 entry->src_data[1] = dw[5];
280 entry->src_data[2] = dw[6];
281 entry->src_data[3] = dw[7];
282
283 /* wptr/rptr are in bytes! */
284 ih->rptr += 32;
285}
286
287/**
288 * navi10_ih_irq_rearm - rearm IRQ if lost
289 *
290 * @adev: amdgpu_device pointer
291 *
292 */
293static void navi10_ih_irq_rearm(struct amdgpu_device *adev,
294 struct amdgpu_ih_ring *ih)
295{
296 uint32_t reg_rptr = 0;
297 uint32_t v = 0;
298 uint32_t i = 0;
299
300 if (ih == &adev->irq.ih)
301 reg_rptr = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_RPTR);
302 else if (ih == &adev->irq.ih1)
303 reg_rptr = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_RPTR_RING1);
304 else if (ih == &adev->irq.ih2)
305 reg_rptr = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_RPTR_RING2);
306 else
307 return;
308
309 /* Rearm IRQ / re-write doorbell if doorbell write is lost */
310 for (i = 0; i < MAX_REARM_RETRY; i++) {
311 v = RREG32_NO_KIQ(reg_rptr);
312 if ((v < ih->ring_size) && (v != ih->rptr))
313 WDOORBELL32(ih->doorbell_index, ih->rptr);
314 else
315 break;
316 }
317}
318
319/**
320 * navi10_ih_set_rptr - set the IH ring buffer rptr
321 *
322 * @adev: amdgpu_device pointer
323 *
324 * Set the IH ring buffer rptr.
325 */
326static void navi10_ih_set_rptr(struct amdgpu_device *adev,
327 struct amdgpu_ih_ring *ih)
328{
329 if (ih->use_doorbell) {
330 /* XXX check if swapping is necessary on BE */
331 *ih->rptr_cpu = ih->rptr;
332 WDOORBELL32(ih->doorbell_index, ih->rptr);
333
334 if (amdgpu_sriov_vf(adev))
335 navi10_ih_irq_rearm(adev, ih);
336 } else
337 WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR, ih->rptr);
338}
339
340static int navi10_ih_early_init(void *handle)
341{
342 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
343
344 navi10_ih_set_interrupt_funcs(adev);
345 return 0;
346}
347
348static int navi10_ih_sw_init(void *handle)
349{
350 int r;
351 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
352 bool use_bus_addr;
353
354 /* use gpu virtual address for ih ring
355 * until ih_checken is programmed to allow
356 * use bus address for ih ring by psp bl */
357 use_bus_addr =
358 (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) ? false : true;
359 r = amdgpu_ih_ring_init(adev, &adev->irq.ih, 256 * 1024, use_bus_addr);
360 if (r)
361 return r;
362
363 adev->irq.ih.use_doorbell = true;
364 adev->irq.ih.doorbell_index = adev->doorbell_index.ih << 1;
365
366 r = amdgpu_irq_init(adev);
367
368 return r;
369}
370
371static int navi10_ih_sw_fini(void *handle)
372{
373 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
374
375 amdgpu_irq_fini(adev);
376 amdgpu_ih_ring_fini(adev, &adev->irq.ih);
377
378 return 0;
379}
380
381static int navi10_ih_hw_init(void *handle)
382{
383 int r;
384 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
385
386 r = navi10_ih_irq_init(adev);
387 if (r)
388 return r;
389
390 return 0;
391}
392
393static int navi10_ih_hw_fini(void *handle)
394{
395 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
396
397 navi10_ih_irq_disable(adev);
398
399 return 0;
400}
401
402static int navi10_ih_suspend(void *handle)
403{
404 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
405
406 return navi10_ih_hw_fini(adev);
407}
408
409static int navi10_ih_resume(void *handle)
410{
411 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
412
413 return navi10_ih_hw_init(adev);
414}
415
416static bool navi10_ih_is_idle(void *handle)
417{
418 /* todo */
419 return true;
420}
421
422static int navi10_ih_wait_for_idle(void *handle)
423{
424 /* todo */
425 return -ETIMEDOUT;
426}
427
428static int navi10_ih_soft_reset(void *handle)
429{
430 /* todo */
431 return 0;
432}
433
434static void navi10_ih_update_clockgating_state(struct amdgpu_device *adev,
435 bool enable)
436{
437 uint32_t data, def, field_val;
438
439 if (adev->cg_flags & AMD_CG_SUPPORT_IH_CG) {
440 def = data = RREG32_SOC15(OSSSYS, 0, mmIH_CLK_CTRL);
441 field_val = enable ? 0 : 1;
442 data = REG_SET_FIELD(data, IH_CLK_CTRL,
443 DBUS_MUX_CLK_SOFT_OVERRIDE, field_val);
444 data = REG_SET_FIELD(data, IH_CLK_CTRL,
445 OSSSYS_SHARE_CLK_SOFT_OVERRIDE, field_val);
446 data = REG_SET_FIELD(data, IH_CLK_CTRL,
447 LIMIT_SMN_CLK_SOFT_OVERRIDE, field_val);
448 data = REG_SET_FIELD(data, IH_CLK_CTRL,
449 DYN_CLK_SOFT_OVERRIDE, field_val);
450 data = REG_SET_FIELD(data, IH_CLK_CTRL,
451 REG_CLK_SOFT_OVERRIDE, field_val);
452 if (def != data)
453 WREG32_SOC15(OSSSYS, 0, mmIH_CLK_CTRL, data);
454 }
455
456 return;
457}
458
459static int navi10_ih_set_clockgating_state(void *handle,
460 enum amd_clockgating_state state)
461{
462 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
463
464 navi10_ih_update_clockgating_state(adev,
465 state == AMD_CG_STATE_GATE);
466 return 0;
467}
468
469static int navi10_ih_set_powergating_state(void *handle,
470 enum amd_powergating_state state)
471{
472 return 0;
473}
474
475static void navi10_ih_get_clockgating_state(void *handle, u32 *flags)
476{
477 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
478
479 if (!RREG32_SOC15(OSSSYS, 0, mmIH_CLK_CTRL))
480 *flags |= AMD_CG_SUPPORT_IH_CG;
481
482 return;
483}
484
485static const struct amd_ip_funcs navi10_ih_ip_funcs = {
486 .name = "navi10_ih",
487 .early_init = navi10_ih_early_init,
488 .late_init = NULL,
489 .sw_init = navi10_ih_sw_init,
490 .sw_fini = navi10_ih_sw_fini,
491 .hw_init = navi10_ih_hw_init,
492 .hw_fini = navi10_ih_hw_fini,
493 .suspend = navi10_ih_suspend,
494 .resume = navi10_ih_resume,
495 .is_idle = navi10_ih_is_idle,
496 .wait_for_idle = navi10_ih_wait_for_idle,
497 .soft_reset = navi10_ih_soft_reset,
498 .set_clockgating_state = navi10_ih_set_clockgating_state,
499 .set_powergating_state = navi10_ih_set_powergating_state,
500 .get_clockgating_state = navi10_ih_get_clockgating_state,
501};
502
503static const struct amdgpu_ih_funcs navi10_ih_funcs = {
504 .get_wptr = navi10_ih_get_wptr,
505 .decode_iv = navi10_ih_decode_iv,
506 .set_rptr = navi10_ih_set_rptr
507};
508
509static void navi10_ih_set_interrupt_funcs(struct amdgpu_device *adev)
510{
511 if (adev->irq.ih_funcs == NULL)
512 adev->irq.ih_funcs = &navi10_ih_funcs;
513}
514
515const struct amdgpu_ip_block_version navi10_ih_ip_block =
516{
517 .type = AMD_IP_BLOCK_TYPE_IH,
518 .major = 5,
519 .minor = 0,
520 .rev = 0,
521 .funcs = &navi10_ih_ip_funcs,
522};