Linux kernel mirror (for testing)
git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
kernel
os
linux
1/*
2 * Copyright 2016 Advanced Micro Devices, Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
21 *
22 */
23#include <linux/firmware.h>
24#include <linux/slab.h>
25#include <linux/module.h>
26#include <linux/pci.h>
27
28#include <drm/amdgpu_drm.h>
29
30#include "amdgpu.h"
31#include "amdgpu_ih.h"
32#include "amdgpu_uvd.h"
33#include "amdgpu_vce.h"
34#include "amdgpu_ucode.h"
35#include "amdgpu_psp.h"
36#include "atom.h"
37#include "amd_pcie.h"
38
39#include "uvd/uvd_7_0_offset.h"
40#include "gc/gc_9_0_offset.h"
41#include "gc/gc_9_0_sh_mask.h"
42#include "sdma0/sdma0_4_0_offset.h"
43#include "sdma1/sdma1_4_0_offset.h"
44#include "nbio/nbio_7_0_default.h"
45#include "nbio/nbio_7_0_offset.h"
46#include "nbio/nbio_7_0_sh_mask.h"
47#include "nbio/nbio_7_0_smn.h"
48#include "mp/mp_9_0_offset.h"
49
50#include "soc15.h"
51#include "soc15_common.h"
52#include "gfx_v9_0.h"
53#include "gmc_v9_0.h"
54#include "gfxhub_v1_0.h"
55#include "mmhub_v1_0.h"
56#include "df_v1_7.h"
57#include "df_v3_6.h"
58#include "nbio_v6_1.h"
59#include "nbio_v7_0.h"
60#include "nbio_v7_4.h"
61#include "hdp_v4_0.h"
62#include "vega10_ih.h"
63#include "vega20_ih.h"
64#include "navi10_ih.h"
65#include "sdma_v4_0.h"
66#include "uvd_v7_0.h"
67#include "vce_v4_0.h"
68#include "vcn_v1_0.h"
69#include "vcn_v2_0.h"
70#include "jpeg_v2_0.h"
71#include "vcn_v2_5.h"
72#include "jpeg_v2_5.h"
73#include "smuio_v9_0.h"
74#include "smuio_v11_0.h"
75#include "smuio_v13_0.h"
76#include "amdgpu_vkms.h"
77#include "mxgpu_ai.h"
78#include "amdgpu_ras.h"
79#include "amdgpu_xgmi.h"
80#include <uapi/linux/kfd_ioctl.h>
81
82#define mmMP0_MISC_CGTT_CTRL0 0x01b9
83#define mmMP0_MISC_CGTT_CTRL0_BASE_IDX 0
84#define mmMP0_MISC_LIGHT_SLEEP_CTRL 0x01ba
85#define mmMP0_MISC_LIGHT_SLEEP_CTRL_BASE_IDX 0
86
87static const struct amd_ip_funcs soc15_common_ip_funcs;
88
89/* Vega, Raven, Arcturus */
90static const struct amdgpu_video_codec_info vega_video_codecs_encode_array[] =
91{
92 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4_AVC, 4096, 4096, 0)},
93 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_HEVC, 4096, 4096, 0)},
94};
95
96static const struct amdgpu_video_codecs vega_video_codecs_encode =
97{
98 .codec_count = ARRAY_SIZE(vega_video_codecs_encode_array),
99 .codec_array = vega_video_codecs_encode_array,
100};
101
102/* Vega */
103static const struct amdgpu_video_codec_info vega_video_codecs_decode_array[] =
104{
105 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG2, 1920, 1088, 3)},
106 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4, 1920, 1088, 5)},
107 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4_AVC, 4096, 4096, 52)},
108 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_VC1, 1920, 1088, 4)},
109 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_HEVC, 4096, 4096, 186)},
110};
111
112static const struct amdgpu_video_codecs vega_video_codecs_decode =
113{
114 .codec_count = ARRAY_SIZE(vega_video_codecs_decode_array),
115 .codec_array = vega_video_codecs_decode_array,
116};
117
118/* Raven */
119static const struct amdgpu_video_codec_info rv_video_codecs_decode_array[] =
120{
121 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG2, 1920, 1088, 3)},
122 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4, 1920, 1088, 5)},
123 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4_AVC, 4096, 4096, 52)},
124 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_VC1, 1920, 1088, 4)},
125 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_HEVC, 4096, 4096, 186)},
126 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_JPEG, 8192, 8192, 0)},
127 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_VP9, 4096, 4096, 0)},
128};
129
130static const struct amdgpu_video_codecs rv_video_codecs_decode =
131{
132 .codec_count = ARRAY_SIZE(rv_video_codecs_decode_array),
133 .codec_array = rv_video_codecs_decode_array,
134};
135
136/* Renoir, Arcturus */
137static const struct amdgpu_video_codec_info rn_video_codecs_decode_array[] =
138{
139 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG2, 1920, 1088, 3)},
140 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4, 1920, 1088, 5)},
141 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4_AVC, 4096, 4096, 52)},
142 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_VC1, 1920, 1088, 4)},
143 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_HEVC, 8192, 4352, 186)},
144 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_JPEG, 16384, 16384, 0)},
145 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_VP9, 8192, 4352, 0)},
146};
147
148static const struct amdgpu_video_codecs rn_video_codecs_decode =
149{
150 .codec_count = ARRAY_SIZE(rn_video_codecs_decode_array),
151 .codec_array = rn_video_codecs_decode_array,
152};
153
154static const struct amdgpu_video_codec_info vcn_4_0_3_video_codecs_decode_array[] = {
155 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4_AVC, 4096, 4096, 52)},
156 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_HEVC, 8192, 4352, 186)},
157 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_JPEG, 16384, 16384, 0)},
158 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_VP9, 8192, 4352, 0)},
159 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_AV1, 8192, 4352, 0)},
160};
161
162static const struct amdgpu_video_codecs vcn_4_0_3_video_codecs_decode = {
163 .codec_count = ARRAY_SIZE(vcn_4_0_3_video_codecs_decode_array),
164 .codec_array = vcn_4_0_3_video_codecs_decode_array,
165};
166
167static const struct amdgpu_video_codecs vcn_4_0_3_video_codecs_encode = {
168 .codec_count = 0,
169 .codec_array = NULL,
170};
171
172static const struct amdgpu_video_codecs vcn_5_0_1_video_codecs_encode_vcn0 = {
173 .codec_count = 0,
174 .codec_array = NULL,
175};
176
177static const struct amdgpu_video_codec_info vcn_5_0_1_video_codecs_decode_array_vcn0[] = {
178 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4_AVC, 4096, 4096, 52)},
179 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_HEVC, 8192, 4352, 186)},
180 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_JPEG, 16384, 16384, 0)},
181 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_VP9, 8192, 4352, 0)},
182 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_AV1, 8192, 4352, 0)},
183};
184
185static const struct amdgpu_video_codecs vcn_5_0_1_video_codecs_decode_vcn0 = {
186 .codec_count = ARRAY_SIZE(vcn_5_0_1_video_codecs_decode_array_vcn0),
187 .codec_array = vcn_5_0_1_video_codecs_decode_array_vcn0,
188};
189
190static int soc15_query_video_codecs(struct amdgpu_device *adev, bool encode,
191 const struct amdgpu_video_codecs **codecs)
192{
193 if (amdgpu_ip_version(adev, VCE_HWIP, 0)) {
194 switch (amdgpu_ip_version(adev, VCE_HWIP, 0)) {
195 case IP_VERSION(4, 0, 0):
196 case IP_VERSION(4, 1, 0):
197 if (encode)
198 *codecs = &vega_video_codecs_encode;
199 else
200 *codecs = &vega_video_codecs_decode;
201 return 0;
202 default:
203 return -EINVAL;
204 }
205 } else {
206 switch (amdgpu_ip_version(adev, UVD_HWIP, 0)) {
207 case IP_VERSION(1, 0, 0):
208 case IP_VERSION(1, 0, 1):
209 if (encode)
210 *codecs = &vega_video_codecs_encode;
211 else
212 *codecs = &rv_video_codecs_decode;
213 return 0;
214 case IP_VERSION(2, 5, 0):
215 case IP_VERSION(2, 6, 0):
216 case IP_VERSION(2, 2, 0):
217 if (encode)
218 *codecs = &vega_video_codecs_encode;
219 else
220 *codecs = &rn_video_codecs_decode;
221 return 0;
222 case IP_VERSION(4, 0, 3):
223 if (encode)
224 *codecs = &vcn_4_0_3_video_codecs_encode;
225 else
226 *codecs = &vcn_4_0_3_video_codecs_decode;
227 return 0;
228 case IP_VERSION(5, 0, 1):
229 if (encode)
230 *codecs = &vcn_5_0_1_video_codecs_encode_vcn0;
231 else
232 *codecs = &vcn_5_0_1_video_codecs_decode_vcn0;
233 return 0;
234 default:
235 return -EINVAL;
236 }
237 }
238}
239
240static u32 soc15_uvd_ctx_rreg(struct amdgpu_device *adev, u32 reg)
241{
242 unsigned long flags, address, data;
243 u32 r;
244
245 address = SOC15_REG_OFFSET(UVD, 0, mmUVD_CTX_INDEX);
246 data = SOC15_REG_OFFSET(UVD, 0, mmUVD_CTX_DATA);
247
248 spin_lock_irqsave(&adev->uvd_ctx_idx_lock, flags);
249 WREG32(address, ((reg) & 0x1ff));
250 r = RREG32(data);
251 spin_unlock_irqrestore(&adev->uvd_ctx_idx_lock, flags);
252 return r;
253}
254
255static void soc15_uvd_ctx_wreg(struct amdgpu_device *adev, u32 reg, u32 v)
256{
257 unsigned long flags, address, data;
258
259 address = SOC15_REG_OFFSET(UVD, 0, mmUVD_CTX_INDEX);
260 data = SOC15_REG_OFFSET(UVD, 0, mmUVD_CTX_DATA);
261
262 spin_lock_irqsave(&adev->uvd_ctx_idx_lock, flags);
263 WREG32(address, ((reg) & 0x1ff));
264 WREG32(data, (v));
265 spin_unlock_irqrestore(&adev->uvd_ctx_idx_lock, flags);
266}
267
268static u32 soc15_didt_rreg(struct amdgpu_device *adev, u32 reg)
269{
270 unsigned long flags, address, data;
271 u32 r;
272
273 address = SOC15_REG_OFFSET(GC, 0, mmDIDT_IND_INDEX);
274 data = SOC15_REG_OFFSET(GC, 0, mmDIDT_IND_DATA);
275
276 spin_lock_irqsave(&adev->didt_idx_lock, flags);
277 WREG32(address, (reg));
278 r = RREG32(data);
279 spin_unlock_irqrestore(&adev->didt_idx_lock, flags);
280 return r;
281}
282
283static void soc15_didt_wreg(struct amdgpu_device *adev, u32 reg, u32 v)
284{
285 unsigned long flags, address, data;
286
287 address = SOC15_REG_OFFSET(GC, 0, mmDIDT_IND_INDEX);
288 data = SOC15_REG_OFFSET(GC, 0, mmDIDT_IND_DATA);
289
290 spin_lock_irqsave(&adev->didt_idx_lock, flags);
291 WREG32(address, (reg));
292 WREG32(data, (v));
293 spin_unlock_irqrestore(&adev->didt_idx_lock, flags);
294}
295
296static u32 soc15_gc_cac_rreg(struct amdgpu_device *adev, u32 reg)
297{
298 unsigned long flags;
299 u32 r;
300
301 spin_lock_irqsave(&adev->gc_cac_idx_lock, flags);
302 WREG32_SOC15(GC, 0, mmGC_CAC_IND_INDEX, (reg));
303 r = RREG32_SOC15(GC, 0, mmGC_CAC_IND_DATA);
304 spin_unlock_irqrestore(&adev->gc_cac_idx_lock, flags);
305 return r;
306}
307
308static void soc15_gc_cac_wreg(struct amdgpu_device *adev, u32 reg, u32 v)
309{
310 unsigned long flags;
311
312 spin_lock_irqsave(&adev->gc_cac_idx_lock, flags);
313 WREG32_SOC15(GC, 0, mmGC_CAC_IND_INDEX, (reg));
314 WREG32_SOC15(GC, 0, mmGC_CAC_IND_DATA, (v));
315 spin_unlock_irqrestore(&adev->gc_cac_idx_lock, flags);
316}
317
318static u32 soc15_se_cac_rreg(struct amdgpu_device *adev, u32 reg)
319{
320 unsigned long flags;
321 u32 r;
322
323 spin_lock_irqsave(&adev->se_cac_idx_lock, flags);
324 WREG32_SOC15(GC, 0, mmSE_CAC_IND_INDEX, (reg));
325 r = RREG32_SOC15(GC, 0, mmSE_CAC_IND_DATA);
326 spin_unlock_irqrestore(&adev->se_cac_idx_lock, flags);
327 return r;
328}
329
330static void soc15_se_cac_wreg(struct amdgpu_device *adev, u32 reg, u32 v)
331{
332 unsigned long flags;
333
334 spin_lock_irqsave(&adev->se_cac_idx_lock, flags);
335 WREG32_SOC15(GC, 0, mmSE_CAC_IND_INDEX, (reg));
336 WREG32_SOC15(GC, 0, mmSE_CAC_IND_DATA, (v));
337 spin_unlock_irqrestore(&adev->se_cac_idx_lock, flags);
338}
339
340static u32 soc15_get_config_memsize(struct amdgpu_device *adev)
341{
342 return adev->nbio.funcs->get_memsize(adev);
343}
344
345static u32 soc15_get_xclk(struct amdgpu_device *adev)
346{
347 u32 reference_clock = adev->clock.spll.reference_freq;
348
349 if (amdgpu_ip_version(adev, MP1_HWIP, 0) == IP_VERSION(12, 0, 0) ||
350 amdgpu_ip_version(adev, MP1_HWIP, 0) == IP_VERSION(12, 0, 1) ||
351 amdgpu_ip_version(adev, MP1_HWIP, 0) == IP_VERSION(13, 0, 6) ||
352 amdgpu_ip_version(adev, MP1_HWIP, 0) == IP_VERSION(13, 0, 12) ||
353 amdgpu_ip_version(adev, MP1_HWIP, 0) == IP_VERSION(13, 0, 14))
354 return 10000;
355 if (amdgpu_ip_version(adev, MP1_HWIP, 0) == IP_VERSION(10, 0, 0) ||
356 amdgpu_ip_version(adev, MP1_HWIP, 0) == IP_VERSION(10, 0, 1))
357 return reference_clock / 4;
358
359 return reference_clock;
360}
361
362
363void soc15_grbm_select(struct amdgpu_device *adev,
364 u32 me, u32 pipe, u32 queue, u32 vmid, int xcc_id)
365{
366 u32 grbm_gfx_cntl = 0;
367 grbm_gfx_cntl = REG_SET_FIELD(grbm_gfx_cntl, GRBM_GFX_CNTL, PIPEID, pipe);
368 grbm_gfx_cntl = REG_SET_FIELD(grbm_gfx_cntl, GRBM_GFX_CNTL, MEID, me);
369 grbm_gfx_cntl = REG_SET_FIELD(grbm_gfx_cntl, GRBM_GFX_CNTL, VMID, vmid);
370 grbm_gfx_cntl = REG_SET_FIELD(grbm_gfx_cntl, GRBM_GFX_CNTL, QUEUEID, queue);
371
372 WREG32_SOC15_RLC_SHADOW(GC, xcc_id, mmGRBM_GFX_CNTL, grbm_gfx_cntl);
373}
374
375static bool soc15_read_disabled_bios(struct amdgpu_device *adev)
376{
377 /* todo */
378 return false;
379}
380
381static struct soc15_allowed_register_entry soc15_allowed_read_registers[] = {
382 { SOC15_REG_ENTRY(GC, 0, mmGRBM_STATUS)},
383 { SOC15_REG_ENTRY(GC, 0, mmGRBM_STATUS2)},
384 { SOC15_REG_ENTRY(GC, 0, mmGRBM_STATUS_SE0)},
385 { SOC15_REG_ENTRY(GC, 0, mmGRBM_STATUS_SE1)},
386 { SOC15_REG_ENTRY(GC, 0, mmGRBM_STATUS_SE2)},
387 { SOC15_REG_ENTRY(GC, 0, mmGRBM_STATUS_SE3)},
388 { SOC15_REG_ENTRY(SDMA0, 0, mmSDMA0_STATUS_REG)},
389 { SOC15_REG_ENTRY(SDMA1, 0, mmSDMA1_STATUS_REG)},
390 { SOC15_REG_ENTRY(GC, 0, mmCP_STAT)},
391 { SOC15_REG_ENTRY(GC, 0, mmCP_STALLED_STAT1)},
392 { SOC15_REG_ENTRY(GC, 0, mmCP_STALLED_STAT2)},
393 { SOC15_REG_ENTRY(GC, 0, mmCP_STALLED_STAT3)},
394 { SOC15_REG_ENTRY(GC, 0, mmCP_CPF_BUSY_STAT)},
395 { SOC15_REG_ENTRY(GC, 0, mmCP_CPF_STALLED_STAT1)},
396 { SOC15_REG_ENTRY(GC, 0, mmCP_CPF_STATUS)},
397 { SOC15_REG_ENTRY(GC, 0, mmCP_CPC_BUSY_STAT)},
398 { SOC15_REG_ENTRY(GC, 0, mmCP_CPC_STALLED_STAT1)},
399 { SOC15_REG_ENTRY(GC, 0, mmCP_CPC_STATUS)},
400 { SOC15_REG_ENTRY(GC, 0, mmGB_ADDR_CONFIG)},
401 { SOC15_REG_ENTRY(GC, 0, mmDB_DEBUG2)},
402};
403
404static uint32_t soc15_read_indexed_register(struct amdgpu_device *adev, u32 se_num,
405 u32 sh_num, u32 reg_offset)
406{
407 uint32_t val;
408
409 mutex_lock(&adev->grbm_idx_mutex);
410 if (se_num != 0xffffffff || sh_num != 0xffffffff)
411 amdgpu_gfx_select_se_sh(adev, se_num, sh_num, 0xffffffff, 0);
412
413 val = RREG32(reg_offset);
414
415 if (se_num != 0xffffffff || sh_num != 0xffffffff)
416 amdgpu_gfx_select_se_sh(adev, 0xffffffff, 0xffffffff, 0xffffffff, 0);
417 mutex_unlock(&adev->grbm_idx_mutex);
418 return val;
419}
420
421static uint32_t soc15_get_register_value(struct amdgpu_device *adev,
422 bool indexed, u32 se_num,
423 u32 sh_num, u32 reg_offset)
424{
425 if (indexed) {
426 return soc15_read_indexed_register(adev, se_num, sh_num, reg_offset);
427 } else {
428 if (reg_offset == SOC15_REG_OFFSET(GC, 0, mmGB_ADDR_CONFIG))
429 return adev->gfx.config.gb_addr_config;
430 else if (reg_offset == SOC15_REG_OFFSET(GC, 0, mmDB_DEBUG2))
431 return adev->gfx.config.db_debug2;
432 return RREG32(reg_offset);
433 }
434}
435
436static int soc15_read_register(struct amdgpu_device *adev, u32 se_num,
437 u32 sh_num, u32 reg_offset, u32 *value)
438{
439 uint32_t i;
440 struct soc15_allowed_register_entry *en;
441
442 *value = 0;
443 for (i = 0; i < ARRAY_SIZE(soc15_allowed_read_registers); i++) {
444 en = &soc15_allowed_read_registers[i];
445 if (!adev->reg_offset[en->hwip][en->inst])
446 continue;
447 else if (reg_offset != (adev->reg_offset[en->hwip][en->inst][en->seg]
448 + en->reg_offset))
449 continue;
450
451 *value = soc15_get_register_value(adev,
452 soc15_allowed_read_registers[i].grbm_indexed,
453 se_num, sh_num, reg_offset);
454 return 0;
455 }
456 return -EINVAL;
457}
458
459
460/**
461 * soc15_program_register_sequence - program an array of registers.
462 *
463 * @adev: amdgpu_device pointer
464 * @regs: pointer to the register array
465 * @array_size: size of the register array
466 *
467 * Programs an array or registers with and and or masks.
468 * This is a helper for setting golden registers.
469 */
470
471void soc15_program_register_sequence(struct amdgpu_device *adev,
472 const struct soc15_reg_golden *regs,
473 const u32 array_size)
474{
475 const struct soc15_reg_golden *entry;
476 u32 tmp, reg;
477 int i;
478
479 for (i = 0; i < array_size; ++i) {
480 entry = ®s[i];
481 reg = adev->reg_offset[entry->hwip][entry->instance][entry->segment] + entry->reg;
482
483 if (entry->and_mask == 0xffffffff) {
484 tmp = entry->or_mask;
485 } else {
486 tmp = (entry->hwip == GC_HWIP) ?
487 RREG32_SOC15_IP(GC, reg) : RREG32(reg);
488
489 tmp &= ~(entry->and_mask);
490 tmp |= (entry->or_mask & entry->and_mask);
491 }
492
493 if (reg == SOC15_REG_OFFSET(GC, 0, mmPA_SC_BINNER_EVENT_CNTL_3) ||
494 reg == SOC15_REG_OFFSET(GC, 0, mmPA_SC_ENHANCE) ||
495 reg == SOC15_REG_OFFSET(GC, 0, mmPA_SC_ENHANCE_1) ||
496 reg == SOC15_REG_OFFSET(GC, 0, mmSH_MEM_CONFIG))
497 WREG32_RLC(reg, tmp);
498 else
499 (entry->hwip == GC_HWIP) ?
500 WREG32_SOC15_IP(GC, reg, tmp) : WREG32(reg, tmp);
501
502 }
503
504}
505
506static int soc15_asic_baco_reset(struct amdgpu_device *adev)
507{
508 struct amdgpu_ras *ras = amdgpu_ras_get_context(adev);
509 int ret = 0;
510
511 /* avoid NBIF got stuck when do RAS recovery in BACO reset */
512 if (ras && adev->ras_enabled)
513 adev->nbio.funcs->enable_doorbell_interrupt(adev, false);
514
515 ret = amdgpu_dpm_baco_reset(adev);
516 if (ret)
517 return ret;
518
519 /* re-enable doorbell interrupt after BACO exit */
520 if (ras && adev->ras_enabled)
521 adev->nbio.funcs->enable_doorbell_interrupt(adev, true);
522
523 return 0;
524}
525
526static enum amd_reset_method
527soc15_asic_reset_method(struct amdgpu_device *adev)
528{
529 int baco_reset = 0;
530 bool connected_to_cpu = false;
531 struct amdgpu_ras *ras = amdgpu_ras_get_context(adev);
532
533 if (adev->gmc.xgmi.supported && adev->gmc.xgmi.connected_to_cpu)
534 connected_to_cpu = true;
535
536 if (amdgpu_reset_method == AMD_RESET_METHOD_MODE1 ||
537 amdgpu_reset_method == AMD_RESET_METHOD_MODE2 ||
538 amdgpu_reset_method == AMD_RESET_METHOD_BACO ||
539 amdgpu_reset_method == AMD_RESET_METHOD_PCI) {
540 /* If connected to cpu, driver only support mode2 */
541 if (connected_to_cpu)
542 return AMD_RESET_METHOD_MODE2;
543 return amdgpu_reset_method;
544 }
545
546 if (amdgpu_reset_method != -1)
547 dev_warn(adev->dev, "Specified reset method:%d isn't supported, using AUTO instead.\n",
548 amdgpu_reset_method);
549
550 switch (amdgpu_ip_version(adev, MP1_HWIP, 0)) {
551 case IP_VERSION(10, 0, 0):
552 case IP_VERSION(10, 0, 1):
553 case IP_VERSION(12, 0, 0):
554 case IP_VERSION(12, 0, 1):
555 return AMD_RESET_METHOD_MODE2;
556 case IP_VERSION(9, 0, 0):
557 case IP_VERSION(11, 0, 2):
558 if (adev->asic_type == CHIP_VEGA20) {
559 if (adev->psp.sos.fw_version >= 0x80067)
560 baco_reset = amdgpu_dpm_is_baco_supported(adev);
561 /*
562 * 1. PMFW version > 0x284300: all cases use baco
563 * 2. PMFW version <= 0x284300: only sGPU w/o RAS use baco
564 */
565 if (ras && adev->ras_enabled &&
566 adev->pm.fw_version <= 0x283400)
567 baco_reset = 0;
568 } else {
569 baco_reset = amdgpu_dpm_is_baco_supported(adev);
570 }
571 break;
572 case IP_VERSION(13, 0, 2):
573 /*
574 * 1.connected to cpu: driver issue mode2 reset
575 * 2.discret gpu: driver issue mode1 reset
576 */
577 if (connected_to_cpu)
578 return AMD_RESET_METHOD_MODE2;
579 break;
580 case IP_VERSION(13, 0, 6):
581 case IP_VERSION(13, 0, 14):
582 case IP_VERSION(13, 0, 12):
583 /* Use gpu_recovery param to target a reset method.
584 * Enable triggering of GPU reset only if specified
585 * by module parameter.
586 */
587 if (adev->pcie_reset_ctx.in_link_reset)
588 return AMD_RESET_METHOD_LINK;
589 if (amdgpu_gpu_recovery == 4 || amdgpu_gpu_recovery == 5)
590 return AMD_RESET_METHOD_MODE2;
591 else if (!(adev->flags & AMD_IS_APU))
592 return AMD_RESET_METHOD_MODE1;
593 else
594 return AMD_RESET_METHOD_MODE2;
595 default:
596 break;
597 }
598
599 if (baco_reset)
600 return AMD_RESET_METHOD_BACO;
601 else
602 return AMD_RESET_METHOD_MODE1;
603}
604
605static bool soc15_need_reset_on_resume(struct amdgpu_device *adev)
606{
607 /* Will reset for the following suspend abort cases.
608 * 1) S3 suspend aborted in the normal S3 suspend
609 * 2) S3 suspend aborted in performing pm core test.
610 */
611 if (adev->in_s3 && !pm_resume_via_firmware())
612 return true;
613 else
614 return false;
615}
616
617static int soc15_asic_reset(struct amdgpu_device *adev)
618{
619 /* original raven doesn't have full asic reset */
620 /* On the latest Raven, the GPU reset can be performed
621 * successfully. So now, temporarily enable it for the
622 * S3 suspend abort case.
623 */
624
625 if ((adev->apu_flags & AMD_APU_IS_PICASSO ||
626 !(adev->apu_flags & AMD_APU_IS_RAVEN)) &&
627 soc15_need_reset_on_resume(adev))
628 goto asic_reset;
629
630 if ((adev->apu_flags & AMD_APU_IS_RAVEN) ||
631 (adev->apu_flags & AMD_APU_IS_RAVEN2))
632 return 0;
633
634asic_reset:
635 switch (soc15_asic_reset_method(adev)) {
636 case AMD_RESET_METHOD_PCI:
637 dev_info(adev->dev, "PCI reset\n");
638 return amdgpu_device_pci_reset(adev);
639 case AMD_RESET_METHOD_BACO:
640 dev_info(adev->dev, "BACO reset\n");
641 return soc15_asic_baco_reset(adev);
642 case AMD_RESET_METHOD_MODE2:
643 dev_info(adev->dev, "MODE2 reset\n");
644 return amdgpu_dpm_mode2_reset(adev);
645 case AMD_RESET_METHOD_LINK:
646 dev_info(adev->dev, "Link reset\n");
647 return amdgpu_device_link_reset(adev);
648 default:
649 dev_info(adev->dev, "MODE1 reset\n");
650 return amdgpu_device_mode1_reset(adev);
651 }
652}
653
654static int soc15_supports_baco(struct amdgpu_device *adev)
655{
656 switch (amdgpu_ip_version(adev, MP1_HWIP, 0)) {
657 case IP_VERSION(9, 0, 0):
658 case IP_VERSION(11, 0, 2):
659 if (adev->asic_type == CHIP_VEGA20) {
660 if (adev->psp.sos.fw_version >= 0x80067)
661 return amdgpu_dpm_is_baco_supported(adev);
662 return 0;
663 } else {
664 return amdgpu_dpm_is_baco_supported(adev);
665 }
666 break;
667 default:
668 return 0;
669 }
670}
671
672/*static int soc15_set_uvd_clock(struct amdgpu_device *adev, u32 clock,
673 u32 cntl_reg, u32 status_reg)
674{
675 return 0;
676}*/
677
678static int soc15_set_uvd_clocks(struct amdgpu_device *adev, u32 vclk, u32 dclk)
679{
680 /*int r;
681
682 r = soc15_set_uvd_clock(adev, vclk, ixCG_VCLK_CNTL, ixCG_VCLK_STATUS);
683 if (r)
684 return r;
685
686 r = soc15_set_uvd_clock(adev, dclk, ixCG_DCLK_CNTL, ixCG_DCLK_STATUS);
687 */
688 return 0;
689}
690
691static int soc15_set_vce_clocks(struct amdgpu_device *adev, u32 evclk, u32 ecclk)
692{
693 /* todo */
694
695 return 0;
696}
697
698static void soc15_program_aspm(struct amdgpu_device *adev)
699{
700 if (!amdgpu_device_should_use_aspm(adev))
701 return;
702
703 if (adev->nbio.funcs->program_aspm)
704 adev->nbio.funcs->program_aspm(adev);
705}
706
707const struct amdgpu_ip_block_version vega10_common_ip_block =
708{
709 .type = AMD_IP_BLOCK_TYPE_COMMON,
710 .major = 2,
711 .minor = 0,
712 .rev = 0,
713 .funcs = &soc15_common_ip_funcs,
714};
715
716static void soc15_reg_base_init(struct amdgpu_device *adev)
717{
718 /* Set IP register base before any HW register access */
719 switch (adev->asic_type) {
720 case CHIP_VEGA10:
721 case CHIP_VEGA12:
722 case CHIP_RAVEN:
723 case CHIP_RENOIR:
724 vega10_reg_base_init(adev);
725 break;
726 case CHIP_VEGA20:
727 vega20_reg_base_init(adev);
728 break;
729 case CHIP_ARCTURUS:
730 arct_reg_base_init(adev);
731 break;
732 case CHIP_ALDEBARAN:
733 aldebaran_reg_base_init(adev);
734 break;
735 default:
736 DRM_ERROR("Unsupported asic type: %d!\n", adev->asic_type);
737 break;
738 }
739}
740
741void soc15_set_virt_ops(struct amdgpu_device *adev)
742{
743 adev->virt.ops = &xgpu_ai_virt_ops;
744
745 /* init soc15 reg base early enough so we can
746 * request request full access for sriov before
747 * set_ip_blocks. */
748 soc15_reg_base_init(adev);
749}
750
751static bool soc15_need_full_reset(struct amdgpu_device *adev)
752{
753 /* change this when we implement soft reset */
754 return true;
755}
756
757static void soc15_get_pcie_usage(struct amdgpu_device *adev, uint64_t *count0,
758 uint64_t *count1)
759{
760 uint32_t perfctr = 0;
761 uint64_t cnt0_of, cnt1_of;
762 int tmp;
763
764 /* This reports 0 on APUs, so return to avoid writing/reading registers
765 * that may or may not be different from their GPU counterparts
766 */
767 if (adev->flags & AMD_IS_APU)
768 return;
769
770 /* Set the 2 events that we wish to watch, defined above */
771 /* Reg 40 is # received msgs */
772 /* Reg 104 is # of posted requests sent */
773 perfctr = REG_SET_FIELD(perfctr, PCIE_PERF_CNTL_TXCLK, EVENT0_SEL, 40);
774 perfctr = REG_SET_FIELD(perfctr, PCIE_PERF_CNTL_TXCLK, EVENT1_SEL, 104);
775
776 /* Write to enable desired perf counters */
777 WREG32_PCIE(smnPCIE_PERF_CNTL_TXCLK, perfctr);
778 /* Zero out and enable the perf counters
779 * Write 0x5:
780 * Bit 0 = Start all counters(1)
781 * Bit 2 = Global counter reset enable(1)
782 */
783 WREG32_PCIE(smnPCIE_PERF_COUNT_CNTL, 0x00000005);
784
785 msleep(1000);
786
787 /* Load the shadow and disable the perf counters
788 * Write 0x2:
789 * Bit 0 = Stop counters(0)
790 * Bit 1 = Load the shadow counters(1)
791 */
792 WREG32_PCIE(smnPCIE_PERF_COUNT_CNTL, 0x00000002);
793
794 /* Read register values to get any >32bit overflow */
795 tmp = RREG32_PCIE(smnPCIE_PERF_CNTL_TXCLK);
796 cnt0_of = REG_GET_FIELD(tmp, PCIE_PERF_CNTL_TXCLK, COUNTER0_UPPER);
797 cnt1_of = REG_GET_FIELD(tmp, PCIE_PERF_CNTL_TXCLK, COUNTER1_UPPER);
798
799 /* Get the values and add the overflow */
800 *count0 = RREG32_PCIE(smnPCIE_PERF_COUNT0_TXCLK) | (cnt0_of << 32);
801 *count1 = RREG32_PCIE(smnPCIE_PERF_COUNT1_TXCLK) | (cnt1_of << 32);
802}
803
804static void vega20_get_pcie_usage(struct amdgpu_device *adev, uint64_t *count0,
805 uint64_t *count1)
806{
807 uint32_t perfctr = 0;
808 uint64_t cnt0_of, cnt1_of;
809 int tmp;
810
811 /* This reports 0 on APUs, so return to avoid writing/reading registers
812 * that may or may not be different from their GPU counterparts
813 */
814 if (adev->flags & AMD_IS_APU)
815 return;
816
817 /* Set the 2 events that we wish to watch, defined above */
818 /* Reg 40 is # received msgs */
819 /* Reg 108 is # of posted requests sent on VG20 */
820 perfctr = REG_SET_FIELD(perfctr, PCIE_PERF_CNTL_TXCLK3,
821 EVENT0_SEL, 40);
822 perfctr = REG_SET_FIELD(perfctr, PCIE_PERF_CNTL_TXCLK3,
823 EVENT1_SEL, 108);
824
825 /* Write to enable desired perf counters */
826 WREG32_PCIE(smnPCIE_PERF_CNTL_TXCLK3, perfctr);
827 /* Zero out and enable the perf counters
828 * Write 0x5:
829 * Bit 0 = Start all counters(1)
830 * Bit 2 = Global counter reset enable(1)
831 */
832 WREG32_PCIE(smnPCIE_PERF_COUNT_CNTL, 0x00000005);
833
834 msleep(1000);
835
836 /* Load the shadow and disable the perf counters
837 * Write 0x2:
838 * Bit 0 = Stop counters(0)
839 * Bit 1 = Load the shadow counters(1)
840 */
841 WREG32_PCIE(smnPCIE_PERF_COUNT_CNTL, 0x00000002);
842
843 /* Read register values to get any >32bit overflow */
844 tmp = RREG32_PCIE(smnPCIE_PERF_CNTL_TXCLK3);
845 cnt0_of = REG_GET_FIELD(tmp, PCIE_PERF_CNTL_TXCLK3, COUNTER0_UPPER);
846 cnt1_of = REG_GET_FIELD(tmp, PCIE_PERF_CNTL_TXCLK3, COUNTER1_UPPER);
847
848 /* Get the values and add the overflow */
849 *count0 = RREG32_PCIE(smnPCIE_PERF_COUNT0_TXCLK3) | (cnt0_of << 32);
850 *count1 = RREG32_PCIE(smnPCIE_PERF_COUNT1_TXCLK3) | (cnt1_of << 32);
851}
852
853static bool soc15_need_reset_on_init(struct amdgpu_device *adev)
854{
855 u32 sol_reg;
856
857 /* CP hangs in IGT reloading test on RN, reset to WA */
858 if (adev->asic_type == CHIP_RENOIR)
859 return true;
860
861 if (amdgpu_gmc_need_reset_on_init(adev))
862 return true;
863 if (amdgpu_psp_tos_reload_needed(adev))
864 return true;
865 /* Just return false for soc15 GPUs. Reset does not seem to
866 * be necessary.
867 */
868 if (!amdgpu_passthrough(adev))
869 return false;
870
871 if (adev->flags & AMD_IS_APU)
872 return false;
873
874 /* Check sOS sign of life register to confirm sys driver and sOS
875 * are already been loaded.
876 */
877 sol_reg = RREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_81);
878 if (sol_reg)
879 return true;
880
881 return false;
882}
883
884static uint64_t soc15_get_pcie_replay_count(struct amdgpu_device *adev)
885{
886 uint64_t nak_r, nak_g;
887
888 /* Get the number of NAKs received and generated */
889 nak_r = RREG32_PCIE(smnPCIE_RX_NUM_NAK);
890 nak_g = RREG32_PCIE(smnPCIE_RX_NUM_NAK_GENERATED);
891
892 /* Add the total number of NAKs, i.e the number of replays */
893 return (nak_r + nak_g);
894}
895
896static void soc15_pre_asic_init(struct amdgpu_device *adev)
897{
898 gmc_v9_0_restore_registers(adev);
899}
900
901static const struct amdgpu_asic_funcs soc15_asic_funcs =
902{
903 .read_disabled_bios = &soc15_read_disabled_bios,
904 .read_bios_from_rom = &amdgpu_soc15_read_bios_from_rom,
905 .read_register = &soc15_read_register,
906 .reset = &soc15_asic_reset,
907 .reset_method = &soc15_asic_reset_method,
908 .get_xclk = &soc15_get_xclk,
909 .set_uvd_clocks = &soc15_set_uvd_clocks,
910 .set_vce_clocks = &soc15_set_vce_clocks,
911 .get_config_memsize = &soc15_get_config_memsize,
912 .need_full_reset = &soc15_need_full_reset,
913 .init_doorbell_index = &vega10_doorbell_index_init,
914 .get_pcie_usage = &soc15_get_pcie_usage,
915 .need_reset_on_init = &soc15_need_reset_on_init,
916 .get_pcie_replay_count = &soc15_get_pcie_replay_count,
917 .supports_baco = &soc15_supports_baco,
918 .pre_asic_init = &soc15_pre_asic_init,
919 .query_video_codecs = &soc15_query_video_codecs,
920};
921
922static const struct amdgpu_asic_funcs vega20_asic_funcs =
923{
924 .read_disabled_bios = &soc15_read_disabled_bios,
925 .read_bios_from_rom = &amdgpu_soc15_read_bios_from_rom,
926 .read_register = &soc15_read_register,
927 .reset = &soc15_asic_reset,
928 .reset_method = &soc15_asic_reset_method,
929 .get_xclk = &soc15_get_xclk,
930 .set_uvd_clocks = &soc15_set_uvd_clocks,
931 .set_vce_clocks = &soc15_set_vce_clocks,
932 .get_config_memsize = &soc15_get_config_memsize,
933 .need_full_reset = &soc15_need_full_reset,
934 .init_doorbell_index = &vega20_doorbell_index_init,
935 .get_pcie_usage = &vega20_get_pcie_usage,
936 .need_reset_on_init = &soc15_need_reset_on_init,
937 .get_pcie_replay_count = &soc15_get_pcie_replay_count,
938 .supports_baco = &soc15_supports_baco,
939 .pre_asic_init = &soc15_pre_asic_init,
940 .query_video_codecs = &soc15_query_video_codecs,
941};
942
943static const struct amdgpu_asic_funcs aqua_vanjaram_asic_funcs =
944{
945 .read_disabled_bios = &soc15_read_disabled_bios,
946 .read_bios_from_rom = &amdgpu_soc15_read_bios_from_rom,
947 .read_register = &soc15_read_register,
948 .reset = &soc15_asic_reset,
949 .reset_method = &soc15_asic_reset_method,
950 .get_xclk = &soc15_get_xclk,
951 .set_uvd_clocks = &soc15_set_uvd_clocks,
952 .set_vce_clocks = &soc15_set_vce_clocks,
953 .get_config_memsize = &soc15_get_config_memsize,
954 .need_full_reset = &soc15_need_full_reset,
955 .init_doorbell_index = &aqua_vanjaram_doorbell_index_init,
956 .need_reset_on_init = &soc15_need_reset_on_init,
957 .get_pcie_replay_count = &amdgpu_nbio_get_pcie_replay_count,
958 .supports_baco = &soc15_supports_baco,
959 .pre_asic_init = &soc15_pre_asic_init,
960 .query_video_codecs = &soc15_query_video_codecs,
961 .encode_ext_smn_addressing = &aqua_vanjaram_encode_ext_smn_addressing,
962 .get_reg_state = &aqua_vanjaram_get_reg_state,
963};
964
965static int soc15_common_early_init(struct amdgpu_ip_block *ip_block)
966{
967 struct amdgpu_device *adev = ip_block->adev;
968
969 adev->nbio.funcs->set_reg_remap(adev);
970 adev->smc_rreg = NULL;
971 adev->smc_wreg = NULL;
972 adev->pcie_rreg = &amdgpu_device_indirect_rreg;
973 adev->pcie_wreg = &amdgpu_device_indirect_wreg;
974 adev->pcie_rreg_ext = &amdgpu_device_indirect_rreg_ext;
975 adev->pcie_wreg_ext = &amdgpu_device_indirect_wreg_ext;
976 adev->pcie_rreg64 = &amdgpu_device_indirect_rreg64;
977 adev->pcie_wreg64 = &amdgpu_device_indirect_wreg64;
978 adev->pcie_rreg64_ext = &amdgpu_device_indirect_rreg64_ext;
979 adev->pcie_wreg64_ext = &amdgpu_device_indirect_wreg64_ext;
980 adev->uvd_ctx_rreg = &soc15_uvd_ctx_rreg;
981 adev->uvd_ctx_wreg = &soc15_uvd_ctx_wreg;
982 adev->didt_rreg = &soc15_didt_rreg;
983 adev->didt_wreg = &soc15_didt_wreg;
984 adev->gc_cac_rreg = &soc15_gc_cac_rreg;
985 adev->gc_cac_wreg = &soc15_gc_cac_wreg;
986 adev->se_cac_rreg = &soc15_se_cac_rreg;
987 adev->se_cac_wreg = &soc15_se_cac_wreg;
988
989 adev->rev_id = amdgpu_device_get_rev_id(adev);
990 adev->external_rev_id = 0xFF;
991 /* TODO: split the GC and PG flags based on the relevant IP version for which
992 * they are relevant.
993 */
994 switch (amdgpu_ip_version(adev, GC_HWIP, 0)) {
995 case IP_VERSION(9, 0, 1):
996 adev->asic_funcs = &soc15_asic_funcs;
997 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG |
998 AMD_CG_SUPPORT_GFX_MGLS |
999 AMD_CG_SUPPORT_GFX_RLC_LS |
1000 AMD_CG_SUPPORT_GFX_CP_LS |
1001 AMD_CG_SUPPORT_GFX_3D_CGCG |
1002 AMD_CG_SUPPORT_GFX_3D_CGLS |
1003 AMD_CG_SUPPORT_GFX_CGCG |
1004 AMD_CG_SUPPORT_GFX_CGLS |
1005 AMD_CG_SUPPORT_BIF_MGCG |
1006 AMD_CG_SUPPORT_BIF_LS |
1007 AMD_CG_SUPPORT_HDP_LS |
1008 AMD_CG_SUPPORT_DRM_MGCG |
1009 AMD_CG_SUPPORT_DRM_LS |
1010 AMD_CG_SUPPORT_ROM_MGCG |
1011 AMD_CG_SUPPORT_DF_MGCG |
1012 AMD_CG_SUPPORT_SDMA_MGCG |
1013 AMD_CG_SUPPORT_SDMA_LS |
1014 AMD_CG_SUPPORT_MC_MGCG |
1015 AMD_CG_SUPPORT_MC_LS;
1016 adev->pg_flags = 0;
1017 adev->external_rev_id = 0x1;
1018 break;
1019 case IP_VERSION(9, 2, 1):
1020 adev->asic_funcs = &soc15_asic_funcs;
1021 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG |
1022 AMD_CG_SUPPORT_GFX_MGLS |
1023 AMD_CG_SUPPORT_GFX_CGCG |
1024 AMD_CG_SUPPORT_GFX_CGLS |
1025 AMD_CG_SUPPORT_GFX_3D_CGCG |
1026 AMD_CG_SUPPORT_GFX_3D_CGLS |
1027 AMD_CG_SUPPORT_GFX_CP_LS |
1028 AMD_CG_SUPPORT_MC_LS |
1029 AMD_CG_SUPPORT_MC_MGCG |
1030 AMD_CG_SUPPORT_SDMA_MGCG |
1031 AMD_CG_SUPPORT_SDMA_LS |
1032 AMD_CG_SUPPORT_BIF_MGCG |
1033 AMD_CG_SUPPORT_BIF_LS |
1034 AMD_CG_SUPPORT_HDP_MGCG |
1035 AMD_CG_SUPPORT_HDP_LS |
1036 AMD_CG_SUPPORT_ROM_MGCG |
1037 AMD_CG_SUPPORT_VCE_MGCG |
1038 AMD_CG_SUPPORT_UVD_MGCG;
1039 adev->pg_flags = 0;
1040 adev->external_rev_id = adev->rev_id + 0x14;
1041 break;
1042 case IP_VERSION(9, 4, 0):
1043 adev->asic_funcs = &vega20_asic_funcs;
1044 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG |
1045 AMD_CG_SUPPORT_GFX_MGLS |
1046 AMD_CG_SUPPORT_GFX_CGCG |
1047 AMD_CG_SUPPORT_GFX_CGLS |
1048 AMD_CG_SUPPORT_GFX_3D_CGCG |
1049 AMD_CG_SUPPORT_GFX_3D_CGLS |
1050 AMD_CG_SUPPORT_GFX_CP_LS |
1051 AMD_CG_SUPPORT_MC_LS |
1052 AMD_CG_SUPPORT_MC_MGCG |
1053 AMD_CG_SUPPORT_SDMA_MGCG |
1054 AMD_CG_SUPPORT_SDMA_LS |
1055 AMD_CG_SUPPORT_BIF_MGCG |
1056 AMD_CG_SUPPORT_BIF_LS |
1057 AMD_CG_SUPPORT_HDP_MGCG |
1058 AMD_CG_SUPPORT_HDP_LS |
1059 AMD_CG_SUPPORT_ROM_MGCG |
1060 AMD_CG_SUPPORT_VCE_MGCG |
1061 AMD_CG_SUPPORT_UVD_MGCG;
1062 adev->pg_flags = 0;
1063 adev->external_rev_id = adev->rev_id + 0x28;
1064 break;
1065 case IP_VERSION(9, 1, 0):
1066 case IP_VERSION(9, 2, 2):
1067 adev->asic_funcs = &soc15_asic_funcs;
1068
1069 if (adev->rev_id >= 0x8)
1070 adev->apu_flags |= AMD_APU_IS_RAVEN2;
1071
1072 if (adev->apu_flags & AMD_APU_IS_RAVEN2)
1073 adev->external_rev_id = adev->rev_id + 0x79;
1074 else if (adev->apu_flags & AMD_APU_IS_PICASSO)
1075 adev->external_rev_id = adev->rev_id + 0x41;
1076 else if (adev->rev_id == 1)
1077 adev->external_rev_id = adev->rev_id + 0x20;
1078 else
1079 adev->external_rev_id = adev->rev_id + 0x01;
1080
1081 if (adev->apu_flags & AMD_APU_IS_RAVEN2) {
1082 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG |
1083 AMD_CG_SUPPORT_GFX_MGLS |
1084 AMD_CG_SUPPORT_GFX_CP_LS |
1085 AMD_CG_SUPPORT_GFX_3D_CGCG |
1086 AMD_CG_SUPPORT_GFX_3D_CGLS |
1087 AMD_CG_SUPPORT_GFX_CGCG |
1088 AMD_CG_SUPPORT_GFX_CGLS |
1089 AMD_CG_SUPPORT_BIF_LS |
1090 AMD_CG_SUPPORT_HDP_LS |
1091 AMD_CG_SUPPORT_MC_MGCG |
1092 AMD_CG_SUPPORT_MC_LS |
1093 AMD_CG_SUPPORT_SDMA_MGCG |
1094 AMD_CG_SUPPORT_SDMA_LS |
1095 AMD_CG_SUPPORT_VCN_MGCG;
1096
1097 adev->pg_flags = AMD_PG_SUPPORT_SDMA | AMD_PG_SUPPORT_VCN;
1098 } else if (adev->apu_flags & AMD_APU_IS_PICASSO) {
1099 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG |
1100 AMD_CG_SUPPORT_GFX_MGLS |
1101 AMD_CG_SUPPORT_GFX_CP_LS |
1102 AMD_CG_SUPPORT_GFX_3D_CGLS |
1103 AMD_CG_SUPPORT_GFX_CGCG |
1104 AMD_CG_SUPPORT_GFX_CGLS |
1105 AMD_CG_SUPPORT_BIF_LS |
1106 AMD_CG_SUPPORT_HDP_LS |
1107 AMD_CG_SUPPORT_MC_MGCG |
1108 AMD_CG_SUPPORT_MC_LS |
1109 AMD_CG_SUPPORT_SDMA_MGCG |
1110 AMD_CG_SUPPORT_SDMA_LS |
1111 AMD_CG_SUPPORT_VCN_MGCG;
1112
1113 /*
1114 * MMHUB PG needs to be disabled for Picasso for
1115 * stability reasons.
1116 */
1117 adev->pg_flags = AMD_PG_SUPPORT_SDMA |
1118 AMD_PG_SUPPORT_VCN;
1119 } else {
1120 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG |
1121 AMD_CG_SUPPORT_GFX_MGLS |
1122 AMD_CG_SUPPORT_GFX_RLC_LS |
1123 AMD_CG_SUPPORT_GFX_CP_LS |
1124 AMD_CG_SUPPORT_GFX_3D_CGLS |
1125 AMD_CG_SUPPORT_GFX_CGCG |
1126 AMD_CG_SUPPORT_GFX_CGLS |
1127 AMD_CG_SUPPORT_BIF_MGCG |
1128 AMD_CG_SUPPORT_BIF_LS |
1129 AMD_CG_SUPPORT_HDP_MGCG |
1130 AMD_CG_SUPPORT_HDP_LS |
1131 AMD_CG_SUPPORT_DRM_MGCG |
1132 AMD_CG_SUPPORT_DRM_LS |
1133 AMD_CG_SUPPORT_MC_MGCG |
1134 AMD_CG_SUPPORT_MC_LS |
1135 AMD_CG_SUPPORT_SDMA_MGCG |
1136 AMD_CG_SUPPORT_SDMA_LS |
1137 AMD_CG_SUPPORT_VCN_MGCG;
1138
1139 adev->pg_flags = AMD_PG_SUPPORT_SDMA | AMD_PG_SUPPORT_VCN;
1140 }
1141 break;
1142 case IP_VERSION(9, 4, 1):
1143 adev->asic_funcs = &vega20_asic_funcs;
1144 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG |
1145 AMD_CG_SUPPORT_GFX_MGLS |
1146 AMD_CG_SUPPORT_GFX_CGCG |
1147 AMD_CG_SUPPORT_GFX_CGLS |
1148 AMD_CG_SUPPORT_GFX_CP_LS |
1149 AMD_CG_SUPPORT_HDP_MGCG |
1150 AMD_CG_SUPPORT_HDP_LS |
1151 AMD_CG_SUPPORT_SDMA_MGCG |
1152 AMD_CG_SUPPORT_SDMA_LS |
1153 AMD_CG_SUPPORT_MC_MGCG |
1154 AMD_CG_SUPPORT_MC_LS |
1155 AMD_CG_SUPPORT_IH_CG |
1156 AMD_CG_SUPPORT_VCN_MGCG |
1157 AMD_CG_SUPPORT_JPEG_MGCG;
1158 adev->pg_flags = AMD_PG_SUPPORT_VCN | AMD_PG_SUPPORT_VCN_DPG;
1159 adev->external_rev_id = adev->rev_id + 0x32;
1160 break;
1161 case IP_VERSION(9, 3, 0):
1162 adev->asic_funcs = &soc15_asic_funcs;
1163
1164 if (adev->apu_flags & AMD_APU_IS_RENOIR)
1165 adev->external_rev_id = adev->rev_id + 0x91;
1166 else
1167 adev->external_rev_id = adev->rev_id + 0xa1;
1168 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG |
1169 AMD_CG_SUPPORT_GFX_MGLS |
1170 AMD_CG_SUPPORT_GFX_3D_CGCG |
1171 AMD_CG_SUPPORT_GFX_3D_CGLS |
1172 AMD_CG_SUPPORT_GFX_CGCG |
1173 AMD_CG_SUPPORT_GFX_CGLS |
1174 AMD_CG_SUPPORT_GFX_CP_LS |
1175 AMD_CG_SUPPORT_MC_MGCG |
1176 AMD_CG_SUPPORT_MC_LS |
1177 AMD_CG_SUPPORT_SDMA_MGCG |
1178 AMD_CG_SUPPORT_SDMA_LS |
1179 AMD_CG_SUPPORT_BIF_LS |
1180 AMD_CG_SUPPORT_HDP_LS |
1181 AMD_CG_SUPPORT_VCN_MGCG |
1182 AMD_CG_SUPPORT_JPEG_MGCG |
1183 AMD_CG_SUPPORT_IH_CG |
1184 AMD_CG_SUPPORT_ATHUB_LS |
1185 AMD_CG_SUPPORT_ATHUB_MGCG |
1186 AMD_CG_SUPPORT_DF_MGCG;
1187 adev->pg_flags = AMD_PG_SUPPORT_SDMA |
1188 AMD_PG_SUPPORT_VCN |
1189 AMD_PG_SUPPORT_JPEG |
1190 AMD_PG_SUPPORT_VCN_DPG;
1191 break;
1192 case IP_VERSION(9, 4, 2):
1193 adev->asic_funcs = &vega20_asic_funcs;
1194 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG |
1195 AMD_CG_SUPPORT_GFX_MGLS |
1196 AMD_CG_SUPPORT_GFX_CP_LS |
1197 AMD_CG_SUPPORT_HDP_LS |
1198 AMD_CG_SUPPORT_SDMA_MGCG |
1199 AMD_CG_SUPPORT_SDMA_LS |
1200 AMD_CG_SUPPORT_IH_CG |
1201 AMD_CG_SUPPORT_VCN_MGCG | AMD_CG_SUPPORT_JPEG_MGCG;
1202 adev->pg_flags = AMD_PG_SUPPORT_VCN_DPG;
1203 adev->external_rev_id = adev->rev_id + 0x3c;
1204 break;
1205 case IP_VERSION(9, 4, 3):
1206 case IP_VERSION(9, 4, 4):
1207 case IP_VERSION(9, 5, 0):
1208 adev->asic_funcs = &aqua_vanjaram_asic_funcs;
1209 adev->cg_flags =
1210 AMD_CG_SUPPORT_GFX_MGCG | AMD_CG_SUPPORT_GFX_CGCG |
1211 AMD_CG_SUPPORT_GFX_CGLS | AMD_CG_SUPPORT_SDMA_MGCG |
1212 AMD_CG_SUPPORT_GFX_FGCG | AMD_CG_SUPPORT_REPEATER_FGCG |
1213 AMD_CG_SUPPORT_VCN_MGCG | AMD_CG_SUPPORT_JPEG_MGCG |
1214 AMD_CG_SUPPORT_IH_CG;
1215 adev->pg_flags =
1216 AMD_PG_SUPPORT_VCN |
1217 AMD_PG_SUPPORT_VCN_DPG |
1218 AMD_PG_SUPPORT_JPEG;
1219 /*TODO: need a new external_rev_id for GC 9.4.4? */
1220 adev->external_rev_id = adev->rev_id + 0x46;
1221 if (amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 5, 0))
1222 adev->external_rev_id = adev->rev_id + 0x50;
1223 break;
1224 default:
1225 /* FIXME: not supported yet */
1226 return -EINVAL;
1227 }
1228
1229 if (amdgpu_sriov_vf(adev)) {
1230 amdgpu_virt_init_setting(adev);
1231 xgpu_ai_mailbox_set_irq_funcs(adev);
1232 }
1233
1234 return 0;
1235}
1236
1237static int soc15_common_late_init(struct amdgpu_ip_block *ip_block)
1238{
1239 struct amdgpu_device *adev = ip_block->adev;
1240
1241 if (amdgpu_sriov_vf(adev))
1242 xgpu_ai_mailbox_get_irq(adev);
1243
1244 /* Enable selfring doorbell aperture late because doorbell BAR
1245 * aperture will change if resize BAR successfully in gmc sw_init.
1246 */
1247 adev->nbio.funcs->enable_doorbell_selfring_aperture(adev, true);
1248
1249 return 0;
1250}
1251
1252static int soc15_common_sw_init(struct amdgpu_ip_block *ip_block)
1253{
1254 struct amdgpu_device *adev = ip_block->adev;
1255
1256 if (amdgpu_sriov_vf(adev))
1257 xgpu_ai_mailbox_add_irq_id(adev);
1258
1259 if (adev->df.funcs &&
1260 adev->df.funcs->sw_init)
1261 adev->df.funcs->sw_init(adev);
1262
1263 return 0;
1264}
1265
1266static int soc15_common_sw_fini(struct amdgpu_ip_block *ip_block)
1267{
1268 struct amdgpu_device *adev = ip_block->adev;
1269
1270 if (adev->df.funcs &&
1271 adev->df.funcs->sw_fini)
1272 adev->df.funcs->sw_fini(adev);
1273 return 0;
1274}
1275
1276static void soc15_sdma_doorbell_range_init(struct amdgpu_device *adev)
1277{
1278 int i;
1279
1280 /* sdma doorbell range is programed by hypervisor */
1281 if (!amdgpu_sriov_vf(adev)) {
1282 for (i = 0; i < adev->sdma.num_instances; i++) {
1283 adev->nbio.funcs->sdma_doorbell_range(adev, i,
1284 true, adev->doorbell_index.sdma_engine[i] << 1,
1285 adev->doorbell_index.sdma_doorbell_range);
1286 }
1287 }
1288}
1289
1290static int soc15_common_hw_init(struct amdgpu_ip_block *ip_block)
1291{
1292 struct amdgpu_device *adev = ip_block->adev;
1293
1294 /* enable aspm */
1295 soc15_program_aspm(adev);
1296 /* setup nbio registers */
1297 adev->nbio.funcs->init_registers(adev);
1298 /* remap HDP registers to a hole in mmio space,
1299 * for the purpose of expose those registers
1300 * to process space
1301 */
1302 if (adev->nbio.funcs->remap_hdp_registers && !amdgpu_sriov_vf(adev))
1303 adev->nbio.funcs->remap_hdp_registers(adev);
1304
1305 /* enable the doorbell aperture */
1306 adev->nbio.funcs->enable_doorbell_aperture(adev, true);
1307
1308 /* HW doorbell routing policy: doorbell writing not
1309 * in SDMA/IH/MM/ACV range will be routed to CP. So
1310 * we need to init SDMA doorbell range prior
1311 * to CP ip block init and ring test. IH already
1312 * happens before CP.
1313 */
1314 soc15_sdma_doorbell_range_init(adev);
1315
1316 return 0;
1317}
1318
1319static int soc15_common_hw_fini(struct amdgpu_ip_block *ip_block)
1320{
1321 struct amdgpu_device *adev = ip_block->adev;
1322
1323 /* Disable the doorbell aperture and selfring doorbell aperture
1324 * separately in hw_fini because soc15_enable_doorbell_aperture
1325 * has been removed and there is no need to delay disabling
1326 * selfring doorbell.
1327 */
1328 adev->nbio.funcs->enable_doorbell_aperture(adev, false);
1329 adev->nbio.funcs->enable_doorbell_selfring_aperture(adev, false);
1330
1331 if (amdgpu_sriov_vf(adev))
1332 xgpu_ai_mailbox_put_irq(adev);
1333
1334 /*
1335 * For minimal init, late_init is not called, hence RAS irqs are not
1336 * enabled.
1337 */
1338 if ((!amdgpu_sriov_vf(adev)) &&
1339 (adev->init_lvl->level != AMDGPU_INIT_LEVEL_MINIMAL_XGMI) &&
1340 adev->nbio.ras_if &&
1341 amdgpu_ras_is_supported(adev, adev->nbio.ras_if->block)) {
1342 if (adev->nbio.ras &&
1343 adev->nbio.ras->init_ras_controller_interrupt)
1344 amdgpu_irq_put(adev, &adev->nbio.ras_controller_irq, 0);
1345 if (adev->nbio.ras &&
1346 adev->nbio.ras->init_ras_err_event_athub_interrupt)
1347 amdgpu_irq_put(adev, &adev->nbio.ras_err_event_athub_irq, 0);
1348 }
1349
1350 return 0;
1351}
1352
1353static int soc15_common_suspend(struct amdgpu_ip_block *ip_block)
1354{
1355 return soc15_common_hw_fini(ip_block);
1356}
1357
1358static int soc15_common_resume(struct amdgpu_ip_block *ip_block)
1359{
1360 struct amdgpu_device *adev = ip_block->adev;
1361
1362 if (soc15_need_reset_on_resume(adev)) {
1363 dev_info(adev->dev, "S3 suspend abort case, let's reset ASIC.\n");
1364 soc15_asic_reset(adev);
1365 }
1366 return soc15_common_hw_init(ip_block);
1367}
1368
1369static bool soc15_common_is_idle(struct amdgpu_ip_block *ip_block)
1370{
1371 return true;
1372}
1373
1374static void soc15_update_drm_clock_gating(struct amdgpu_device *adev, bool enable)
1375{
1376 uint32_t def, data;
1377
1378 def = data = RREG32(SOC15_REG_OFFSET(MP0, 0, mmMP0_MISC_CGTT_CTRL0));
1379
1380 if (enable && (adev->cg_flags & AMD_CG_SUPPORT_DRM_MGCG))
1381 data &= ~(0x01000000 |
1382 0x02000000 |
1383 0x04000000 |
1384 0x08000000 |
1385 0x10000000 |
1386 0x20000000 |
1387 0x40000000 |
1388 0x80000000);
1389 else
1390 data |= (0x01000000 |
1391 0x02000000 |
1392 0x04000000 |
1393 0x08000000 |
1394 0x10000000 |
1395 0x20000000 |
1396 0x40000000 |
1397 0x80000000);
1398
1399 if (def != data)
1400 WREG32(SOC15_REG_OFFSET(MP0, 0, mmMP0_MISC_CGTT_CTRL0), data);
1401}
1402
1403static void soc15_update_drm_light_sleep(struct amdgpu_device *adev, bool enable)
1404{
1405 uint32_t def, data;
1406
1407 def = data = RREG32(SOC15_REG_OFFSET(MP0, 0, mmMP0_MISC_LIGHT_SLEEP_CTRL));
1408
1409 if (enable && (adev->cg_flags & AMD_CG_SUPPORT_DRM_LS))
1410 data |= 1;
1411 else
1412 data &= ~1;
1413
1414 if (def != data)
1415 WREG32(SOC15_REG_OFFSET(MP0, 0, mmMP0_MISC_LIGHT_SLEEP_CTRL), data);
1416}
1417
1418static int soc15_common_set_clockgating_state(struct amdgpu_ip_block *ip_block,
1419 enum amd_clockgating_state state)
1420{
1421 struct amdgpu_device *adev = ip_block->adev;
1422
1423 if (amdgpu_sriov_vf(adev))
1424 return 0;
1425
1426 switch (amdgpu_ip_version(adev, NBIO_HWIP, 0)) {
1427 case IP_VERSION(6, 1, 0):
1428 case IP_VERSION(6, 2, 0):
1429 case IP_VERSION(7, 4, 0):
1430 adev->nbio.funcs->update_medium_grain_clock_gating(adev,
1431 state == AMD_CG_STATE_GATE);
1432 adev->nbio.funcs->update_medium_grain_light_sleep(adev,
1433 state == AMD_CG_STATE_GATE);
1434 adev->hdp.funcs->update_clock_gating(adev,
1435 state == AMD_CG_STATE_GATE);
1436 soc15_update_drm_clock_gating(adev,
1437 state == AMD_CG_STATE_GATE);
1438 soc15_update_drm_light_sleep(adev,
1439 state == AMD_CG_STATE_GATE);
1440 adev->smuio.funcs->update_rom_clock_gating(adev,
1441 state == AMD_CG_STATE_GATE);
1442 adev->df.funcs->update_medium_grain_clock_gating(adev,
1443 state == AMD_CG_STATE_GATE);
1444 break;
1445 case IP_VERSION(7, 0, 0):
1446 case IP_VERSION(7, 0, 1):
1447 case IP_VERSION(2, 5, 0):
1448 adev->nbio.funcs->update_medium_grain_clock_gating(adev,
1449 state == AMD_CG_STATE_GATE);
1450 adev->nbio.funcs->update_medium_grain_light_sleep(adev,
1451 state == AMD_CG_STATE_GATE);
1452 adev->hdp.funcs->update_clock_gating(adev,
1453 state == AMD_CG_STATE_GATE);
1454 soc15_update_drm_clock_gating(adev,
1455 state == AMD_CG_STATE_GATE);
1456 soc15_update_drm_light_sleep(adev,
1457 state == AMD_CG_STATE_GATE);
1458 break;
1459 case IP_VERSION(7, 4, 1):
1460 case IP_VERSION(7, 4, 4):
1461 adev->hdp.funcs->update_clock_gating(adev,
1462 state == AMD_CG_STATE_GATE);
1463 break;
1464 default:
1465 break;
1466 }
1467 return 0;
1468}
1469
1470static void soc15_common_get_clockgating_state(struct amdgpu_ip_block *ip_block, u64 *flags)
1471{
1472 struct amdgpu_device *adev = ip_block->adev;
1473 int data;
1474
1475 if (amdgpu_sriov_vf(adev))
1476 *flags = 0;
1477
1478 if (adev->nbio.funcs && adev->nbio.funcs->get_clockgating_state)
1479 adev->nbio.funcs->get_clockgating_state(adev, flags);
1480
1481 if (adev->hdp.funcs && adev->hdp.funcs->get_clock_gating_state)
1482 adev->hdp.funcs->get_clock_gating_state(adev, flags);
1483
1484 if ((amdgpu_ip_version(adev, MP0_HWIP, 0) != IP_VERSION(13, 0, 2)) &&
1485 (amdgpu_ip_version(adev, MP0_HWIP, 0) != IP_VERSION(13, 0, 6)) &&
1486 (amdgpu_ip_version(adev, MP0_HWIP, 0) != IP_VERSION(13, 0, 12)) &&
1487 (amdgpu_ip_version(adev, MP0_HWIP, 0) != IP_VERSION(13, 0, 14))) {
1488 /* AMD_CG_SUPPORT_DRM_MGCG */
1489 data = RREG32(SOC15_REG_OFFSET(MP0, 0, mmMP0_MISC_CGTT_CTRL0));
1490 if (!(data & 0x01000000))
1491 *flags |= AMD_CG_SUPPORT_DRM_MGCG;
1492
1493 /* AMD_CG_SUPPORT_DRM_LS */
1494 data = RREG32(SOC15_REG_OFFSET(MP0, 0, mmMP0_MISC_LIGHT_SLEEP_CTRL));
1495 if (data & 0x1)
1496 *flags |= AMD_CG_SUPPORT_DRM_LS;
1497 }
1498
1499 /* AMD_CG_SUPPORT_ROM_MGCG */
1500 if (adev->smuio.funcs && adev->smuio.funcs->get_clock_gating_state)
1501 adev->smuio.funcs->get_clock_gating_state(adev, flags);
1502
1503 if (adev->df.funcs && adev->df.funcs->get_clockgating_state)
1504 adev->df.funcs->get_clockgating_state(adev, flags);
1505}
1506
1507static int soc15_common_set_powergating_state(struct amdgpu_ip_block *ip_block,
1508 enum amd_powergating_state state)
1509{
1510 /* todo */
1511 return 0;
1512}
1513
1514static const struct amd_ip_funcs soc15_common_ip_funcs = {
1515 .name = "soc15_common",
1516 .early_init = soc15_common_early_init,
1517 .late_init = soc15_common_late_init,
1518 .sw_init = soc15_common_sw_init,
1519 .sw_fini = soc15_common_sw_fini,
1520 .hw_init = soc15_common_hw_init,
1521 .hw_fini = soc15_common_hw_fini,
1522 .suspend = soc15_common_suspend,
1523 .resume = soc15_common_resume,
1524 .is_idle = soc15_common_is_idle,
1525 .set_clockgating_state = soc15_common_set_clockgating_state,
1526 .set_powergating_state = soc15_common_set_powergating_state,
1527 .get_clockgating_state= soc15_common_get_clockgating_state,
1528};