drivers/gpu/drm/amd/amdgpu/amdgpu_debugfs.c at v5.16-rc2 · tjh.dev/kernel

tjh.dev / kernel
Linux kernel mirror (for testing) git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
kernel os linux
kernel / drivers / gpu / drm / amd / amdgpu / amdgpu_debugfs.c
at v5.16-rc2 1698 lines 43 kB view raw
   1/*
   2 * Copyright 2008 Advanced Micro Devices, Inc.
   3 * Copyright 2008 Red Hat Inc.
   4 * Copyright 2009 Jerome Glisse.
   5 *
   6 * Permission is hereby granted, free of charge, to any person obtaining a
   7 * copy of this software and associated documentation files (the "Software"),
   8 * to deal in the Software without restriction, including without limitation
   9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  10 * and/or sell copies of the Software, and to permit persons to whom the
  11 * Software is furnished to do so, subject to the following conditions:
  12 *
  13 * The above copyright notice and this permission notice shall be included in
  14 * all copies or substantial portions of the Software.
  15 *
  16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  19 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  22 * OTHER DEALINGS IN THE SOFTWARE.
  23 *
  24 */
  25
  26#include <linux/kthread.h>
  27#include <linux/pci.h>
  28#include <linux/uaccess.h>
  29#include <linux/pm_runtime.h>
  30
  31#include "amdgpu.h"
  32#include "amdgpu_pm.h"
  33#include "amdgpu_dm_debugfs.h"
  34#include "amdgpu_ras.h"
  35#include "amdgpu_rap.h"
  36#include "amdgpu_securedisplay.h"
  37#include "amdgpu_fw_attestation.h"
  38#include "amdgpu_umr.h"
  39
  40#if defined(CONFIG_DEBUG_FS)
  41
  42/**
  43 * amdgpu_debugfs_process_reg_op - Handle MMIO register reads/writes
  44 *
  45 * @read: True if reading
  46 * @f: open file handle
  47 * @buf: User buffer to write/read to
  48 * @size: Number of bytes to write/read
  49 * @pos:  Offset to seek to
  50 *
  51 * This debugfs entry has special meaning on the offset being sought.
  52 * Various bits have different meanings:
  53 *
  54 * Bit 62:  Indicates a GRBM bank switch is needed
  55 * Bit 61:  Indicates a SRBM bank switch is needed (implies bit 62 is
  56 * 	    zero)
  57 * Bits 24..33: The SE or ME selector if needed
  58 * Bits 34..43: The SH (or SA) or PIPE selector if needed
  59 * Bits 44..53: The INSTANCE (or CU/WGP) or QUEUE selector if needed
  60 *
  61 * Bit 23:  Indicates that the PM power gating lock should be held
  62 * 	    This is necessary to read registers that might be
  63 * 	    unreliable during a power gating transistion.
  64 *
  65 * The lower bits are the BYTE offset of the register to read.  This
  66 * allows reading multiple registers in a single call and having
  67 * the returned size reflect that.
  68 */
  69static int  amdgpu_debugfs_process_reg_op(bool read, struct file *f,
  70		char __user *buf, size_t size, loff_t *pos)
  71{
  72	struct amdgpu_device *adev = file_inode(f)->i_private;
  73	ssize_t result = 0;
  74	int r;
  75	bool pm_pg_lock, use_bank, use_ring;
  76	unsigned instance_bank, sh_bank, se_bank, me, pipe, queue, vmid;
  77
  78	pm_pg_lock = use_bank = use_ring = false;
  79	instance_bank = sh_bank = se_bank = me = pipe = queue = vmid = 0;
  80
  81	if (size & 0x3 || *pos & 0x3 ||
  82			((*pos & (1ULL << 62)) && (*pos & (1ULL << 61))))
  83		return -EINVAL;
  84
  85	/* are we reading registers for which a PG lock is necessary? */
  86	pm_pg_lock = (*pos >> 23) & 1;
  87
  88	if (*pos & (1ULL << 62)) {
  89		se_bank = (*pos & GENMASK_ULL(33, 24)) >> 24;
  90		sh_bank = (*pos & GENMASK_ULL(43, 34)) >> 34;
  91		instance_bank = (*pos & GENMASK_ULL(53, 44)) >> 44;
  92
  93		if (se_bank == 0x3FF)
  94			se_bank = 0xFFFFFFFF;
  95		if (sh_bank == 0x3FF)
  96			sh_bank = 0xFFFFFFFF;
  97		if (instance_bank == 0x3FF)
  98			instance_bank = 0xFFFFFFFF;
  99		use_bank = true;
 100	} else if (*pos & (1ULL << 61)) {
 101
 102		me = (*pos & GENMASK_ULL(33, 24)) >> 24;
 103		pipe = (*pos & GENMASK_ULL(43, 34)) >> 34;
 104		queue = (*pos & GENMASK_ULL(53, 44)) >> 44;
 105		vmid = (*pos & GENMASK_ULL(58, 54)) >> 54;
 106
 107		use_ring = true;
 108	} else {
 109		use_bank = use_ring = false;
 110	}
 111
 112	*pos &= (1UL << 22) - 1;
 113
 114	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
 115	if (r < 0) {
 116		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 117		return r;
 118	}
 119
 120	r = amdgpu_virt_enable_access_debugfs(adev);
 121	if (r < 0) {
 122		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 123		return r;
 124	}
 125
 126	if (use_bank) {
 127		if ((sh_bank != 0xFFFFFFFF && sh_bank >= adev->gfx.config.max_sh_per_se) ||
 128		    (se_bank != 0xFFFFFFFF && se_bank >= adev->gfx.config.max_shader_engines)) {
 129			pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 130			pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 131			amdgpu_virt_disable_access_debugfs(adev);
 132			return -EINVAL;
 133		}
 134		mutex_lock(&adev->grbm_idx_mutex);
 135		amdgpu_gfx_select_se_sh(adev, se_bank,
 136					sh_bank, instance_bank);
 137	} else if (use_ring) {
 138		mutex_lock(&adev->srbm_mutex);
 139		amdgpu_gfx_select_me_pipe_q(adev, me, pipe, queue, vmid);
 140	}
 141
 142	if (pm_pg_lock)
 143		mutex_lock(&adev->pm.mutex);
 144
 145	while (size) {
 146		uint32_t value;
 147
 148		if (read) {
 149			value = RREG32(*pos >> 2);
 150			r = put_user(value, (uint32_t *)buf);
 151		} else {
 152			r = get_user(value, (uint32_t *)buf);
 153			if (!r)
 154				amdgpu_mm_wreg_mmio_rlc(adev, *pos >> 2, value);
 155		}
 156		if (r) {
 157			result = r;
 158			goto end;
 159		}
 160
 161		result += 4;
 162		buf += 4;
 163		*pos += 4;
 164		size -= 4;
 165	}
 166
 167end:
 168	if (use_bank) {
 169		amdgpu_gfx_select_se_sh(adev, 0xffffffff, 0xffffffff, 0xffffffff);
 170		mutex_unlock(&adev->grbm_idx_mutex);
 171	} else if (use_ring) {
 172		amdgpu_gfx_select_me_pipe_q(adev, 0, 0, 0, 0);
 173		mutex_unlock(&adev->srbm_mutex);
 174	}
 175
 176	if (pm_pg_lock)
 177		mutex_unlock(&adev->pm.mutex);
 178
 179	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 180	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 181
 182	amdgpu_virt_disable_access_debugfs(adev);
 183	return result;
 184}
 185
 186/*
 187 * amdgpu_debugfs_regs_read - Callback for reading MMIO registers
 188 */
 189static ssize_t amdgpu_debugfs_regs_read(struct file *f, char __user *buf,
 190					size_t size, loff_t *pos)
 191{
 192	return amdgpu_debugfs_process_reg_op(true, f, buf, size, pos);
 193}
 194
 195/*
 196 * amdgpu_debugfs_regs_write - Callback for writing MMIO registers
 197 */
 198static ssize_t amdgpu_debugfs_regs_write(struct file *f, const char __user *buf,
 199					 size_t size, loff_t *pos)
 200{
 201	return amdgpu_debugfs_process_reg_op(false, f, (char __user *)buf, size, pos);
 202}
 203
 204static int amdgpu_debugfs_regs2_open(struct inode *inode, struct file *file)
 205{
 206	struct amdgpu_debugfs_regs2_data *rd;
 207
 208	rd = kzalloc(sizeof *rd, GFP_KERNEL);
 209	if (!rd)
 210		return -ENOMEM;
 211	rd->adev = file_inode(file)->i_private;
 212	file->private_data = rd;
 213	mutex_init(&rd->lock);
 214
 215	return 0;
 216}
 217
 218static int amdgpu_debugfs_regs2_release(struct inode *inode, struct file *file)
 219{
 220	struct amdgpu_debugfs_regs2_data *rd = file->private_data;
 221	mutex_destroy(&rd->lock);
 222	kfree(file->private_data);
 223	return 0;
 224}
 225
 226static ssize_t amdgpu_debugfs_regs2_op(struct file *f, char __user *buf, u32 offset, size_t size, int write_en)
 227{
 228	struct amdgpu_debugfs_regs2_data *rd = f->private_data;
 229	struct amdgpu_device *adev = rd->adev;
 230	ssize_t result = 0;
 231	int r;
 232	uint32_t value;
 233
 234	if (size & 0x3 || offset & 0x3)
 235		return -EINVAL;
 236
 237	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
 238	if (r < 0) {
 239		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 240		return r;
 241	}
 242
 243	r = amdgpu_virt_enable_access_debugfs(adev);
 244	if (r < 0) {
 245		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 246		return r;
 247	}
 248
 249	mutex_lock(&rd->lock);
 250
 251	if (rd->id.use_grbm) {
 252		if ((rd->id.grbm.sh != 0xFFFFFFFF && rd->id.grbm.sh >= adev->gfx.config.max_sh_per_se) ||
 253		    (rd->id.grbm.se != 0xFFFFFFFF && rd->id.grbm.se >= adev->gfx.config.max_shader_engines)) {
 254			pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 255			pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 256			amdgpu_virt_disable_access_debugfs(adev);
 257			mutex_unlock(&rd->lock);
 258			return -EINVAL;
 259		}
 260		mutex_lock(&adev->grbm_idx_mutex);
 261		amdgpu_gfx_select_se_sh(adev, rd->id.grbm.se,
 262								rd->id.grbm.sh,
 263								rd->id.grbm.instance);
 264	}
 265
 266	if (rd->id.use_srbm) {
 267		mutex_lock(&adev->srbm_mutex);
 268		amdgpu_gfx_select_me_pipe_q(adev, rd->id.srbm.me, rd->id.srbm.pipe,
 269									rd->id.srbm.queue, rd->id.srbm.vmid);
 270	}
 271
 272	if (rd->id.pg_lock)
 273		mutex_lock(&adev->pm.mutex);
 274
 275	while (size) {
 276		if (!write_en) {
 277			value = RREG32(offset >> 2);
 278			r = put_user(value, (uint32_t *)buf);
 279		} else {
 280			r = get_user(value, (uint32_t *)buf);
 281			if (!r)
 282				amdgpu_mm_wreg_mmio_rlc(adev, offset >> 2, value);
 283		}
 284		if (r) {
 285			result = r;
 286			goto end;
 287		}
 288		offset += 4;
 289		size -= 4;
 290		result += 4;
 291		buf += 4;
 292	}
 293end:
 294	if (rd->id.use_grbm) {
 295		amdgpu_gfx_select_se_sh(adev, 0xffffffff, 0xffffffff, 0xffffffff);
 296		mutex_unlock(&adev->grbm_idx_mutex);
 297	}
 298
 299	if (rd->id.use_srbm) {
 300		amdgpu_gfx_select_me_pipe_q(adev, 0, 0, 0, 0);
 301		mutex_unlock(&adev->srbm_mutex);
 302	}
 303
 304	if (rd->id.pg_lock)
 305		mutex_unlock(&adev->pm.mutex);
 306
 307	mutex_unlock(&rd->lock);
 308
 309	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 310	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 311
 312	amdgpu_virt_disable_access_debugfs(adev);
 313	return result;
 314}
 315
 316static long amdgpu_debugfs_regs2_ioctl(struct file *f, unsigned int cmd, unsigned long data)
 317{
 318	struct amdgpu_debugfs_regs2_data *rd = f->private_data;
 319	int r;
 320
 321	switch (cmd) {
 322	case AMDGPU_DEBUGFS_REGS2_IOC_SET_STATE:
 323		mutex_lock(&rd->lock);
 324		r = copy_from_user(&rd->id, (struct amdgpu_debugfs_regs2_iocdata *)data, sizeof rd->id);
 325		mutex_unlock(&rd->lock);
 326		return r ? -EINVAL : 0;
 327	default:
 328		return -EINVAL;
 329	}
 330	return 0;
 331}
 332
 333static ssize_t amdgpu_debugfs_regs2_read(struct file *f, char __user *buf, size_t size, loff_t *pos)
 334{
 335	return amdgpu_debugfs_regs2_op(f, buf, *pos, size, 0);
 336}
 337
 338static ssize_t amdgpu_debugfs_regs2_write(struct file *f, const char __user *buf, size_t size, loff_t *pos)
 339{
 340	return amdgpu_debugfs_regs2_op(f, (char __user *)buf, *pos, size, 1);
 341}
 342
 343
 344/**
 345 * amdgpu_debugfs_regs_pcie_read - Read from a PCIE register
 346 *
 347 * @f: open file handle
 348 * @buf: User buffer to store read data in
 349 * @size: Number of bytes to read
 350 * @pos:  Offset to seek to
 351 *
 352 * The lower bits are the BYTE offset of the register to read.  This
 353 * allows reading multiple registers in a single call and having
 354 * the returned size reflect that.
 355 */
 356static ssize_t amdgpu_debugfs_regs_pcie_read(struct file *f, char __user *buf,
 357					size_t size, loff_t *pos)
 358{
 359	struct amdgpu_device *adev = file_inode(f)->i_private;
 360	ssize_t result = 0;
 361	int r;
 362
 363	if (size & 0x3 || *pos & 0x3)
 364		return -EINVAL;
 365
 366	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
 367	if (r < 0) {
 368		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 369		return r;
 370	}
 371
 372	r = amdgpu_virt_enable_access_debugfs(adev);
 373	if (r < 0) {
 374		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 375		return r;
 376	}
 377
 378	while (size) {
 379		uint32_t value;
 380
 381		value = RREG32_PCIE(*pos);
 382		r = put_user(value, (uint32_t *)buf);
 383		if (r) {
 384			pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 385			pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 386			amdgpu_virt_disable_access_debugfs(adev);
 387			return r;
 388		}
 389
 390		result += 4;
 391		buf += 4;
 392		*pos += 4;
 393		size -= 4;
 394	}
 395
 396	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 397	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 398
 399	amdgpu_virt_disable_access_debugfs(adev);
 400	return result;
 401}
 402
 403/**
 404 * amdgpu_debugfs_regs_pcie_write - Write to a PCIE register
 405 *
 406 * @f: open file handle
 407 * @buf: User buffer to write data from
 408 * @size: Number of bytes to write
 409 * @pos:  Offset to seek to
 410 *
 411 * The lower bits are the BYTE offset of the register to write.  This
 412 * allows writing multiple registers in a single call and having
 413 * the returned size reflect that.
 414 */
 415static ssize_t amdgpu_debugfs_regs_pcie_write(struct file *f, const char __user *buf,
 416					 size_t size, loff_t *pos)
 417{
 418	struct amdgpu_device *adev = file_inode(f)->i_private;
 419	ssize_t result = 0;
 420	int r;
 421
 422	if (size & 0x3 || *pos & 0x3)
 423		return -EINVAL;
 424
 425	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
 426	if (r < 0) {
 427		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 428		return r;
 429	}
 430
 431	r = amdgpu_virt_enable_access_debugfs(adev);
 432	if (r < 0) {
 433		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 434		return r;
 435	}
 436
 437	while (size) {
 438		uint32_t value;
 439
 440		r = get_user(value, (uint32_t *)buf);
 441		if (r) {
 442			pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 443			pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 444			amdgpu_virt_disable_access_debugfs(adev);
 445			return r;
 446		}
 447
 448		WREG32_PCIE(*pos, value);
 449
 450		result += 4;
 451		buf += 4;
 452		*pos += 4;
 453		size -= 4;
 454	}
 455
 456	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 457	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 458
 459	amdgpu_virt_disable_access_debugfs(adev);
 460	return result;
 461}
 462
 463/**
 464 * amdgpu_debugfs_regs_didt_read - Read from a DIDT register
 465 *
 466 * @f: open file handle
 467 * @buf: User buffer to store read data in
 468 * @size: Number of bytes to read
 469 * @pos:  Offset to seek to
 470 *
 471 * The lower bits are the BYTE offset of the register to read.  This
 472 * allows reading multiple registers in a single call and having
 473 * the returned size reflect that.
 474 */
 475static ssize_t amdgpu_debugfs_regs_didt_read(struct file *f, char __user *buf,
 476					size_t size, loff_t *pos)
 477{
 478	struct amdgpu_device *adev = file_inode(f)->i_private;
 479	ssize_t result = 0;
 480	int r;
 481
 482	if (size & 0x3 || *pos & 0x3)
 483		return -EINVAL;
 484
 485	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
 486	if (r < 0) {
 487		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 488		return r;
 489	}
 490
 491	r = amdgpu_virt_enable_access_debugfs(adev);
 492	if (r < 0) {
 493		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 494		return r;
 495	}
 496
 497	while (size) {
 498		uint32_t value;
 499
 500		value = RREG32_DIDT(*pos >> 2);
 501		r = put_user(value, (uint32_t *)buf);
 502		if (r) {
 503			pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 504			pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 505			amdgpu_virt_disable_access_debugfs(adev);
 506			return r;
 507		}
 508
 509		result += 4;
 510		buf += 4;
 511		*pos += 4;
 512		size -= 4;
 513	}
 514
 515	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 516	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 517
 518	amdgpu_virt_disable_access_debugfs(adev);
 519	return result;
 520}
 521
 522/**
 523 * amdgpu_debugfs_regs_didt_write - Write to a DIDT register
 524 *
 525 * @f: open file handle
 526 * @buf: User buffer to write data from
 527 * @size: Number of bytes to write
 528 * @pos:  Offset to seek to
 529 *
 530 * The lower bits are the BYTE offset of the register to write.  This
 531 * allows writing multiple registers in a single call and having
 532 * the returned size reflect that.
 533 */
 534static ssize_t amdgpu_debugfs_regs_didt_write(struct file *f, const char __user *buf,
 535					 size_t size, loff_t *pos)
 536{
 537	struct amdgpu_device *adev = file_inode(f)->i_private;
 538	ssize_t result = 0;
 539	int r;
 540
 541	if (size & 0x3 || *pos & 0x3)
 542		return -EINVAL;
 543
 544	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
 545	if (r < 0) {
 546		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 547		return r;
 548	}
 549
 550	r = amdgpu_virt_enable_access_debugfs(adev);
 551	if (r < 0) {
 552		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 553		return r;
 554	}
 555
 556	while (size) {
 557		uint32_t value;
 558
 559		r = get_user(value, (uint32_t *)buf);
 560		if (r) {
 561			pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 562			pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 563			amdgpu_virt_disable_access_debugfs(adev);
 564			return r;
 565		}
 566
 567		WREG32_DIDT(*pos >> 2, value);
 568
 569		result += 4;
 570		buf += 4;
 571		*pos += 4;
 572		size -= 4;
 573	}
 574
 575	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 576	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 577
 578	amdgpu_virt_disable_access_debugfs(adev);
 579	return result;
 580}
 581
 582/**
 583 * amdgpu_debugfs_regs_smc_read - Read from a SMC register
 584 *
 585 * @f: open file handle
 586 * @buf: User buffer to store read data in
 587 * @size: Number of bytes to read
 588 * @pos:  Offset to seek to
 589 *
 590 * The lower bits are the BYTE offset of the register to read.  This
 591 * allows reading multiple registers in a single call and having
 592 * the returned size reflect that.
 593 */
 594static ssize_t amdgpu_debugfs_regs_smc_read(struct file *f, char __user *buf,
 595					size_t size, loff_t *pos)
 596{
 597	struct amdgpu_device *adev = file_inode(f)->i_private;
 598	ssize_t result = 0;
 599	int r;
 600
 601	if (size & 0x3 || *pos & 0x3)
 602		return -EINVAL;
 603
 604	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
 605	if (r < 0) {
 606		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 607		return r;
 608	}
 609
 610	r = amdgpu_virt_enable_access_debugfs(adev);
 611	if (r < 0) {
 612		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 613		return r;
 614	}
 615
 616	while (size) {
 617		uint32_t value;
 618
 619		value = RREG32_SMC(*pos);
 620		r = put_user(value, (uint32_t *)buf);
 621		if (r) {
 622			pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 623			pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 624			amdgpu_virt_disable_access_debugfs(adev);
 625			return r;
 626		}
 627
 628		result += 4;
 629		buf += 4;
 630		*pos += 4;
 631		size -= 4;
 632	}
 633
 634	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 635	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 636
 637	amdgpu_virt_disable_access_debugfs(adev);
 638	return result;
 639}
 640
 641/**
 642 * amdgpu_debugfs_regs_smc_write - Write to a SMC register
 643 *
 644 * @f: open file handle
 645 * @buf: User buffer to write data from
 646 * @size: Number of bytes to write
 647 * @pos:  Offset to seek to
 648 *
 649 * The lower bits are the BYTE offset of the register to write.  This
 650 * allows writing multiple registers in a single call and having
 651 * the returned size reflect that.
 652 */
 653static ssize_t amdgpu_debugfs_regs_smc_write(struct file *f, const char __user *buf,
 654					 size_t size, loff_t *pos)
 655{
 656	struct amdgpu_device *adev = file_inode(f)->i_private;
 657	ssize_t result = 0;
 658	int r;
 659
 660	if (size & 0x3 || *pos & 0x3)
 661		return -EINVAL;
 662
 663	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
 664	if (r < 0) {
 665		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 666		return r;
 667	}
 668
 669	r = amdgpu_virt_enable_access_debugfs(adev);
 670	if (r < 0) {
 671		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 672		return r;
 673	}
 674
 675	while (size) {
 676		uint32_t value;
 677
 678		r = get_user(value, (uint32_t *)buf);
 679		if (r) {
 680			pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 681			pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 682			amdgpu_virt_disable_access_debugfs(adev);
 683			return r;
 684		}
 685
 686		WREG32_SMC(*pos, value);
 687
 688		result += 4;
 689		buf += 4;
 690		*pos += 4;
 691		size -= 4;
 692	}
 693
 694	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 695	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 696
 697	amdgpu_virt_disable_access_debugfs(adev);
 698	return result;
 699}
 700
 701/**
 702 * amdgpu_debugfs_gca_config_read - Read from gfx config data
 703 *
 704 * @f: open file handle
 705 * @buf: User buffer to store read data in
 706 * @size: Number of bytes to read
 707 * @pos:  Offset to seek to
 708 *
 709 * This file is used to access configuration data in a somewhat
 710 * stable fashion.  The format is a series of DWORDs with the first
 711 * indicating which revision it is.  New content is appended to the
 712 * end so that older software can still read the data.
 713 */
 714
 715static ssize_t amdgpu_debugfs_gca_config_read(struct file *f, char __user *buf,
 716					size_t size, loff_t *pos)
 717{
 718	struct amdgpu_device *adev = file_inode(f)->i_private;
 719	ssize_t result = 0;
 720	int r;
 721	uint32_t *config, no_regs = 0;
 722
 723	if (size & 0x3 || *pos & 0x3)
 724		return -EINVAL;
 725
 726	config = kmalloc_array(256, sizeof(*config), GFP_KERNEL);
 727	if (!config)
 728		return -ENOMEM;
 729
 730	/* version, increment each time something is added */
 731	config[no_regs++] = 3;
 732	config[no_regs++] = adev->gfx.config.max_shader_engines;
 733	config[no_regs++] = adev->gfx.config.max_tile_pipes;
 734	config[no_regs++] = adev->gfx.config.max_cu_per_sh;
 735	config[no_regs++] = adev->gfx.config.max_sh_per_se;
 736	config[no_regs++] = adev->gfx.config.max_backends_per_se;
 737	config[no_regs++] = adev->gfx.config.max_texture_channel_caches;
 738	config[no_regs++] = adev->gfx.config.max_gprs;
 739	config[no_regs++] = adev->gfx.config.max_gs_threads;
 740	config[no_regs++] = adev->gfx.config.max_hw_contexts;
 741	config[no_regs++] = adev->gfx.config.sc_prim_fifo_size_frontend;
 742	config[no_regs++] = adev->gfx.config.sc_prim_fifo_size_backend;
 743	config[no_regs++] = adev->gfx.config.sc_hiz_tile_fifo_size;
 744	config[no_regs++] = adev->gfx.config.sc_earlyz_tile_fifo_size;
 745	config[no_regs++] = adev->gfx.config.num_tile_pipes;
 746	config[no_regs++] = adev->gfx.config.backend_enable_mask;
 747	config[no_regs++] = adev->gfx.config.mem_max_burst_length_bytes;
 748	config[no_regs++] = adev->gfx.config.mem_row_size_in_kb;
 749	config[no_regs++] = adev->gfx.config.shader_engine_tile_size;
 750	config[no_regs++] = adev->gfx.config.num_gpus;
 751	config[no_regs++] = adev->gfx.config.multi_gpu_tile_size;
 752	config[no_regs++] = adev->gfx.config.mc_arb_ramcfg;
 753	config[no_regs++] = adev->gfx.config.gb_addr_config;
 754	config[no_regs++] = adev->gfx.config.num_rbs;
 755
 756	/* rev==1 */
 757	config[no_regs++] = adev->rev_id;
 758	config[no_regs++] = adev->pg_flags;
 759	config[no_regs++] = adev->cg_flags;
 760
 761	/* rev==2 */
 762	config[no_regs++] = adev->family;
 763	config[no_regs++] = adev->external_rev_id;
 764
 765	/* rev==3 */
 766	config[no_regs++] = adev->pdev->device;
 767	config[no_regs++] = adev->pdev->revision;
 768	config[no_regs++] = adev->pdev->subsystem_device;
 769	config[no_regs++] = adev->pdev->subsystem_vendor;
 770
 771	while (size && (*pos < no_regs * 4)) {
 772		uint32_t value;
 773
 774		value = config[*pos >> 2];
 775		r = put_user(value, (uint32_t *)buf);
 776		if (r) {
 777			kfree(config);
 778			return r;
 779		}
 780
 781		result += 4;
 782		buf += 4;
 783		*pos += 4;
 784		size -= 4;
 785	}
 786
 787	kfree(config);
 788	return result;
 789}
 790
 791/**
 792 * amdgpu_debugfs_sensor_read - Read from the powerplay sensors
 793 *
 794 * @f: open file handle
 795 * @buf: User buffer to store read data in
 796 * @size: Number of bytes to read
 797 * @pos:  Offset to seek to
 798 *
 799 * The offset is treated as the BYTE address of one of the sensors
 800 * enumerated in amd/include/kgd_pp_interface.h under the
 801 * 'amd_pp_sensors' enumeration.  For instance to read the UVD VCLK
 802 * you would use the offset 3 * 4 = 12.
 803 */
 804static ssize_t amdgpu_debugfs_sensor_read(struct file *f, char __user *buf,
 805					size_t size, loff_t *pos)
 806{
 807	struct amdgpu_device *adev = file_inode(f)->i_private;
 808	int idx, x, outsize, r, valuesize;
 809	uint32_t values[16];
 810
 811	if (size & 3 || *pos & 0x3)
 812		return -EINVAL;
 813
 814	if (!adev->pm.dpm_enabled)
 815		return -EINVAL;
 816
 817	/* convert offset to sensor number */
 818	idx = *pos >> 2;
 819
 820	valuesize = sizeof(values);
 821
 822	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
 823	if (r < 0) {
 824		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 825		return r;
 826	}
 827
 828	r = amdgpu_virt_enable_access_debugfs(adev);
 829	if (r < 0) {
 830		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 831		return r;
 832	}
 833
 834	r = amdgpu_dpm_read_sensor(adev, idx, &values[0], &valuesize);
 835
 836	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 837	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 838
 839	if (r) {
 840		amdgpu_virt_disable_access_debugfs(adev);
 841		return r;
 842	}
 843
 844	if (size > valuesize) {
 845		amdgpu_virt_disable_access_debugfs(adev);
 846		return -EINVAL;
 847	}
 848
 849	outsize = 0;
 850	x = 0;
 851	if (!r) {
 852		while (size) {
 853			r = put_user(values[x++], (int32_t *)buf);
 854			buf += 4;
 855			size -= 4;
 856			outsize += 4;
 857		}
 858	}
 859
 860	amdgpu_virt_disable_access_debugfs(adev);
 861	return !r ? outsize : r;
 862}
 863
 864/** amdgpu_debugfs_wave_read - Read WAVE STATUS data
 865 *
 866 * @f: open file handle
 867 * @buf: User buffer to store read data in
 868 * @size: Number of bytes to read
 869 * @pos:  Offset to seek to
 870 *
 871 * The offset being sought changes which wave that the status data
 872 * will be returned for.  The bits are used as follows:
 873 *
 874 * Bits 0..6: 	Byte offset into data
 875 * Bits 7..14:	SE selector
 876 * Bits 15..22:	SH/SA selector
 877 * Bits 23..30: CU/{WGP+SIMD} selector
 878 * Bits 31..36: WAVE ID selector
 879 * Bits 37..44: SIMD ID selector
 880 *
 881 * The returned data begins with one DWORD of version information
 882 * Followed by WAVE STATUS registers relevant to the GFX IP version
 883 * being used.  See gfx_v8_0_read_wave_data() for an example output.
 884 */
 885static ssize_t amdgpu_debugfs_wave_read(struct file *f, char __user *buf,
 886					size_t size, loff_t *pos)
 887{
 888	struct amdgpu_device *adev = f->f_inode->i_private;
 889	int r, x;
 890	ssize_t result = 0;
 891	uint32_t offset, se, sh, cu, wave, simd, data[32];
 892
 893	if (size & 3 || *pos & 3)
 894		return -EINVAL;
 895
 896	/* decode offset */
 897	offset = (*pos & GENMASK_ULL(6, 0));
 898	se = (*pos & GENMASK_ULL(14, 7)) >> 7;
 899	sh = (*pos & GENMASK_ULL(22, 15)) >> 15;
 900	cu = (*pos & GENMASK_ULL(30, 23)) >> 23;
 901	wave = (*pos & GENMASK_ULL(36, 31)) >> 31;
 902	simd = (*pos & GENMASK_ULL(44, 37)) >> 37;
 903
 904	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
 905	if (r < 0) {
 906		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 907		return r;
 908	}
 909
 910	r = amdgpu_virt_enable_access_debugfs(adev);
 911	if (r < 0) {
 912		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 913		return r;
 914	}
 915
 916	/* switch to the specific se/sh/cu */
 917	mutex_lock(&adev->grbm_idx_mutex);
 918	amdgpu_gfx_select_se_sh(adev, se, sh, cu);
 919
 920	x = 0;
 921	if (adev->gfx.funcs->read_wave_data)
 922		adev->gfx.funcs->read_wave_data(adev, simd, wave, data, &x);
 923
 924	amdgpu_gfx_select_se_sh(adev, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF);
 925	mutex_unlock(&adev->grbm_idx_mutex);
 926
 927	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
 928	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
 929
 930	if (!x) {
 931		amdgpu_virt_disable_access_debugfs(adev);
 932		return -EINVAL;
 933	}
 934
 935	while (size && (offset < x * 4)) {
 936		uint32_t value;
 937
 938		value = data[offset >> 2];
 939		r = put_user(value, (uint32_t *)buf);
 940		if (r) {
 941			amdgpu_virt_disable_access_debugfs(adev);
 942			return r;
 943		}
 944
 945		result += 4;
 946		buf += 4;
 947		offset += 4;
 948		size -= 4;
 949	}
 950
 951	amdgpu_virt_disable_access_debugfs(adev);
 952	return result;
 953}
 954
 955/** amdgpu_debugfs_gpr_read - Read wave gprs
 956 *
 957 * @f: open file handle
 958 * @buf: User buffer to store read data in
 959 * @size: Number of bytes to read
 960 * @pos:  Offset to seek to
 961 *
 962 * The offset being sought changes which wave that the status data
 963 * will be returned for.  The bits are used as follows:
 964 *
 965 * Bits 0..11:	Byte offset into data
 966 * Bits 12..19:	SE selector
 967 * Bits 20..27:	SH/SA selector
 968 * Bits 28..35: CU/{WGP+SIMD} selector
 969 * Bits 36..43: WAVE ID selector
 970 * Bits 37..44: SIMD ID selector
 971 * Bits 52..59: Thread selector
 972 * Bits 60..61: Bank selector (VGPR=0,SGPR=1)
 973 *
 974 * The return data comes from the SGPR or VGPR register bank for
 975 * the selected operational unit.
 976 */
 977static ssize_t amdgpu_debugfs_gpr_read(struct file *f, char __user *buf,
 978					size_t size, loff_t *pos)
 979{
 980	struct amdgpu_device *adev = f->f_inode->i_private;
 981	int r;
 982	ssize_t result = 0;
 983	uint32_t offset, se, sh, cu, wave, simd, thread, bank, *data;
 984
 985	if (size > 4096 || size & 3 || *pos & 3)
 986		return -EINVAL;
 987
 988	/* decode offset */
 989	offset = (*pos & GENMASK_ULL(11, 0)) >> 2;
 990	se = (*pos & GENMASK_ULL(19, 12)) >> 12;
 991	sh = (*pos & GENMASK_ULL(27, 20)) >> 20;
 992	cu = (*pos & GENMASK_ULL(35, 28)) >> 28;
 993	wave = (*pos & GENMASK_ULL(43, 36)) >> 36;
 994	simd = (*pos & GENMASK_ULL(51, 44)) >> 44;
 995	thread = (*pos & GENMASK_ULL(59, 52)) >> 52;
 996	bank = (*pos & GENMASK_ULL(61, 60)) >> 60;
 997
 998	data = kcalloc(1024, sizeof(*data), GFP_KERNEL);
 999	if (!data)
1000		return -ENOMEM;
1001
1002	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
1003	if (r < 0)
1004		goto err;
1005
1006	r = amdgpu_virt_enable_access_debugfs(adev);
1007	if (r < 0)
1008		goto err;
1009
1010	/* switch to the specific se/sh/cu */
1011	mutex_lock(&adev->grbm_idx_mutex);
1012	amdgpu_gfx_select_se_sh(adev, se, sh, cu);
1013
1014	if (bank == 0) {
1015		if (adev->gfx.funcs->read_wave_vgprs)
1016			adev->gfx.funcs->read_wave_vgprs(adev, simd, wave, thread, offset, size>>2, data);
1017	} else {
1018		if (adev->gfx.funcs->read_wave_sgprs)
1019			adev->gfx.funcs->read_wave_sgprs(adev, simd, wave, offset, size>>2, data);
1020	}
1021
1022	amdgpu_gfx_select_se_sh(adev, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF);
1023	mutex_unlock(&adev->grbm_idx_mutex);
1024
1025	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
1026	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
1027
1028	while (size) {
1029		uint32_t value;
1030
1031		value = data[result >> 2];
1032		r = put_user(value, (uint32_t *)buf);
1033		if (r) {
1034			amdgpu_virt_disable_access_debugfs(adev);
1035			goto err;
1036		}
1037
1038		result += 4;
1039		buf += 4;
1040		size -= 4;
1041	}
1042
1043	kfree(data);
1044	amdgpu_virt_disable_access_debugfs(adev);
1045	return result;
1046
1047err:
1048	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
1049	kfree(data);
1050	return r;
1051}
1052
1053/**
1054 * amdgpu_debugfs_gfxoff_write - Enable/disable GFXOFF
1055 *
1056 * @f: open file handle
1057 * @buf: User buffer to write data from
1058 * @size: Number of bytes to write
1059 * @pos:  Offset to seek to
1060 *
1061 * Write a 32-bit zero to disable or a 32-bit non-zero to enable
1062 */
1063static ssize_t amdgpu_debugfs_gfxoff_write(struct file *f, const char __user *buf,
1064					 size_t size, loff_t *pos)
1065{
1066	struct amdgpu_device *adev = file_inode(f)->i_private;
1067	ssize_t result = 0;
1068	int r;
1069
1070	if (size & 0x3 || *pos & 0x3)
1071		return -EINVAL;
1072
1073	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
1074	if (r < 0) {
1075		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
1076		return r;
1077	}
1078
1079	while (size) {
1080		uint32_t value;
1081
1082		r = get_user(value, (uint32_t *)buf);
1083		if (r) {
1084			pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
1085			pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
1086			return r;
1087		}
1088
1089		amdgpu_gfx_off_ctrl(adev, value ? true : false);
1090
1091		result += 4;
1092		buf += 4;
1093		*pos += 4;
1094		size -= 4;
1095	}
1096
1097	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
1098	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
1099
1100	return result;
1101}
1102
1103
1104/**
1105 * amdgpu_debugfs_gfxoff_read - read gfxoff status
1106 *
1107 * @f: open file handle
1108 * @buf: User buffer to store read data in
1109 * @size: Number of bytes to read
1110 * @pos:  Offset to seek to
1111 */
1112static ssize_t amdgpu_debugfs_gfxoff_read(struct file *f, char __user *buf,
1113					 size_t size, loff_t *pos)
1114{
1115	struct amdgpu_device *adev = file_inode(f)->i_private;
1116	ssize_t result = 0;
1117	int r;
1118
1119	if (size & 0x3 || *pos & 0x3)
1120		return -EINVAL;
1121
1122	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
1123	if (r < 0)
1124		return r;
1125
1126	while (size) {
1127		uint32_t value;
1128
1129		r = amdgpu_get_gfx_off_status(adev, &value);
1130		if (r) {
1131			pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
1132			pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
1133			return r;
1134		}
1135
1136		r = put_user(value, (uint32_t *)buf);
1137		if (r) {
1138			pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
1139			pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
1140			return r;
1141		}
1142
1143		result += 4;
1144		buf += 4;
1145		*pos += 4;
1146		size -= 4;
1147	}
1148
1149	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
1150	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
1151
1152	return result;
1153}
1154
1155static const struct file_operations amdgpu_debugfs_regs2_fops = {
1156	.owner = THIS_MODULE,
1157	.unlocked_ioctl = amdgpu_debugfs_regs2_ioctl,
1158	.read = amdgpu_debugfs_regs2_read,
1159	.write = amdgpu_debugfs_regs2_write,
1160	.open = amdgpu_debugfs_regs2_open,
1161	.release = amdgpu_debugfs_regs2_release,
1162	.llseek = default_llseek
1163};
1164
1165static const struct file_operations amdgpu_debugfs_regs_fops = {
1166	.owner = THIS_MODULE,
1167	.read = amdgpu_debugfs_regs_read,
1168	.write = amdgpu_debugfs_regs_write,
1169	.llseek = default_llseek
1170};
1171static const struct file_operations amdgpu_debugfs_regs_didt_fops = {
1172	.owner = THIS_MODULE,
1173	.read = amdgpu_debugfs_regs_didt_read,
1174	.write = amdgpu_debugfs_regs_didt_write,
1175	.llseek = default_llseek
1176};
1177static const struct file_operations amdgpu_debugfs_regs_pcie_fops = {
1178	.owner = THIS_MODULE,
1179	.read = amdgpu_debugfs_regs_pcie_read,
1180	.write = amdgpu_debugfs_regs_pcie_write,
1181	.llseek = default_llseek
1182};
1183static const struct file_operations amdgpu_debugfs_regs_smc_fops = {
1184	.owner = THIS_MODULE,
1185	.read = amdgpu_debugfs_regs_smc_read,
1186	.write = amdgpu_debugfs_regs_smc_write,
1187	.llseek = default_llseek
1188};
1189
1190static const struct file_operations amdgpu_debugfs_gca_config_fops = {
1191	.owner = THIS_MODULE,
1192	.read = amdgpu_debugfs_gca_config_read,
1193	.llseek = default_llseek
1194};
1195
1196static const struct file_operations amdgpu_debugfs_sensors_fops = {
1197	.owner = THIS_MODULE,
1198	.read = amdgpu_debugfs_sensor_read,
1199	.llseek = default_llseek
1200};
1201
1202static const struct file_operations amdgpu_debugfs_wave_fops = {
1203	.owner = THIS_MODULE,
1204	.read = amdgpu_debugfs_wave_read,
1205	.llseek = default_llseek
1206};
1207static const struct file_operations amdgpu_debugfs_gpr_fops = {
1208	.owner = THIS_MODULE,
1209	.read = amdgpu_debugfs_gpr_read,
1210	.llseek = default_llseek
1211};
1212
1213static const struct file_operations amdgpu_debugfs_gfxoff_fops = {
1214	.owner = THIS_MODULE,
1215	.read = amdgpu_debugfs_gfxoff_read,
1216	.write = amdgpu_debugfs_gfxoff_write,
1217	.llseek = default_llseek
1218};
1219
1220static const struct file_operations *debugfs_regs[] = {
1221	&amdgpu_debugfs_regs_fops,
1222	&amdgpu_debugfs_regs2_fops,
1223	&amdgpu_debugfs_regs_didt_fops,
1224	&amdgpu_debugfs_regs_pcie_fops,
1225	&amdgpu_debugfs_regs_smc_fops,
1226	&amdgpu_debugfs_gca_config_fops,
1227	&amdgpu_debugfs_sensors_fops,
1228	&amdgpu_debugfs_wave_fops,
1229	&amdgpu_debugfs_gpr_fops,
1230	&amdgpu_debugfs_gfxoff_fops,
1231};
1232
1233static const char *debugfs_regs_names[] = {
1234	"amdgpu_regs",
1235	"amdgpu_regs2",
1236	"amdgpu_regs_didt",
1237	"amdgpu_regs_pcie",
1238	"amdgpu_regs_smc",
1239	"amdgpu_gca_config",
1240	"amdgpu_sensors",
1241	"amdgpu_wave",
1242	"amdgpu_gpr",
1243	"amdgpu_gfxoff",
1244};
1245
1246/**
1247 * amdgpu_debugfs_regs_init -	Initialize debugfs entries that provide
1248 * 				register access.
1249 *
1250 * @adev: The device to attach the debugfs entries to
1251 */
1252int amdgpu_debugfs_regs_init(struct amdgpu_device *adev)
1253{
1254	struct drm_minor *minor = adev_to_drm(adev)->primary;
1255	struct dentry *ent, *root = minor->debugfs_root;
1256	unsigned int i;
1257
1258	for (i = 0; i < ARRAY_SIZE(debugfs_regs); i++) {
1259		ent = debugfs_create_file(debugfs_regs_names[i],
1260					  S_IFREG | S_IRUGO, root,
1261					  adev, debugfs_regs[i]);
1262		if (!i && !IS_ERR_OR_NULL(ent))
1263			i_size_write(ent->d_inode, adev->rmmio_size);
1264	}
1265
1266	return 0;
1267}
1268
1269static int amdgpu_debugfs_test_ib_show(struct seq_file *m, void *unused)
1270{
1271	struct amdgpu_device *adev = (struct amdgpu_device *)m->private;
1272	struct drm_device *dev = adev_to_drm(adev);
1273	int r = 0, i;
1274
1275	r = pm_runtime_get_sync(dev->dev);
1276	if (r < 0) {
1277		pm_runtime_put_autosuspend(dev->dev);
1278		return r;
1279	}
1280
1281	/* Avoid accidently unparking the sched thread during GPU reset */
1282	r = down_write_killable(&adev->reset_sem);
1283	if (r)
1284		return r;
1285
1286	/* hold on the scheduler */
1287	for (i = 0; i < AMDGPU_MAX_RINGS; i++) {
1288		struct amdgpu_ring *ring = adev->rings[i];
1289
1290		if (!ring || !ring->sched.thread)
1291			continue;
1292		kthread_park(ring->sched.thread);
1293	}
1294
1295	seq_printf(m, "run ib test:\n");
1296	r = amdgpu_ib_ring_tests(adev);
1297	if (r)
1298		seq_printf(m, "ib ring tests failed (%d).\n", r);
1299	else
1300		seq_printf(m, "ib ring tests passed.\n");
1301
1302	/* go on the scheduler */
1303	for (i = 0; i < AMDGPU_MAX_RINGS; i++) {
1304		struct amdgpu_ring *ring = adev->rings[i];
1305
1306		if (!ring || !ring->sched.thread)
1307			continue;
1308		kthread_unpark(ring->sched.thread);
1309	}
1310
1311	up_write(&adev->reset_sem);
1312
1313	pm_runtime_mark_last_busy(dev->dev);
1314	pm_runtime_put_autosuspend(dev->dev);
1315
1316	return 0;
1317}
1318
1319static int amdgpu_debugfs_evict_vram(void *data, u64 *val)
1320{
1321	struct amdgpu_device *adev = (struct amdgpu_device *)data;
1322	struct drm_device *dev = adev_to_drm(adev);
1323	int r;
1324
1325	r = pm_runtime_get_sync(dev->dev);
1326	if (r < 0) {
1327		pm_runtime_put_autosuspend(dev->dev);
1328		return r;
1329	}
1330
1331	*val = amdgpu_ttm_evict_resources(adev, TTM_PL_VRAM);
1332
1333	pm_runtime_mark_last_busy(dev->dev);
1334	pm_runtime_put_autosuspend(dev->dev);
1335
1336	return 0;
1337}
1338
1339
1340static int amdgpu_debugfs_evict_gtt(void *data, u64 *val)
1341{
1342	struct amdgpu_device *adev = (struct amdgpu_device *)data;
1343	struct drm_device *dev = adev_to_drm(adev);
1344	int r;
1345
1346	r = pm_runtime_get_sync(dev->dev);
1347	if (r < 0) {
1348		pm_runtime_put_autosuspend(dev->dev);
1349		return r;
1350	}
1351
1352	*val = amdgpu_ttm_evict_resources(adev, TTM_PL_TT);
1353
1354	pm_runtime_mark_last_busy(dev->dev);
1355	pm_runtime_put_autosuspend(dev->dev);
1356
1357	return 0;
1358}
1359
1360
1361static int amdgpu_debugfs_vm_info_show(struct seq_file *m, void *unused)
1362{
1363	struct amdgpu_device *adev = (struct amdgpu_device *)m->private;
1364	struct drm_device *dev = adev_to_drm(adev);
1365	struct drm_file *file;
1366	int r;
1367
1368	r = mutex_lock_interruptible(&dev->filelist_mutex);
1369	if (r)
1370		return r;
1371
1372	list_for_each_entry(file, &dev->filelist, lhead) {
1373		struct amdgpu_fpriv *fpriv = file->driver_priv;
1374		struct amdgpu_vm *vm = &fpriv->vm;
1375
1376		seq_printf(m, "pid:%d\tProcess:%s ----------\n",
1377				vm->task_info.pid, vm->task_info.process_name);
1378		r = amdgpu_bo_reserve(vm->root.bo, true);
1379		if (r)
1380			break;
1381		amdgpu_debugfs_vm_bo_info(vm, m);
1382		amdgpu_bo_unreserve(vm->root.bo);
1383	}
1384
1385	mutex_unlock(&dev->filelist_mutex);
1386
1387	return r;
1388}
1389
1390DEFINE_SHOW_ATTRIBUTE(amdgpu_debugfs_test_ib);
1391DEFINE_SHOW_ATTRIBUTE(amdgpu_debugfs_vm_info);
1392DEFINE_DEBUGFS_ATTRIBUTE(amdgpu_evict_vram_fops, amdgpu_debugfs_evict_vram,
1393			 NULL, "%lld\n");
1394DEFINE_DEBUGFS_ATTRIBUTE(amdgpu_evict_gtt_fops, amdgpu_debugfs_evict_gtt,
1395			 NULL, "%lld\n");
1396
1397static void amdgpu_ib_preempt_fences_swap(struct amdgpu_ring *ring,
1398					  struct dma_fence **fences)
1399{
1400	struct amdgpu_fence_driver *drv = &ring->fence_drv;
1401	uint32_t sync_seq, last_seq;
1402
1403	last_seq = atomic_read(&ring->fence_drv.last_seq);
1404	sync_seq = ring->fence_drv.sync_seq;
1405
1406	last_seq &= drv->num_fences_mask;
1407	sync_seq &= drv->num_fences_mask;
1408
1409	do {
1410		struct dma_fence *fence, **ptr;
1411
1412		++last_seq;
1413		last_seq &= drv->num_fences_mask;
1414		ptr = &drv->fences[last_seq];
1415
1416		fence = rcu_dereference_protected(*ptr, 1);
1417		RCU_INIT_POINTER(*ptr, NULL);
1418
1419		if (!fence)
1420			continue;
1421
1422		fences[last_seq] = fence;
1423
1424	} while (last_seq != sync_seq);
1425}
1426
1427static void amdgpu_ib_preempt_signal_fences(struct dma_fence **fences,
1428					    int length)
1429{
1430	int i;
1431	struct dma_fence *fence;
1432
1433	for (i = 0; i < length; i++) {
1434		fence = fences[i];
1435		if (!fence)
1436			continue;
1437		dma_fence_signal(fence);
1438		dma_fence_put(fence);
1439	}
1440}
1441
1442static void amdgpu_ib_preempt_job_recovery(struct drm_gpu_scheduler *sched)
1443{
1444	struct drm_sched_job *s_job;
1445	struct dma_fence *fence;
1446
1447	spin_lock(&sched->job_list_lock);
1448	list_for_each_entry(s_job, &sched->pending_list, list) {
1449		fence = sched->ops->run_job(s_job);
1450		dma_fence_put(fence);
1451	}
1452	spin_unlock(&sched->job_list_lock);
1453}
1454
1455static void amdgpu_ib_preempt_mark_partial_job(struct amdgpu_ring *ring)
1456{
1457	struct amdgpu_job *job;
1458	struct drm_sched_job *s_job, *tmp;
1459	uint32_t preempt_seq;
1460	struct dma_fence *fence, **ptr;
1461	struct amdgpu_fence_driver *drv = &ring->fence_drv;
1462	struct drm_gpu_scheduler *sched = &ring->sched;
1463	bool preempted = true;
1464
1465	if (ring->funcs->type != AMDGPU_RING_TYPE_GFX)
1466		return;
1467
1468	preempt_seq = le32_to_cpu(*(drv->cpu_addr + 2));
1469	if (preempt_seq <= atomic_read(&drv->last_seq)) {
1470		preempted = false;
1471		goto no_preempt;
1472	}
1473
1474	preempt_seq &= drv->num_fences_mask;
1475	ptr = &drv->fences[preempt_seq];
1476	fence = rcu_dereference_protected(*ptr, 1);
1477
1478no_preempt:
1479	spin_lock(&sched->job_list_lock);
1480	list_for_each_entry_safe(s_job, tmp, &sched->pending_list, list) {
1481		if (dma_fence_is_signaled(&s_job->s_fence->finished)) {
1482			/* remove job from ring_mirror_list */
1483			list_del_init(&s_job->list);
1484			sched->ops->free_job(s_job);
1485			continue;
1486		}
1487		job = to_amdgpu_job(s_job);
1488		if (preempted && (&job->hw_fence) == fence)
1489			/* mark the job as preempted */
1490			job->preemption_status |= AMDGPU_IB_PREEMPTED;
1491	}
1492	spin_unlock(&sched->job_list_lock);
1493}
1494
1495static int amdgpu_debugfs_ib_preempt(void *data, u64 val)
1496{
1497	int r, resched, length;
1498	struct amdgpu_ring *ring;
1499	struct dma_fence **fences = NULL;
1500	struct amdgpu_device *adev = (struct amdgpu_device *)data;
1501
1502	if (val >= AMDGPU_MAX_RINGS)
1503		return -EINVAL;
1504
1505	ring = adev->rings[val];
1506
1507	if (!ring || !ring->funcs->preempt_ib || !ring->sched.thread)
1508		return -EINVAL;
1509
1510	/* the last preemption failed */
1511	if (ring->trail_seq != le32_to_cpu(*ring->trail_fence_cpu_addr))
1512		return -EBUSY;
1513
1514	length = ring->fence_drv.num_fences_mask + 1;
1515	fences = kcalloc(length, sizeof(void *), GFP_KERNEL);
1516	if (!fences)
1517		return -ENOMEM;
1518
1519	/* Avoid accidently unparking the sched thread during GPU reset */
1520	r = down_read_killable(&adev->reset_sem);
1521	if (r)
1522		goto pro_end;
1523
1524	/* stop the scheduler */
1525	kthread_park(ring->sched.thread);
1526
1527	resched = ttm_bo_lock_delayed_workqueue(&adev->mman.bdev);
1528
1529	/* preempt the IB */
1530	r = amdgpu_ring_preempt_ib(ring);
1531	if (r) {
1532		DRM_WARN("failed to preempt ring %d\n", ring->idx);
1533		goto failure;
1534	}
1535
1536	amdgpu_fence_process(ring);
1537
1538	if (atomic_read(&ring->fence_drv.last_seq) !=
1539	    ring->fence_drv.sync_seq) {
1540		DRM_INFO("ring %d was preempted\n", ring->idx);
1541
1542		amdgpu_ib_preempt_mark_partial_job(ring);
1543
1544		/* swap out the old fences */
1545		amdgpu_ib_preempt_fences_swap(ring, fences);
1546
1547		amdgpu_fence_driver_force_completion(ring);
1548
1549		/* resubmit unfinished jobs */
1550		amdgpu_ib_preempt_job_recovery(&ring->sched);
1551
1552		/* wait for jobs finished */
1553		amdgpu_fence_wait_empty(ring);
1554
1555		/* signal the old fences */
1556		amdgpu_ib_preempt_signal_fences(fences, length);
1557	}
1558
1559failure:
1560	/* restart the scheduler */
1561	kthread_unpark(ring->sched.thread);
1562
1563	up_read(&adev->reset_sem);
1564
1565	ttm_bo_unlock_delayed_workqueue(&adev->mman.bdev, resched);
1566
1567pro_end:
1568	kfree(fences);
1569
1570	return r;
1571}
1572
1573static int amdgpu_debugfs_sclk_set(void *data, u64 val)
1574{
1575	int ret = 0;
1576	uint32_t max_freq, min_freq;
1577	struct amdgpu_device *adev = (struct amdgpu_device *)data;
1578
1579	if (amdgpu_sriov_vf(adev) && !amdgpu_sriov_is_pp_one_vf(adev))
1580		return -EINVAL;
1581
1582	ret = pm_runtime_get_sync(adev_to_drm(adev)->dev);
1583	if (ret < 0) {
1584		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
1585		return ret;
1586	}
1587
1588	if (is_support_sw_smu(adev)) {
1589		ret = smu_get_dpm_freq_range(&adev->smu, SMU_SCLK, &min_freq, &max_freq);
1590		if (ret || val > max_freq || val < min_freq)
1591			return -EINVAL;
1592		ret = smu_set_soft_freq_range(&adev->smu, SMU_SCLK, (uint32_t)val, (uint32_t)val);
1593	} else {
1594		return 0;
1595	}
1596
1597	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
1598	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
1599
1600	if (ret)
1601		return -EINVAL;
1602
1603	return 0;
1604}
1605
1606DEFINE_DEBUGFS_ATTRIBUTE(fops_ib_preempt, NULL,
1607			amdgpu_debugfs_ib_preempt, "%llu\n");
1608
1609DEFINE_DEBUGFS_ATTRIBUTE(fops_sclk_set, NULL,
1610			amdgpu_debugfs_sclk_set, "%llu\n");
1611
1612int amdgpu_debugfs_init(struct amdgpu_device *adev)
1613{
1614	struct dentry *root = adev_to_drm(adev)->primary->debugfs_root;
1615	struct dentry *ent;
1616	int r, i;
1617
1618	if (!debugfs_initialized())
1619		return 0;
1620
1621	ent = debugfs_create_file("amdgpu_preempt_ib", 0600, root, adev,
1622				  &fops_ib_preempt);
1623	if (IS_ERR(ent)) {
1624		DRM_ERROR("unable to create amdgpu_preempt_ib debugsfs file\n");
1625		return PTR_ERR(ent);
1626	}
1627
1628	ent = debugfs_create_file("amdgpu_force_sclk", 0200, root, adev,
1629				  &fops_sclk_set);
1630	if (IS_ERR(ent)) {
1631		DRM_ERROR("unable to create amdgpu_set_sclk debugsfs file\n");
1632		return PTR_ERR(ent);
1633	}
1634
1635	/* Register debugfs entries for amdgpu_ttm */
1636	amdgpu_ttm_debugfs_init(adev);
1637	amdgpu_debugfs_pm_init(adev);
1638	amdgpu_debugfs_sa_init(adev);
1639	amdgpu_debugfs_fence_init(adev);
1640	amdgpu_debugfs_gem_init(adev);
1641
1642	r = amdgpu_debugfs_regs_init(adev);
1643	if (r)
1644		DRM_ERROR("registering register debugfs failed (%d).\n", r);
1645
1646	amdgpu_debugfs_firmware_init(adev);
1647
1648#if defined(CONFIG_DRM_AMD_DC)
1649	if (amdgpu_device_has_dc_support(adev))
1650		dtn_debugfs_init(adev);
1651#endif
1652
1653	for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
1654		struct amdgpu_ring *ring = adev->rings[i];
1655
1656		if (!ring)
1657			continue;
1658
1659		amdgpu_debugfs_ring_init(adev, ring);
1660	}
1661
1662	amdgpu_ras_debugfs_create_all(adev);
1663	amdgpu_rap_debugfs_init(adev);
1664	amdgpu_securedisplay_debugfs_init(adev);
1665	amdgpu_fw_attestation_debugfs_init(adev);
1666
1667	debugfs_create_file("amdgpu_evict_vram", 0444, root, adev,
1668			    &amdgpu_evict_vram_fops);
1669	debugfs_create_file("amdgpu_evict_gtt", 0444, root, adev,
1670			    &amdgpu_evict_gtt_fops);
1671	debugfs_create_file("amdgpu_test_ib", 0444, root, adev,
1672			    &amdgpu_debugfs_test_ib_fops);
1673	debugfs_create_file("amdgpu_vm_info", 0444, root, adev,
1674			    &amdgpu_debugfs_vm_info_fops);
1675
1676	adev->debugfs_vbios_blob.data = adev->bios;
1677	adev->debugfs_vbios_blob.size = adev->bios_size;
1678	debugfs_create_blob("amdgpu_vbios", 0444, root,
1679			    &adev->debugfs_vbios_blob);
1680
1681	adev->debugfs_discovery_blob.data = adev->mman.discovery_bin;
1682	adev->debugfs_discovery_blob.size = adev->mman.discovery_tmr_size;
1683	debugfs_create_blob("amdgpu_discovery", 0444, root,
1684			    &adev->debugfs_discovery_blob);
1685
1686	return 0;
1687}
1688
1689#else
1690int amdgpu_debugfs_init(struct amdgpu_device *adev)
1691{
1692	return 0;
1693}
1694int amdgpu_debugfs_regs_init(struct amdgpu_device *adev)
1695{
1696	return 0;
1697}
1698#endif