Linux kernel mirror (for testing) git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
kernel os linux

drm/amdgpu: group BOs by log2 of the size on the LRU v2

This allows us to have small BOs on the LRU before big ones.

v2: fix of by one and list corruption bug

Signed-off-by: Christian König <christian.koenig@amd.com>
Reviewed-by: Alex Deucher <alexander.deucher@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>

authored by

Christian König and committed by
Alex Deucher
29b3259a 1359d6e4

+70 -2
+11
drivers/gpu/drm/amd/amdgpu/amdgpu.h
··· 393 393 /* 394 394 * TTM. 395 395 */ 396 + 397 + #define AMDGPU_TTM_LRU_SIZE 20 398 + 399 + struct amdgpu_mman_lru { 400 + struct list_head *lru[TTM_NUM_MEM_TYPES]; 401 + struct list_head *swap_lru; 402 + }; 403 + 396 404 struct amdgpu_mman { 397 405 struct ttm_bo_global_ref bo_global_ref; 398 406 struct drm_global_reference mem_global_ref; ··· 418 410 struct amdgpu_ring *buffer_funcs_ring; 419 411 /* Scheduler entity for buffer moves */ 420 412 struct amd_sched_entity entity; 413 + 414 + /* custom LRU management */ 415 + struct amdgpu_mman_lru log2_size[AMDGPU_TTM_LRU_SIZE]; 421 416 }; 422 417 423 418 int amdgpu_copy_buffer(struct amdgpu_ring *ring,
+59 -2
drivers/gpu/drm/amd/amdgpu/amdgpu_ttm.c
··· 909 909 return flags; 910 910 } 911 911 912 + static void amdgpu_ttm_lru_removal(struct ttm_buffer_object *tbo) 913 + { 914 + struct amdgpu_device *adev = amdgpu_get_adev(tbo->bdev); 915 + unsigned i, j; 916 + 917 + for (i = 0; i < AMDGPU_TTM_LRU_SIZE; ++i) { 918 + struct amdgpu_mman_lru *lru = &adev->mman.log2_size[i]; 919 + 920 + for (j = 0; j < TTM_NUM_MEM_TYPES; ++j) 921 + if (&tbo->lru == lru->lru[j]) 922 + lru->lru[j] = tbo->lru.prev; 923 + 924 + if (&tbo->swap == lru->swap_lru) 925 + lru->swap_lru = tbo->swap.prev; 926 + } 927 + } 928 + 929 + static struct amdgpu_mman_lru *amdgpu_ttm_lru(struct ttm_buffer_object *tbo) 930 + { 931 + struct amdgpu_device *adev = amdgpu_get_adev(tbo->bdev); 932 + unsigned log2_size = min(ilog2(tbo->num_pages), 933 + AMDGPU_TTM_LRU_SIZE - 1); 934 + 935 + return &adev->mman.log2_size[log2_size]; 936 + } 937 + 938 + static struct list_head *amdgpu_ttm_lru_tail(struct ttm_buffer_object *tbo) 939 + { 940 + struct amdgpu_mman_lru *lru = amdgpu_ttm_lru(tbo); 941 + struct list_head *res = lru->lru[tbo->mem.mem_type]; 942 + 943 + lru->lru[tbo->mem.mem_type] = &tbo->lru; 944 + 945 + return res; 946 + } 947 + 948 + static struct list_head *amdgpu_ttm_swap_lru_tail(struct ttm_buffer_object *tbo) 949 + { 950 + struct amdgpu_mman_lru *lru = amdgpu_ttm_lru(tbo); 951 + struct list_head *res = lru->swap_lru; 952 + 953 + lru->swap_lru = &tbo->swap; 954 + 955 + return res; 956 + } 957 + 912 958 static struct ttm_bo_driver amdgpu_bo_driver = { 913 959 .ttm_tt_create = &amdgpu_ttm_tt_create, 914 960 .ttm_tt_populate = &amdgpu_ttm_tt_populate, ··· 968 922 .fault_reserve_notify = &amdgpu_bo_fault_reserve_notify, 969 923 .io_mem_reserve = &amdgpu_ttm_io_mem_reserve, 970 924 .io_mem_free = &amdgpu_ttm_io_mem_free, 971 - .lru_tail = &ttm_bo_default_lru_tail, 972 - .swap_lru_tail = &ttm_bo_default_swap_lru_tail, 925 + .lru_removal = &amdgpu_ttm_lru_removal, 926 + .lru_tail = &amdgpu_ttm_lru_tail, 927 + .swap_lru_tail = &amdgpu_ttm_swap_lru_tail, 973 928 }; 974 929 975 930 int amdgpu_ttm_init(struct amdgpu_device *adev) 976 931 { 932 + unsigned i, j; 977 933 int r; 978 934 979 935 r = amdgpu_ttm_global_init(adev); ··· 993 945 DRM_ERROR("failed initializing buffer object driver(%d).\n", r); 994 946 return r; 995 947 } 948 + 949 + for (i = 0; i < AMDGPU_TTM_LRU_SIZE; ++i) { 950 + struct amdgpu_mman_lru *lru = &adev->mman.log2_size[i]; 951 + 952 + for (j = 0; j < TTM_NUM_MEM_TYPES; ++j) 953 + lru->lru[j] = &adev->mman.bdev.man[j].lru; 954 + lru->swap_lru = &adev->mman.bdev.glob->swap_lru; 955 + } 956 + 996 957 adev->mman.initialized = true; 997 958 r = ttm_bo_init_mm(&adev->mman.bdev, TTM_PL_VRAM, 998 959 adev->mc.real_vram_size >> PAGE_SHIFT);