mirror of
https://github.com/torvalds/linux.git
synced 2026-05-03 05:52:38 -04:00
MMIO_REMAP (HDP flush page) exposes a hardware MMIO register window via a PCI BAR; there are no struct pages backing it (not normal RAM). But when one device shares memory with another through dma-buf, the receiver still expects a delivery route—a list of DMA-able chunks—called an sg_table. For the BAR window, we can’t (no pages!), so we instead create a one-entry list that points directly to the BAR’s physical bus address and tell DMA: “use this I/O span.” - A single, contiguous byte range on the PCI bus (start DMA address + length)). That’s why we map it with dma_map_resource() and set sg_set_page(..., NULL, ...). Perform DMA reads/writes directly to that range so we build an sg_table from a BAR physical span and map it with dma_map_resource(). This patch centralizes the BAR-I/O mapping in TTM and wires dma-buf to it: Add amdgpu_ttm_mmio_remap_alloc_sgt() / amdgpu_ttm_mmio_remap_free_sgt(). They walk the TTM resource via amdgpu_res_cursor, add the byte offset to adev->rmmio_remap.bus_addr, build a one-entry sg_table with sg_set_page(NULL, …), and map/unmap it with dma_map_resource(). In dma-buf map/unmap, if the BO is in AMDGPU_PL_MMIO_REMAP, call the new helpers. Single place for BAR-I/O handling: amdgpu_ttm.c in amdgpu_ttm_mmio_remap_alloc_sgt() and ..._free_sgt(). No struct pages: sg_set_page(sg, NULL, cur.size, 0); inside amdgpu_ttm_mmio_remap_alloc_sgt(). Minimal sg_table: sg_alloc_table(*sgt, 1, GFP_KERNEL); inside amdgpu_ttm_mmio_remap_alloc_sgt(). Hooked into dma-buf: amdgpu_dma_buf_map()/unmap() in amdgpu_dma_buf.c call these helpers for AMDGPU_PL_MMIO_REMAP. v2: squash in fix for set/get tiling Suggested-by: Christian König <christian.koenig@amd.com> Cc: Alex Deucher <alexander.deucher@amd.com> Signed-off-by: Srinivasan Shanmugam <srinivasan.shanmugam@amd.com> Reviewed-by: Alex Deucher <alexander.deucher@amd.com> Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
226 lines
8.1 KiB
C
226 lines
8.1 KiB
C
/*
|
|
* Copyright 2016 Advanced Micro Devices, Inc.
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
* to deal in the Software without restriction, including without limitation
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included in
|
|
* all copies or substantial portions of the Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
|
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
|
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
|
|
* OTHER DEALINGS IN THE SOFTWARE.
|
|
*
|
|
*/
|
|
|
|
#ifndef __AMDGPU_TTM_H__
|
|
#define __AMDGPU_TTM_H__
|
|
|
|
#include <linux/dma-direction.h>
|
|
#include <drm/gpu_scheduler.h>
|
|
#include <drm/ttm/ttm_placement.h>
|
|
#include "amdgpu_vram_mgr.h"
|
|
#include "amdgpu_hmm.h"
|
|
|
|
#define AMDGPU_PL_GDS (TTM_PL_PRIV + 0)
|
|
#define AMDGPU_PL_GWS (TTM_PL_PRIV + 1)
|
|
#define AMDGPU_PL_OA (TTM_PL_PRIV + 2)
|
|
#define AMDGPU_PL_PREEMPT (TTM_PL_PRIV + 3)
|
|
#define AMDGPU_PL_DOORBELL (TTM_PL_PRIV + 4)
|
|
#define AMDGPU_PL_MMIO_REMAP (TTM_PL_PRIV + 5)
|
|
#define __AMDGPU_PL_NUM (TTM_PL_PRIV + 6)
|
|
|
|
#define AMDGPU_GTT_MAX_TRANSFER_SIZE 512
|
|
#define AMDGPU_GTT_NUM_TRANSFER_WINDOWS 2
|
|
|
|
extern const struct attribute_group amdgpu_vram_mgr_attr_group;
|
|
extern const struct attribute_group amdgpu_gtt_mgr_attr_group;
|
|
|
|
struct hmm_range;
|
|
|
|
struct amdgpu_gtt_mgr {
|
|
struct ttm_resource_manager manager;
|
|
struct drm_mm mm;
|
|
spinlock_t lock;
|
|
};
|
|
|
|
struct amdgpu_mman {
|
|
struct ttm_device bdev;
|
|
struct ttm_pool *ttm_pools;
|
|
bool initialized;
|
|
void __iomem *aper_base_kaddr;
|
|
|
|
/* buffer handling */
|
|
const struct amdgpu_buffer_funcs *buffer_funcs;
|
|
struct amdgpu_ring *buffer_funcs_ring;
|
|
bool buffer_funcs_enabled;
|
|
|
|
struct mutex gtt_window_lock;
|
|
/* High priority scheduler entity for buffer moves */
|
|
struct drm_sched_entity high_pr;
|
|
/* Low priority scheduler entity for VRAM clearing */
|
|
struct drm_sched_entity low_pr;
|
|
|
|
struct amdgpu_vram_mgr vram_mgr;
|
|
struct amdgpu_gtt_mgr gtt_mgr;
|
|
struct ttm_resource_manager preempt_mgr;
|
|
|
|
uint64_t stolen_vga_size;
|
|
struct amdgpu_bo *stolen_vga_memory;
|
|
uint64_t stolen_extended_size;
|
|
struct amdgpu_bo *stolen_extended_memory;
|
|
bool keep_stolen_vga_memory;
|
|
|
|
struct amdgpu_bo *stolen_reserved_memory;
|
|
uint64_t stolen_reserved_offset;
|
|
uint64_t stolen_reserved_size;
|
|
|
|
/* fw reserved memory */
|
|
struct amdgpu_bo *fw_reserved_memory;
|
|
struct amdgpu_bo *fw_reserved_memory_extend;
|
|
|
|
/* firmware VRAM reservation */
|
|
u64 fw_vram_usage_start_offset;
|
|
u64 fw_vram_usage_size;
|
|
struct amdgpu_bo *fw_vram_usage_reserved_bo;
|
|
void *fw_vram_usage_va;
|
|
|
|
/* driver VRAM reservation */
|
|
u64 drv_vram_usage_start_offset;
|
|
u64 drv_vram_usage_size;
|
|
struct amdgpu_bo *drv_vram_usage_reserved_bo;
|
|
void *drv_vram_usage_va;
|
|
|
|
/* PAGE_SIZE'd BO for process memory r/w over SDMA. */
|
|
struct amdgpu_bo *sdma_access_bo;
|
|
void *sdma_access_ptr;
|
|
};
|
|
|
|
struct amdgpu_copy_mem {
|
|
struct ttm_buffer_object *bo;
|
|
struct ttm_resource *mem;
|
|
unsigned long offset;
|
|
};
|
|
|
|
#define AMDGPU_COPY_FLAGS_TMZ (1 << 0)
|
|
#define AMDGPU_COPY_FLAGS_READ_DECOMPRESSED (1 << 1)
|
|
#define AMDGPU_COPY_FLAGS_WRITE_COMPRESSED (1 << 2)
|
|
#define AMDGPU_COPY_FLAGS_MAX_COMPRESSED_SHIFT 3
|
|
#define AMDGPU_COPY_FLAGS_MAX_COMPRESSED_MASK 0x03
|
|
#define AMDGPU_COPY_FLAGS_NUMBER_TYPE_SHIFT 5
|
|
#define AMDGPU_COPY_FLAGS_NUMBER_TYPE_MASK 0x07
|
|
#define AMDGPU_COPY_FLAGS_DATA_FORMAT_SHIFT 8
|
|
#define AMDGPU_COPY_FLAGS_DATA_FORMAT_MASK 0x3f
|
|
#define AMDGPU_COPY_FLAGS_WRITE_COMPRESS_DISABLE_SHIFT 14
|
|
#define AMDGPU_COPY_FLAGS_WRITE_COMPRESS_DISABLE_MASK 0x1
|
|
|
|
#define AMDGPU_COPY_FLAGS_SET(field, value) \
|
|
(((__u32)(value) & AMDGPU_COPY_FLAGS_##field##_MASK) << AMDGPU_COPY_FLAGS_##field##_SHIFT)
|
|
#define AMDGPU_COPY_FLAGS_GET(value, field) \
|
|
(((__u32)(value) >> AMDGPU_COPY_FLAGS_##field##_SHIFT) & AMDGPU_COPY_FLAGS_##field##_MASK)
|
|
|
|
int amdgpu_gtt_mgr_init(struct amdgpu_device *adev, uint64_t gtt_size);
|
|
void amdgpu_gtt_mgr_fini(struct amdgpu_device *adev);
|
|
int amdgpu_preempt_mgr_init(struct amdgpu_device *adev);
|
|
void amdgpu_preempt_mgr_fini(struct amdgpu_device *adev);
|
|
int amdgpu_vram_mgr_init(struct amdgpu_device *adev);
|
|
void amdgpu_vram_mgr_fini(struct amdgpu_device *adev);
|
|
|
|
bool amdgpu_gtt_mgr_has_gart_addr(struct ttm_resource *mem);
|
|
void amdgpu_gtt_mgr_recover(struct amdgpu_gtt_mgr *mgr);
|
|
|
|
uint64_t amdgpu_preempt_mgr_usage(struct ttm_resource_manager *man);
|
|
|
|
u64 amdgpu_vram_mgr_bo_visible_size(struct amdgpu_bo *bo);
|
|
int amdgpu_vram_mgr_alloc_sgt(struct amdgpu_device *adev,
|
|
struct ttm_resource *mem,
|
|
u64 offset, u64 size,
|
|
struct device *dev,
|
|
enum dma_data_direction dir,
|
|
struct sg_table **sgt);
|
|
void amdgpu_vram_mgr_free_sgt(struct device *dev,
|
|
enum dma_data_direction dir,
|
|
struct sg_table *sgt);
|
|
uint64_t amdgpu_vram_mgr_vis_usage(struct amdgpu_vram_mgr *mgr);
|
|
int amdgpu_vram_mgr_reserve_range(struct amdgpu_vram_mgr *mgr,
|
|
uint64_t start, uint64_t size);
|
|
int amdgpu_vram_mgr_query_page_status(struct amdgpu_vram_mgr *mgr,
|
|
uint64_t start);
|
|
void amdgpu_vram_mgr_clear_reset_blocks(struct amdgpu_device *adev);
|
|
|
|
bool amdgpu_res_cpu_visible(struct amdgpu_device *adev,
|
|
struct ttm_resource *res);
|
|
|
|
int amdgpu_ttm_init(struct amdgpu_device *adev);
|
|
void amdgpu_ttm_fini(struct amdgpu_device *adev);
|
|
void amdgpu_ttm_set_buffer_funcs_status(struct amdgpu_device *adev,
|
|
bool enable);
|
|
int amdgpu_copy_buffer(struct amdgpu_ring *ring, uint64_t src_offset,
|
|
uint64_t dst_offset, uint32_t byte_count,
|
|
struct dma_resv *resv,
|
|
struct dma_fence **fence, bool direct_submit,
|
|
bool vm_needs_flush, uint32_t copy_flags);
|
|
int amdgpu_ttm_clear_buffer(struct amdgpu_bo *bo,
|
|
struct dma_resv *resv,
|
|
struct dma_fence **fence);
|
|
int amdgpu_fill_buffer(struct amdgpu_bo *bo,
|
|
uint32_t src_data,
|
|
struct dma_resv *resv,
|
|
struct dma_fence **fence,
|
|
bool delayed,
|
|
u64 k_job_id);
|
|
|
|
int amdgpu_ttm_alloc_gart(struct ttm_buffer_object *bo);
|
|
void amdgpu_ttm_recover_gart(struct ttm_buffer_object *tbo);
|
|
uint64_t amdgpu_ttm_domain_start(struct amdgpu_device *adev, uint32_t type);
|
|
|
|
#if IS_ENABLED(CONFIG_DRM_AMDGPU_USERPTR)
|
|
int amdgpu_ttm_tt_get_user_pages(struct amdgpu_bo *bo,
|
|
struct amdgpu_hmm_range *range);
|
|
#else
|
|
static inline int amdgpu_ttm_tt_get_user_pages(struct amdgpu_bo *bo,
|
|
struct amdgpu_hmm_range *range)
|
|
{
|
|
return -EPERM;
|
|
}
|
|
#endif
|
|
|
|
void amdgpu_ttm_tt_set_user_pages(struct ttm_tt *ttm, struct amdgpu_hmm_range *range);
|
|
int amdgpu_ttm_tt_get_userptr(const struct ttm_buffer_object *tbo,
|
|
uint64_t *user_addr);
|
|
int amdgpu_ttm_tt_set_userptr(struct ttm_buffer_object *bo,
|
|
uint64_t addr, uint32_t flags);
|
|
bool amdgpu_ttm_tt_has_userptr(struct ttm_tt *ttm);
|
|
struct mm_struct *amdgpu_ttm_tt_get_usermm(struct ttm_tt *ttm);
|
|
bool amdgpu_ttm_tt_affect_userptr(struct ttm_tt *ttm, unsigned long start,
|
|
unsigned long end, unsigned long *userptr);
|
|
bool amdgpu_ttm_tt_userptr_invalidated(struct ttm_tt *ttm,
|
|
int *last_invalidated);
|
|
bool amdgpu_ttm_tt_is_userptr(struct ttm_tt *ttm);
|
|
bool amdgpu_ttm_tt_is_readonly(struct ttm_tt *ttm);
|
|
uint64_t amdgpu_ttm_tt_pde_flags(struct ttm_tt *ttm, struct ttm_resource *mem);
|
|
uint64_t amdgpu_ttm_tt_pte_flags(struct amdgpu_device *adev, struct ttm_tt *ttm,
|
|
struct ttm_resource *mem);
|
|
int amdgpu_ttm_evict_resources(struct amdgpu_device *adev, int mem_type);
|
|
|
|
void amdgpu_ttm_debugfs_init(struct amdgpu_device *adev);
|
|
|
|
int amdgpu_ttm_mmio_remap_alloc_sgt(struct amdgpu_device *adev,
|
|
struct ttm_resource *res,
|
|
struct device *dev,
|
|
enum dma_data_direction dir,
|
|
struct sg_table **sgt);
|
|
void amdgpu_ttm_mmio_remap_free_sgt(struct device *dev,
|
|
enum dma_data_direction dir,
|
|
struct sg_table *sgt);
|
|
|
|
#endif
|