#include <linux/err.h>

#include <drm/drm_debugfs.h>

#include "lsdc_benchmark.h"
#include "lsdc_drv.h"
#include "lsdc_gem.h"
#include "lsdc_ttm.h"
/*
 * Signature shared by the CPU copy routines in this file.
 *
 * @src_bo: buffer object the data is read from
 * @dst_bo: buffer object the data is written to
 * @size: number of bytes transferred by each copy
 * @n: number of times the copy is repeated
 */
typedef void (*lsdc_copy_proc_t)(struct lsdc_bo *src_bo,
struct lsdc_bo *dst_bo,
unsigned int size,
int n);
/*
 * Copy @size bytes from @src_bo to @dst_bo @n times with memcpy_toio(),
 * i.e. the destination mapping is written as I/O memory.
 *
 * @src_bo: source buffer object (a GTT buffer, going by the function name)
 * @dst_bo: destination buffer object (a VRAM buffer, going by the name)
 * @size: number of bytes transferred per iteration
 * @n: iteration count; values <= 0 perform no copy
 *
 * Both objects are mapped before the loop and unmapped afterwards. The
 * function does not verify where the buffers are actually placed.
 */
static void lsdc_copy_gtt_to_vram_cpu(struct lsdc_bo *src_bo,
				      struct lsdc_bo *dst_bo,
				      unsigned int size,
				      int n)
{
	lsdc_bo_kmap(src_bo);
	lsdc_bo_kmap(dst_bo);

	/*
	 * Never hand a NULL mapping to the copy routine.
	 * NOTE(review): assumes kptr stays NULL when lsdc_bo_kmap() fails -
	 * confirm against the mapping helper. The void signature leaves no
	 * way to report the failure to the caller.
	 */
	if (src_bo->kptr && dst_bo->kptr) {
		/* "> 0" keeps a negative count from looping until wrap-around */
		while (n-- > 0)
			memcpy_toio(dst_bo->kptr, src_bo->kptr, size);
	}

	lsdc_bo_kunmap(src_bo);
	lsdc_bo_kunmap(dst_bo);
}
/*
 * Copy @size bytes from @src_bo to @dst_bo @n times with memcpy_fromio(),
 * i.e. the source mapping is read as I/O memory.
 *
 * @src_bo: source buffer object (a VRAM buffer, going by the function name)
 * @dst_bo: destination buffer object (a GTT buffer, going by the name)
 * @size: number of bytes transferred per iteration
 * @n: iteration count; values <= 0 perform no copy
 *
 * Both objects are mapped before the loop and unmapped afterwards. The
 * function does not verify where the buffers are actually placed.
 */
static void lsdc_copy_vram_to_gtt_cpu(struct lsdc_bo *src_bo,
				      struct lsdc_bo *dst_bo,
				      unsigned int size,
				      int n)
{
	lsdc_bo_kmap(src_bo);
	lsdc_bo_kmap(dst_bo);

	/*
	 * Never hand a NULL mapping to the copy routine.
	 * NOTE(review): assumes kptr stays NULL when lsdc_bo_kmap() fails -
	 * confirm against the mapping helper. The void signature leaves no
	 * way to report the failure to the caller.
	 */
	if (src_bo->kptr && dst_bo->kptr) {
		/* "> 0" keeps a negative count from looping until wrap-around */
		while (n-- > 0)
			memcpy_fromio(dst_bo->kptr, src_bo->kptr, size);
	}

	lsdc_bo_kunmap(src_bo);
	lsdc_bo_kunmap(dst_bo);
}
/*
 * Copy @size bytes from @src_bo to @dst_bo @n times with plain memcpy().
 *
 * @src_bo: source buffer object (a GTT buffer, going by the function name)
 * @dst_bo: destination buffer object (a GTT buffer, going by the name)
 * @size: number of bytes transferred per iteration
 * @n: iteration count; values <= 0 perform no copy
 *
 * Both objects are mapped before the loop and unmapped afterwards. The
 * function does not verify where the buffers are actually placed.
 */
static void lsdc_copy_gtt_to_gtt_cpu(struct lsdc_bo *src_bo,
				     struct lsdc_bo *dst_bo,
				     unsigned int size,
				     int n)
{
	lsdc_bo_kmap(src_bo);
	lsdc_bo_kmap(dst_bo);

	/*
	 * Never hand a NULL mapping to memcpy().
	 * NOTE(review): assumes kptr stays NULL when lsdc_bo_kmap() fails -
	 * confirm against the mapping helper. The void signature leaves no
	 * way to report the failure to the caller.
	 */
	if (src_bo->kptr && dst_bo->kptr) {
		/* "> 0" keeps a negative count from looping until wrap-around */
		while (n-- > 0)
			memcpy(dst_bo->kptr, src_bo->kptr, size);
	}

	lsdc_bo_kunmap(src_bo);
	lsdc_bo_kunmap(dst_bo);
}
/*
 * Time @n CPU copies of a @size-byte buffer between two freshly created
 * buffer objects and print a one-line report to @p.
 *
 * @ldev: device whose embedded drm_device the buffers are created on
 * @size: size in bytes of each buffer object and of each copy
 * @n: number of times @copy_proc is asked to repeat the copy
 * @src_domain: memory domain requested for the source buffer
 * @dst_domain: memory domain requested for the destination buffer
 * @copy_proc: routine that performs the @n copies
 * @p: printer receiving the report (or a failure message)
 *
 * Only the @copy_proc call is timed, using jiffies. Both buffers are freed
 * before the result is printed. If either buffer cannot be created, a
 * failure line is printed instead and nothing is measured.
 */
static void lsdc_benchmark_copy(struct lsdc_device *ldev,
				unsigned int size,
				unsigned int n,
				u32 src_domain,
				u32 dst_domain,
				lsdc_copy_proc_t copy_proc,
				struct drm_printer *p)
{
	struct drm_device *ddev = &ldev->base;
	struct lsdc_bo *src_bo;
	struct lsdc_bo *dst_bo;
	unsigned long start_jiffies;
	unsigned long end_jiffies;
	unsigned int throughput;
	unsigned int time;

	/*
	 * The allocator is defined elsewhere; treat both NULL and an
	 * ERR_PTR()-encoded value as failure so neither is ever mapped,
	 * copied or freed.
	 */
	src_bo = lsdc_bo_create_kernel_pinned(ddev, src_domain, size);
	if (IS_ERR_OR_NULL(src_bo)) {
		drm_printf(p, "Failed to create %uKiB source bo in %s\n",
			   size >> 10, lsdc_domain_to_str(src_domain));
		return;
	}

	dst_bo = lsdc_bo_create_kernel_pinned(ddev, dst_domain, size);
	if (IS_ERR_OR_NULL(dst_bo)) {
		drm_printf(p, "Failed to create %uKiB destination bo in %s\n",
			   size >> 10, lsdc_domain_to_str(dst_domain));
		lsdc_bo_free_kernel_pinned(src_bo);
		return;
	}

	start_jiffies = jiffies;

	copy_proc(src_bo, dst_bo, size, n);

	end_jiffies = jiffies;

	lsdc_bo_free_kernel_pinned(src_bo);
	lsdc_bo_free_kernel_pinned(dst_bo);

	time = jiffies_to_msecs(end_jiffies - start_jiffies);

	/*
	 * KiB per millisecond, reported as (approximately) MB/s. A run that
	 * completes within a single jiffy yields 0 ms, so divide by at
	 * least 1 to avoid a division by zero.
	 */
	throughput = (n * (size >> 10)) / (time ? time : 1);

	drm_printf(p,
		   "Copy bo of %uKiB %u times from %s to %s in %ums: %uMB/s\n",
		   size >> 10, n,
		   lsdc_domain_to_str(src_domain),
		   lsdc_domain_to_str(dst_domain),
		   time, throughput);
}
/*
 * Run the three CPU copy benchmarks in sequence - GTT to GTT, GTT to VRAM
 * and VRAM to GTT - each printing its own report line to @p.
 *
 * @ldev: device to benchmark
 * @p: printer that receives the reports
 *
 * Every run copies a buffer of 1920 * 1080 * 4 bytes (presumably one
 * 1080p frame at 4 bytes per pixel) 60 times.
 *
 * Return: always 0.
 */
int lsdc_show_benchmark_copy(struct lsdc_device *ldev, struct drm_printer *p)
{
	const unsigned int bytes = 1920 * 1080 * 4;
	const unsigned int rounds = 60;

	/* system memory -> system memory */
	lsdc_benchmark_copy(ldev, bytes, rounds,
			    LSDC_GEM_DOMAIN_GTT, LSDC_GEM_DOMAIN_GTT,
			    lsdc_copy_gtt_to_gtt_cpu, p);

	/* system memory -> video memory */
	lsdc_benchmark_copy(ldev, bytes, rounds,
			    LSDC_GEM_DOMAIN_GTT, LSDC_GEM_DOMAIN_VRAM,
			    lsdc_copy_gtt_to_vram_cpu, p);

	/* video memory -> system memory */
	lsdc_benchmark_copy(ldev, bytes, rounds,
			    LSDC_GEM_DOMAIN_VRAM, LSDC_GEM_DOMAIN_GTT,
			    lsdc_copy_vram_to_gtt_cpu, p);

	return 0;
}