// SPDX-License-Identifier: GPL-2.0+
/*
 * Copyright (C) 2023 Loongson Technology Corporation Limited
 */

#include <drm/drm_debugfs.h>

#include "lsdc_benchmark.h"
#include "lsdc_drv.h"
#include "lsdc_gem.h"
#include "lsdc_ttm.h"

typedef void (*lsdc_copy_proc_t)(struct lsdc_bo *src_bo,
				 struct lsdc_bo *dst_bo,
				 unsigned int size,
				 int n);

static void lsdc_copy_gtt_to_vram_cpu(struct lsdc_bo *src_bo,
				      struct lsdc_bo *dst_bo,
				      unsigned int size,
				      int n)
{
	lsdc_bo_kmap(src_bo);
	lsdc_bo_kmap(dst_bo);

	while (n--)
		memcpy_toio(dst_bo->kptr, src_bo->kptr, size);

	lsdc_bo_kunmap(src_bo);
	lsdc_bo_kunmap(dst_bo);
}

static void lsdc_copy_vram_to_gtt_cpu(struct lsdc_bo *src_bo,
				      struct lsdc_bo *dst_bo,
				      unsigned int size,
				      int n)
{
	lsdc_bo_kmap(src_bo);
	lsdc_bo_kmap(dst_bo);

	while (n--)
		memcpy_fromio(dst_bo->kptr, src_bo->kptr, size);

	lsdc_bo_kunmap(src_bo);
	lsdc_bo_kunmap(dst_bo);
}

static void lsdc_copy_gtt_to_gtt_cpu(struct lsdc_bo *src_bo,
				     struct lsdc_bo *dst_bo,
				     unsigned int size,
				     int n)
{
	lsdc_bo_kmap(src_bo);
	lsdc_bo_kmap(dst_bo);

	while (n--)
		memcpy(dst_bo->kptr, src_bo->kptr, size);

	lsdc_bo_kunmap(src_bo);
	lsdc_bo_kunmap(dst_bo);
}

static void lsdc_benchmark_copy(struct lsdc_device *ldev,
				unsigned int size,
				unsigned int n,
				u32 src_domain,
				u32 dst_domain,
				lsdc_copy_proc_t copy_proc,
				struct drm_printer *p)
{
	struct drm_device *ddev = &ldev->base;
	struct lsdc_bo *src_bo;
	struct lsdc_bo *dst_bo;
	unsigned long start_jiffies;
	unsigned long end_jiffies;
	unsigned int throughput;
	unsigned int time;

	src_bo = lsdc_bo_create_kernel_pinned(ddev, src_domain, size);
	dst_bo = lsdc_bo_create_kernel_pinned(ddev, dst_domain, size);

	start_jiffies = jiffies;

	copy_proc(src_bo, dst_bo, size, n);

	end_jiffies = jiffies;

	lsdc_bo_free_kernel_pinned(src_bo);
	lsdc_bo_free_kernel_pinned(dst_bo);

	time = jiffies_to_msecs(end_jiffies - start_jiffies);

	throughput = (n * (size >> 10)) / time;

	drm_printf(p,
		   "Copy bo of %uKiB %u times from %s to %s in %ums: %uMB/s\n",
		   size >> 10, n,
		   lsdc_domain_to_str(src_domain),
		   lsdc_domain_to_str(dst_domain),
		   time, throughput);
}

int lsdc_show_benchmark_copy(struct lsdc_device *ldev, struct drm_printer *p)
{
	unsigned int buffer_size = 1920 * 1080 * 4;
	unsigned int iteration = 60;

	lsdc_benchmark_copy(ldev,
			    buffer_size,
			    iteration,
			    LSDC_GEM_DOMAIN_GTT,
			    LSDC_GEM_DOMAIN_GTT,
			    lsdc_copy_gtt_to_gtt_cpu,
			    p);

	lsdc_benchmark_copy(ldev,
			    buffer_size,
			    iteration,
			    LSDC_GEM_DOMAIN_GTT,
			    LSDC_GEM_DOMAIN_VRAM,
			    lsdc_copy_gtt_to_vram_cpu,
			    p);

	lsdc_benchmark_copy(ldev,
			    buffer_size,
			    iteration,
			    LSDC_GEM_DOMAIN_VRAM,
			    LSDC_GEM_DOMAIN_GTT,
			    lsdc_copy_vram_to_gtt_cpu,
			    p);

	return 0;
}