ARM: mali400: r5p2_rel0: add sc8830 platform codes

author Joonyoung Shim <jy0922.shim@samsung.com>

Tue, 10 May 2016 06:49:03 +0000 (15:49 +0900)

committer Joonyoung Shim <jy0922.shim@samsung.com>

Mon, 23 May 2016 06:41:28 +0000 (15:41 +0900)
author Joonyoung Shim <jy0922.shim@samsung.com>
Tue, 10 May 2016 06:49:03 +0000 (15:49 +0900)
committer Joonyoung Shim <jy0922.shim@samsung.com>
Mon, 23 May 2016 06:41:28 +0000 (15:41 +0900)
diff --git a/drivers/gpu/arm/mali400/r5p2_rel0/Kbuild b/drivers/gpu/arm/mali400/r5p2_rel0/Kbuild

index ab2a41e..81b4d85 100644 (file)
--- a/drivers/gpu/arm/mali400/r5p2_rel0/Kbuild
+++ b/drivers/gpu/arm/mali400/r5p2_rel0/Kbuild
@@ -21,6 +21,10 @@ MALI_PP_SCHEDULER_KEEP_SUB_JOB_STARTS_ALIGNED ?= 0
  MALI_PP_SCHEDULER_FORCE_NO_JOB_OVERLAP_BETWEEN_APPS ?= 0
  MALI_UPPER_HALF_SCHEDULING ?= 1
  MALI_ENABLE_CPU_CYCLES ?= 0
+MALI_PLATFORM ?= sc8830
+MALI_FAKE_PLATFORM_DEVICE ?= 1
+DFS_ONE_STEP_SCALE_DOWN ?= 1
+MATCH_DFS_TO_LOWER_FREQ ?= 1
  
  # For customer releases the Linux Device Drivers will be provided as ARM proprietary and GPL releases:
  # The ARM proprietary product will only include the license/proprietary directory
@@ -118,6 +122,7 @@ mali-y += \
         linux/mali_pmu_power_up_down.o \
         __malidrv_build_info.o
  
+MALI_PLATFORM_FILES = platform/$(MALI_PLATFORM)/mali_platform.c
  ifneq ($(MALI_PLATFORM_FILES),)
         mali-y += $(MALI_PLATFORM_FILES:.c=.o)
  endif
@@ -143,6 +148,8 @@ ccflags-y += $(EXTRA_DEFINES)
  
  # Set up our defines, which will be passed to gcc
  ccflags-y += -DSPRD_GPU_BOOST
+ccflags-y += -DSPRD_DFS_ONE_STEP_SCALE_DOWN=$(DFS_ONE_STEP_SCALE_DOWN)
+ccflags-y += -DSPRD_MATCH_DFS_TO_LOWER_FREQ=$(MATCH_DFS_TO_LOWER_FREQ)
  
  ccflags-y += -DMALI_PP_SCHEDULER_FORCE_NO_JOB_OVERLAP=$(MALI_PP_SCHEDULER_FORCE_NO_JOB_OVERLAP)
  ccflags-y += -DMALI_PP_SCHEDULER_KEEP_SUB_JOB_STARTS_ALIGNED=$(MALI_PP_SCHEDULER_KEEP_SUB_JOB_STARTS_ALIGNED)
@@ -151,6 +158,7 @@ ccflags-y += -DMALI_STATE_TRACKING=1
  ccflags-y += -DMALI_OS_MEMORY_KERNEL_BUFFER_SIZE_IN_MB=$(OS_MEMORY_KERNEL_BUFFER_SIZE_IN_MB)
  ccflags-y += -DUSING_GPU_UTILIZATION=$(USING_GPU_UTILIZATION)
  ccflags-y += -DMALI_ENABLE_CPU_CYCLES=$(MALI_ENABLE_CPU_CYCLES)
+ccflags-y += -DMALI_FAKE_PLATFORM_DEVICE=$(MALI_FAKE_PLATFORM_DEVICE)
  
  ifeq ($(MALI_UPPER_HALF_SCHEDULING),1)
         ccflags-y += -DMALI_UPPER_HALF_SCHEDULING
@@ -207,7 +215,7 @@ VERSION_STRINGS += BUILD=debug
  else
  VERSION_STRINGS += BUILD=release
  endif
-VERSION_STRINGS += TARGET_PLATFORM=$(TARGET_PLATFORM)
+VERSION_STRINGS += TARGET_PLATFORM=$(MALI_PLATFORM)
  VERSION_STRINGS += MALI_PLATFORM=$(MALI_PLATFORM)
  VERSION_STRINGS += KDIR=$(KDIR)
  VERSION_STRINGS += OS_MEMORY_KERNEL_BUFFER_SIZE_IN_MB=$(OS_MEMORY_KERNEL_BUFFER_SIZE_IN_MB)
diff --git a/drivers/gpu/arm/mali400/r5p2_rel0/platform/sc8830/base.h b/drivers/gpu/arm/mali400/r5p2_rel0/platform/sc8830/base.h

new file mode 100644 (file)

index 0000000..b7f2f80
--- /dev/null
+++ b/drivers/gpu/arm/mali400/r5p2_rel0/platform/sc8830/base.h
@@ -0,0 +1,22 @@
+/*
+ * Copyright (C) 2010-2011 ARM Limited. All rights reserved.
+ * 
+ * This program is free software and is provided to you under the terms of the
+ * GNU General Public License version 2 as published by the Free Software
+ * Foundation, and any use by you of this program is subject to the terms of
+ * such GNU licence.
+ * 
+ * A copy of the licence is included with the program, and can also be obtained
+ * from Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
+ * MA  02110-1301, USA.
+ */
+
+#ifndef __ARCH_BASE_H__
+#define __ARCH_BASE_H__
+
+#define ARCH_MALI_MEMORY_BASE_DEFAULT      (4 * 1024 * 1024UL)
+#define ARCH_MALI_MEMORY_SIZE_DEFAULT      (1024 * 1024 * 1024UL)
+
+#define MALI400_L2_MAX_READS_DEFAULT        0x1C
+
+#endif
diff --git a/drivers/gpu/arm/mali400/r5p2_rel0/platform/sc8830/mali_platform.c b/drivers/gpu/arm/mali400/r5p2_rel0/platform/sc8830/mali_platform.c

new file mode 100644 (file)

index 0000000..8b4cb77
--- /dev/null
+++ b/drivers/gpu/arm/mali400/r5p2_rel0/platform/sc8830/mali_platform.c
@@ -0,0 +1,730 @@
+/*
+ * Copyright (C) 2010-2011 ARM Limited. All rights reserved.
+ *
+ * This program is free software and is provided to you under the terms of the
+ * GNU General Public License version 2 as published by the Free Software
+ * Foundation, and any use by you of this program is subject to the terms of
+ * such GNU licence.
+ *
+ * A copy of the licence is included with the program, and can also be obtained
+ * from Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
+ * MA  02110-1301, USA.
+ */
+
+/**
+ * @file mali_platform.c
+ * Platform specific Mali driver functions for a default platform
+ */
+
+#include <linux/version.h>
+#include <linux/clk.h>
+#include <linux/delay.h>
+#include <linux/dma-mapping.h>
+#ifdef CONFIG_SYSTEM_LOAD_ANALYZER
+#include <linux/load_analyzer.h>
+#endif
+#include <linux/mali/mali_utgard.h>
+#ifdef CONFIG_MALI_DT
+#include <linux/of.h>
+#endif
+#include <linux/platform_device.h>
+#include <linux/pm.h>
+#ifdef CONFIG_PM_RUNTIME
+#include <linux/pm_runtime.h>
+#endif
+#include <linux/semaphore.h>
+#include <linux/vmalloc.h>
+#include <linux/workqueue.h>
+
+#ifdef CONFIG_64BIT
+#include <soc/sprd/irqs.h>
+#include <soc/sprd/sci.h>
+#include <soc/sprd/sci_glb_regs.h>
+#else
+#include <soc/sprd/sci.h>
+#include <soc/sprd/sci_glb_regs.h>
+#endif
+
+#include "base.h"
+#include "mali_executor.h"
+#include "mali_kernel_common.h"
+#include "mali_kernel_linux.h"
+#include "mali_pm.h"
+
+#define GPU_GLITCH_FREE_DFS    0
+
+#define UP_THRESHOLD           9/10
+#define DOWN_THRESHOLD         5/10
+
+#define __SPRD_GPU_TIMEOUT      (3*1000)
+
+struct gpu_freq_info {
+       struct clk *clk_src;
+       int freq;
+       int div;
+       int up_threshold;
+};
+
+struct gpu_dfs_context {
+       int gpu_clock_on;
+       int gpu_power_on;
+
+       struct clk *gpu_clock;
+       struct clk *gpu_clock_i;
+       struct clk **gpu_clk_src;
+       int gpu_clk_num;
+
+       int cur_load;
+
+       struct gpu_freq_info *freq_list;
+       int freq_list_len;
+
+       const struct gpu_freq_info *freq_cur;
+       const struct gpu_freq_info *freq_next;
+
+       const struct gpu_freq_info *freq_min;
+       const struct gpu_freq_info *freq_max;
+       const struct gpu_freq_info *freq_default;
+       const struct gpu_freq_info *freq_9;
+       const struct gpu_freq_info *freq_8;
+       const struct gpu_freq_info *freq_7;
+       const struct gpu_freq_info *freq_5;
+       const struct gpu_freq_info *freq_range_max;
+       const struct gpu_freq_info *freq_range_min;
+
+       struct workqueue_struct *gpu_dfs_workqueue;
+       struct semaphore* sem;
+};
+
+extern int gpu_boost_level;
+extern int gpu_boost_sf_level;
+
+extern int gpu_freq_cur;
+extern int gpu_freq_min_limit;
+extern int gpu_freq_max_limit;
+extern char* gpu_freq_list;
+
+extern _mali_osk_errcode_t mali_executor_initialize(void);
+extern void mali_executor_lock(void);
+extern void mali_executor_unlock(void);
+
+static void gpu_dfs_func(struct work_struct *work);
+static void mali_platform_utilization(struct mali_gpu_utilization_data *data);
+
+static DECLARE_WORK(gpu_dfs_work, &gpu_dfs_func);
+
+DEFINE_SEMAPHORE(gpu_dfs_sem);
+
+static struct gpu_dfs_context gpu_dfs_ctx = {
+       .sem = &gpu_dfs_sem,
+};
+
+struct mali_gpu_device_data mali_gpu_data = {
+       .shared_mem_size = ARCH_MALI_MEMORY_SIZE_DEFAULT,
+       .control_interval = 100,
+       .utilization_callback = mali_platform_utilization,
+       .get_clock_info = NULL,
+       .get_freq = NULL,
+       .set_freq = NULL,
+};
+
+static void gpu_freq_list_show(char *buf)
+{
+       struct gpu_dfs_context *ctx = &gpu_dfs_ctx;
+       int i;
+
+       for (i = 0; i < ctx->freq_list_len; i++)
+               buf += sprintf(buf, "%2d  %6d\n", i, ctx->freq_list[i].freq);
+}
+
+static int sprd_gpu_domain_state(void)
+{
+       /* FIXME: rtc domain */
+       unsigned int power_state1, power_state2, power_state3;
+       unsigned long timeout = jiffies + msecs_to_jiffies(__SPRD_GPU_TIMEOUT);
+
+       do {
+               cpu_relax();
+               power_state1 = sci_glb_read(REG_PMU_APB_PWR_STATUS0_DBG,
+                                               BITS_PD_GPU_TOP_STATE(-1));
+               power_state2 = sci_glb_read(REG_PMU_APB_PWR_STATUS0_DBG,
+                                               BITS_PD_GPU_TOP_STATE(-1));
+               power_state3 = sci_glb_read(REG_PMU_APB_PWR_STATUS0_DBG,
+                                               BITS_PD_GPU_TOP_STATE(-1));
+               if (time_after(jiffies, timeout)) {
+                       pr_emerg("gpu domain not ready, state %08x %08x\n",
+                               sci_glb_read(REG_PMU_APB_PWR_STATUS0_DBG, -1),
+                               sci_glb_read(REG_AON_APB_APB_EB0, -1));
+               }
+       } while ((power_state1 != power_state2) ||
+                       (power_state2 != power_state3));
+
+       return (int)(power_state1);
+}
+
+static void sprd_gpu_domain_wait_for_ready(void)
+{
+       int timeout_count = 2000;
+
+       while (sprd_gpu_domain_state() != BITS_PD_GPU_TOP_STATE(0)) {
+               if (!timeout_count) {
+                       pr_emerg(
+                       "gpu domain not ready too long time, state %08x %08x\n",
+                               sci_glb_read(REG_PMU_APB_PWR_STATUS0_DBG, -1),
+                               sci_glb_read(REG_AON_APB_APB_EB0, -1));
+                       return;
+               }
+               udelay(50);
+               timeout_count--;
+       }
+}
+
+static inline void mali_set_div(int clock_div)
+{
+       sci_glb_write(REG_GPU_APB_APB_CLK_CTRL, BITS_CLK_GPU_DIV(clock_div - 1),
+                       BITS_CLK_GPU_DIV(3));
+}
+
+static inline void mali_power_on(void)
+{
+       sci_glb_clr(REG_PMU_APB_PD_GPU_TOP_CFG, BIT_PD_GPU_TOP_FORCE_SHUTDOWN);
+       udelay(100);
+       mali_executor_lock();
+       gpu_dfs_ctx.gpu_power_on = 1;
+       mali_executor_unlock();
+}
+
+static inline void mali_power_off(void)
+{
+       mali_executor_lock();
+       gpu_dfs_ctx.gpu_power_on = 0;
+       mali_executor_unlock();
+       sci_glb_set(REG_PMU_APB_PD_GPU_TOP_CFG, BIT_PD_GPU_TOP_FORCE_SHUTDOWN);
+}
+
+static inline void mali_clock_on(void)
+{
+       struct gpu_dfs_context *ctx = &gpu_dfs_ctx;
+       int i;
+
+       for (i = 0; i < ctx->gpu_clk_num; i++) {
+#ifdef CONFIG_COMMON_CLK
+               clk_prepare_enable(ctx->gpu_clk_src[i]);
+#else
+               clk_enable(ctx->gpu_clk_src[i]);
+#endif
+       }
+
+#ifdef CONFIG_COMMON_CLK
+       clk_prepare_enable(ctx->gpu_clock_i);
+#else
+       clk_enable(ctx->gpu_clock_i);
+#endif
+       sprd_gpu_domain_wait_for_ready();
+
+       clk_set_parent(ctx->gpu_clock, ctx->freq_default->clk_src);
+
+       MALI_DEBUG_ASSERT(ctx->freq_cur);
+       clk_set_parent(ctx->gpu_clock, ctx->freq_cur->clk_src);
+       mali_set_div(ctx->freq_cur->div);
+
+#ifdef CONFIG_COMMON_CLK
+       clk_prepare_enable(ctx->gpu_clock);
+#else
+       clk_enable(ctx->gpu_clock);
+#endif
+       udelay(100);
+
+       mali_executor_lock();
+       ctx->gpu_clock_on = 1;
+       mali_executor_unlock();
+
+       gpu_freq_cur = ctx->freq_cur->freq;
+#ifdef CONFIG_SYSTEM_LOAD_ANALYZER
+       store_external_load_factor(GPU_FREQ, gpu_freq_cur);
+#endif
+}
+
+static inline void mali_clock_off(void)
+{
+       struct gpu_dfs_context *ctx = &gpu_dfs_ctx;
+       int i;
+
+       gpu_freq_cur = 0;
+#ifdef CONFIG_SYSTEM_LOAD_ANALYZER
+       store_external_load_factor(GPU_UTILIZATION, 0);
+       store_external_load_factor(GPU_FREQ, gpu_freq_cur);
+#endif
+
+       mali_executor_lock();
+       ctx->gpu_clock_on = 0;
+       mali_executor_unlock();
+
+#ifdef CONFIG_COMMON_CLK
+       clk_disable_unprepare(ctx->gpu_clock);
+       clk_disable_unprepare(ctx->gpu_clock_i);
+#else
+       clk_disable(ctx->gpu_clock);
+       clk_disable(ctx->gpu_clock_i);
+#endif
+
+       for (i = 0; i < ctx->gpu_clk_num; i++) {
+#ifdef CONFIG_COMMON_CLK
+               clk_disable_unprepare(ctx->gpu_clk_src[i]);
+#else
+               clk_disable(ctx->gpu_clk_src[i]);
+#endif
+       }
+}
+
+int mali_platform_device_init(struct platform_device *pdev)
+{
+#ifndef CONFIG_SCX35L64BIT_FPGA /* not use fpga */
+       struct gpu_dfs_context *ctx = &gpu_dfs_ctx;
+       int i, err = -1;
+#ifdef CONFIG_ARCH_SCX30G
+       int clksrc_300m_idx = -1;
+#endif
+#ifdef CONFIG_MALI_DT
+       extern struct of_device_id base_dt_ids[];
+       struct device_node *np;
+       int clk_cnt;
+
+       np = of_find_matching_node(NULL, base_dt_ids);
+       if (!np)
+               return err;
+
+       ctx->gpu_clock_i = of_clk_get(np, 0);
+       MALI_DEBUG_ASSERT(ctx->gpu_clock_i);
+       ctx->gpu_clock = of_clk_get(np, 1);
+       MALI_DEBUG_ASSERT(ctx->gpu_clock);
+
+       clk_cnt = of_property_count_strings(np, "clock-names");
+       ctx->gpu_clk_num = clk_cnt - 2;
+       ctx->gpu_clk_src = vmalloc(sizeof(struct clk *) * ctx->gpu_clk_num);
+       MALI_DEBUG_ASSERT(ctx->gpu_clk_src);
+
+       for (i = 0; i < ctx->gpu_clk_num; i++) {
+               const char *clk_name;
+
+               of_property_read_string_index(np, "clock-names", i + 2,
+                                               &clk_name);
+               ctx->gpu_clk_src[i] = of_clk_get_by_name(np, clk_name);
+               MALI_DEBUG_ASSERT(ctx->gpu_clk_src[i]);
+#ifdef CONFIG_ARCH_SCX30G
+               if (!strcmp(clk_name, "clk_300m_gpu_gate"))
+                       clksrc_300m_idx = i;
+#endif
+       }
+
+       of_property_read_u32(np, "freq-list-len", &ctx->freq_list_len);
+       ctx->freq_list =
+               vmalloc(sizeof(struct gpu_freq_info) * ctx->freq_list_len);
+       MALI_DEBUG_ASSERT(ctx->freq_list);
+
+       for (i = 0; i < ctx->freq_list_len; i++) {
+               int clk;
+
+               of_property_read_u32_index(np, "freq-lists", 3 * i + 1, &clk);
+               ctx->freq_list[i].clk_src = ctx->gpu_clk_src[clk - 2];
+               MALI_DEBUG_ASSERT(ctx->freq_list[i].clk_src);
+               of_property_read_u32_index(np, "freq-lists", 3 * i,
+                                               &ctx->freq_list[i].freq);
+               of_property_read_u32_index(np, "freq-lists", 3 * i + 2,
+                                               &ctx->freq_list[i].div);
+               ctx->freq_list[i].up_threshold =
+                                       ctx->freq_list[i].freq * UP_THRESHOLD;
+       }
+
+       of_property_read_u32(np, "freq-default", &i);
+       ctx->freq_default = &ctx->freq_list[i];
+       MALI_DEBUG_ASSERT(ctx->freq_default);
+
+       of_property_read_u32(np, "freq-9", &i);
+       ctx->freq_9 = &ctx->freq_list[i];
+       MALI_DEBUG_ASSERT(ctx->freq_9);
+
+       of_property_read_u32(np, "freq-8", &i);
+       ctx->freq_8 = &ctx->freq_list[i];
+       MALI_DEBUG_ASSERT(ctx->freq_8);
+
+       of_property_read_u32(np, "freq-7", &i);
+       ctx->freq_7 = &ctx->freq_list[i];
+       MALI_DEBUG_ASSERT(ctx->freq_7);
+
+       of_property_read_u32(np, "freq-5", &i);
+       ctx->freq_5 = &ctx->freq_list[i];
+       MALI_DEBUG_ASSERT(ctx->freq_5);
+
+       of_property_read_u32(np, "freq-range-max", &i);
+       ctx->freq_range_max = &ctx->freq_list[i];
+       MALI_DEBUG_ASSERT(ctx->freq_range_max);
+
+       of_property_read_u32(np, "freq-range-min", &i);
+       ctx->freq_range_min = &ctx->freq_list[i];
+       MALI_DEBUG_ASSERT(ctx->freq_range_min);
+
+       of_node_put(np);
+
+       ctx->freq_max = ctx->freq_range_max;
+       ctx->freq_min = ctx->freq_range_min;
+       ctx->freq_cur = ctx->freq_default;
+#endif
+
+       sci_glb_write(REG_PMU_APB_PD_GPU_TOP_CFG,
+                       BITS_PD_GPU_TOP_PWR_ON_DLY(1), 0xff0000);
+       sci_glb_write(REG_PMU_APB_PD_GPU_TOP_CFG,
+                       BITS_PD_GPU_TOP_PWR_ON_SEQ_DLY(1), 0xff00);
+       sci_glb_write(REG_PMU_APB_PD_GPU_TOP_CFG,
+                       BITS_PD_GPU_TOP_ISO_ON_DLY(1), 0xff);
+
+       mali_power_on();
+
+       mali_clock_on();
+#ifdef CONFIG_ARCH_SCX30G
+       /* CPU could disable MPLL, so should increase MPLL refcnt */
+       if (clksrc_300m_idx != -1) {
+#ifdef CONFIG_COMMON_CLK
+               clk_prepare_enable(ctx->gpu_clk_src[clksrc_300m_idx]);
+#else
+               clk_enable(ctx->gpu_clk_src[clksrc_300m_idx]);
+#endif
+       }
+#endif
+
+       ctx->gpu_dfs_workqueue = create_singlethread_workqueue("gpu_dfs");
+
+       err = platform_device_add_data(pdev, &mali_gpu_data,
+                                       sizeof(mali_gpu_data));
+       if (!err) {
+#ifdef CONFIG_PM_RUNTIME
+#if (LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 37))
+               pm_runtime_set_autosuspend_delay(&(pdev->dev), 50);
+               pm_runtime_use_autosuspend(&(pdev->dev));
+#endif
+               pm_runtime_enable(&(pdev->dev));
+#endif
+       }
+
+       gpu_freq_list = vmalloc(sizeof(char) * 256);
+       gpu_freq_list_show(gpu_freq_list);
+
+       return err;
+#else /* use fpga */
+#ifdef CONFIG_MALI_DT
+       if (!of_find_matching_node(NULL, gpu_ids))
+               return -1;
+#endif
+       sci_glb_clr(REG_PMU_APB_PD_GPU_TOP_CFG, BIT_PD_GPU_TOP_FORCE_SHUTDOWN);
+       mdelay(2);
+
+       return 0;
+#endif /* use fpga */
+}
+
+int mali_platform_device_deinit(struct platform_device *device)
+{
+       struct gpu_dfs_context *ctx = &gpu_dfs_ctx;
+
+       destroy_workqueue(ctx->gpu_dfs_workqueue);
+
+       mali_clock_off();
+
+       mali_power_off();
+
+       vfree(gpu_freq_list);
+       vfree(ctx->freq_list);
+       vfree(ctx->gpu_clk_src);
+
+       return 0;
+}
+
+static int freq_search(struct gpu_freq_info freq_list[], int len, int key)
+{
+       int low = 0, high = len - 1, mid;
+
+       if (key < 0)
+               return -1;
+
+       while (low <= high) {
+               mid = (low + high) / 2;
+
+               if (key == freq_list[mid].freq)
+                       return mid;
+
+               if (key < freq_list[mid].freq)
+                       high = mid - 1;
+               else
+                       low = mid + 1;
+       }
+
+       return -1;
+}
+
+void mali_platform_power_mode_change(int power_mode)
+{
+       struct gpu_dfs_context *ctx = &gpu_dfs_ctx;
+
+       down(ctx->sem);
+
+       MALI_DEBUG_PRINT(3,
+               ("Mali power mode change %d, gpu_power_on=%d gpu_clock_on=%d\n",
+                       power_mode, ctx->gpu_power_on, ctx->gpu_clock_on));
+
+       switch (power_mode) {
+       case 0: /* MALI_POWER_MODE_ON */
+               if (!ctx->gpu_power_on) {
+                       /*
+                        * The max limit feature is applied only utilization
+                        * routine, so GPU can work with max freq even though
+                        * max limit is set.
+                        */
+                       int max_index = freq_search(ctx->freq_list,
+                                                       ctx->freq_list_len,
+                                                       gpu_freq_max_limit);
+
+                       if (max_index >= 0)
+                               ctx->freq_max = &ctx->freq_list[max_index];
+
+                       ctx->freq_cur = ctx->freq_max;
+                       mali_power_on();
+                       mali_clock_on();
+               }
+
+               if (!ctx->gpu_clock_on)
+                       mali_clock_on();
+               break;
+       case 1: /* MALI_POWER_MODE_LIGHT_SLEEP */
+       case 2: /* MALI_POWER_MODE_DEEP_SLEEP */
+       default:
+               if (ctx->gpu_clock_on)
+                       mali_clock_off();
+
+               if (ctx->gpu_power_on)
+                       mali_power_off();
+               break;
+       };
+
+       up(ctx->sem);
+}
+
+static void gpu_dfs_func(struct work_struct *work)
+{
+       struct gpu_dfs_context *ctx = &gpu_dfs_ctx;
+
+       down(ctx->sem);
+
+       if (!ctx->gpu_power_on || !ctx->gpu_clock_on) {
+               up(ctx->sem);
+               return;
+       }
+
+       if (ctx->freq_next == ctx->freq_cur) {
+               up(ctx->sem);
+               return;
+       }
+
+#if !GPU_GLITCH_FREE_DFS
+       mali_dev_pause();
+
+#ifdef CONFIG_COMMON_CLK
+       clk_disable_unprepare(ctx->gpu_clock);
+#else
+       clk_disable(ctx->gpu_clock);
+#endif
+#endif
+
+       if (ctx->freq_next->clk_src != ctx->freq_cur->clk_src)
+               clk_set_parent(ctx->gpu_clock, ctx->freq_next->clk_src);
+
+       if (ctx->freq_next->div != ctx->freq_cur->div)
+               mali_set_div(ctx->freq_next->div);
+
+       ctx->freq_cur = ctx->freq_next;
+       gpu_freq_cur = ctx->freq_cur->freq;
+#ifdef CONFIG_SYSTEM_LOAD_ANALYZER
+       store_external_load_factor(GPU_FREQ, gpu_freq_cur);
+#endif
+
+#if !GPU_GLITCH_FREE_DFS
+#ifdef CONFIG_COMMON_CLK
+       clk_prepare_enable(ctx->gpu_clock);
+#else
+       clk_enable(ctx->gpu_clock);
+#endif
+       udelay(100);
+
+       mali_dev_resume();
+#endif
+
+       up(ctx->sem);
+}
+
+/*
+ * DVFS of SPRD implementation
+ */
+
+#if !SPRD_DFS_ONE_STEP_SCALE_DOWN
+static const struct gpu_freq_info
+*get_next_freq(const struct gpu_freq_info *min_freq,
+                       const struct gpu_freq_info *max_freq, int target)
+{
+       const struct gpu_freq_info *freq;
+
+       for (freq = min_freq; freq <= max_freq; freq++) {
+               if (freq->up_threshold > target)
+                       return freq;
+       }
+
+       return max_freq;
+}
+#endif
+
+static void mali_platform_utilization(struct mali_gpu_utilization_data *data)
+{
+#ifndef CONFIG_SCX35L64BIT_FPGA  /* not use fpga */
+       struct gpu_dfs_context *ctx = &gpu_dfs_ctx;
+       int max_index, min_index;
+
+       ctx->cur_load = data->utilization_gpu;
+
+       MALI_DEBUG_PRINT(3,
+                       ("GPU_DFS mali_utilization  gpu:%d  gp:%d pp:%d\n",
+                               data->utilization_gpu, data->utilization_gp,
+                               data->utilization_pp));
+       MALI_DEBUG_PRINT(3,
+                       ("GPU_DFS gpu_boost_level:%d gpu_boost_sf_level:%d\n",
+                               gpu_boost_level, gpu_boost_sf_level));
+
+       switch (gpu_boost_level) {
+       case 10:
+               ctx->freq_max = ctx->freq_min =
+                                       &ctx->freq_list[ctx->freq_list_len - 1];
+               break;
+       case 9:
+               ctx->freq_max = ctx->freq_min = ctx->freq_9;
+               break;
+       case 7:
+               ctx->freq_max = ctx->freq_min = ctx->freq_7;
+               break;
+       case 5:
+               ctx->freq_max = ctx->freq_min = ctx->freq_5;
+               break;
+       case 0:
+       default:
+               ctx->freq_max = ctx->freq_range_max;
+               ctx->freq_min = ctx->freq_range_min;
+               break;
+       }
+
+       if (!gpu_boost_level && (gpu_boost_sf_level > 0)) {
+               ctx->freq_max = ctx->freq_min =
+                                       &ctx->freq_list[ctx->freq_list_len - 1];
+       }
+
+       gpu_boost_level = 0;
+       gpu_boost_sf_level = 0;
+
+       /*
+        * SPRD_MATCH_DFS_TO_LOWER_FREQ
+        *
+        * If user uses gpufreq_min/max_limit sysfs node, it is possible that
+        * the minimum DFS frequency is higher than the maximum one.
+        * So we should correct this inversion phenomenon and there are two
+        * possible solutions.
+        * The first one is to change the minimum DFS frequency as the maximum
+        * one and is suitable for power-saving mode which requires to keep
+        * minimum frequency always.
+        * The other one is to change the maximum DFS frequency as the minimum
+        * one and is suitable for performance mode which requires to keep
+        * maximum frequency always.
+        */
+
+       /* limit min freq */
+       min_index = freq_search(ctx->freq_list, ctx->freq_list_len,
+                               gpu_freq_min_limit);
+       if ((min_index >= 0) &&
+               (ctx->freq_min->freq < ctx->freq_list[min_index].freq)) {
+               ctx->freq_min = &ctx->freq_list[min_index];
+#if !SPRD_MATCH_DFS_TO_LOWER_FREQ
+               if (ctx->freq_min->freq > ctx->freq_max->freq)
+                       ctx->freq_max = ctx->freq_min;
+#endif
+       }
+
+       /* limit max freq */
+       max_index = freq_search(ctx->freq_list, ctx->freq_list_len,
+                               gpu_freq_max_limit);
+       if ((max_index >= 0) &&
+               (ctx->freq_max->freq > ctx->freq_list[max_index].freq)) {
+               ctx->freq_max = &ctx->freq_list[max_index];
+#if SPRD_MATCH_DFS_TO_LOWER_FREQ
+               if (ctx->freq_max->freq < ctx->freq_min->freq)
+                       ctx->freq_min = ctx->freq_max;
+#endif
+       }
+
+       /*
+        * Scale up to maximum frequency if current load ratio is equal or
+        * greater than UP_THRESHOLD.
+        */
+       if (ctx->cur_load >= (256 * UP_THRESHOLD)) {
+               ctx->freq_next = ctx->freq_max;
+
+               MALI_DEBUG_PRINT(3, ("GPU_DFS util %3d; next_freq %6d\n",
+                                       ctx->cur_load, ctx->freq_next->freq));
+       } else {
+               int target_freq = ctx->freq_cur->freq * ctx->cur_load / 256;
+#if SPRD_DFS_ONE_STEP_SCALE_DOWN
+               /*
+                * Scale down one step if current load ratio is equal or less
+                * than DOWN_THRESHOLD.
+                */
+               ctx->freq_next = ctx->freq_cur;
+               if (ctx->cur_load <= (256 * DOWN_THRESHOLD)) {
+                       if (ctx->freq_next != &ctx->freq_list[0])
+                               ctx->freq_next--;
+
+                       /* Avoid meaningless scale down */
+                       if (ctx->freq_next->up_threshold < target_freq)
+                               ctx->freq_next++;
+               }
+
+               /* Consider limit max & min freq */
+               if (ctx->freq_next->freq > ctx->freq_max->freq)
+                       ctx->freq_next = ctx->freq_max;
+               else if (ctx->freq_next->freq < ctx->freq_min->freq)
+                       ctx->freq_next = ctx->freq_min;
+#else
+               /* Scale down to target frequency */
+               ctx->freq_next = get_next_freq(ctx->freq_min, ctx->freq_max,
+                                                               target_freq);
+#endif
+
+               MALI_DEBUG_PRINT(3,
+                       ("GPU_DFS util %3d; target_freq %6d; cur_freq %6d -> next_freq %6d\n",
+                               ctx->cur_load, target_freq, ctx->freq_cur->freq,
+                               ctx->freq_next->freq));
+       }
+
+#ifdef CONFIG_SYSTEM_LOAD_ANALYZER
+       store_external_load_factor(GPU_UTILIZATION, ctx->cur_load);
+#endif
+
+       if (ctx->freq_next->freq != ctx->freq_cur->freq)
+               queue_work(ctx->gpu_dfs_workqueue, &gpu_dfs_work);
+#endif  /* not use fpga */
+}
+
+bool mali_is_on(void)
+{
+       struct gpu_dfs_context *ctx = &gpu_dfs_ctx;
+
+       if (ctx->gpu_power_on && ctx->gpu_clock_on)
+               return true;
+       else
+               MALI_DEBUG_PRINT(5, ("gpu_power_on = %d, gpu_clock_on = %d\n",
+                                       ctx->gpu_power_on, ctx->gpu_clock_on));
+
+       return false;
+}
author	Joonyoung Shim <jy0922.shim@samsung.com>
	Tue, 10 May 2016 06:49:03 +0000 (15:49 +0900)
committer	Joonyoung Shim <jy0922.shim@samsung.com>
	Mon, 23 May 2016 06:41:28 +0000 (15:41 +0900)
drivers/gpu/arm/mali400/r5p2_rel0/Kbuild		patch \| blob \| history
drivers/gpu/arm/mali400/r5p2_rel0/platform/sc8830/base.h	[new file with mode: 0644]	patch \| blob
drivers/gpu/arm/mali400/r5p2_rel0/platform/sc8830/mali_platform.c	[new file with mode: 0644]	patch \| blob