summaryrefslogtreecommitdiff
path: root/drivers/devfreq
diff options
context:
space:
mode:
authorRohit Gupta <rohgup@codeaurora.org>2014-07-18 16:16:02 -0700
committerDavid Keitel <dkeitel@codeaurora.org>2016-03-23 20:04:39 -0700
commit43f61ed8aa3ebb85c40b329b83f33b79f08712c6 (patch)
tree43497c36ef8ef9e856dc7947222036cbbda452c9 /drivers/devfreq
parentc36f6302dc08e5152b6afcfeb4e75a914d8166b1 (diff)
PM / devfreq : Introduce a memory-latency governor
Use performance counters to detect the memory latency sensitivity of CPU workloads and vote for higher DDR frequency if required. Change-Id: Ie77a3523bc5713fc0315bd0abc3913f485a96e0e Signed-off-by: Rohit Gupta <rohgup@codeaurora.org> Suggested-by: Saravana Kannan <skannan@codeaurora.org> [junjiew@codeaurora.org: dropped changes in arch/arm64/Kconfig] Signed-off-by: Junjie Wu <junjiew@codeaurora.org>
Diffstat (limited to 'drivers/devfreq')
-rw-r--r--drivers/devfreq/Kconfig19
-rw-r--r--drivers/devfreq/Makefile2
-rw-r--r--drivers/devfreq/arm-memlat-mon.c316
-rw-r--r--drivers/devfreq/governor_memlat.c338
-rw-r--r--drivers/devfreq/governor_memlat.h83
5 files changed, 758 insertions, 0 deletions
diff --git a/drivers/devfreq/Kconfig b/drivers/devfreq/Kconfig
index 4bbdb76c6d65..65ad59284c53 100644
--- a/drivers/devfreq/Kconfig
+++ b/drivers/devfreq/Kconfig
@@ -98,6 +98,15 @@ config ARMBW_HWMON
capability to raise an IRQ when the counter overflows, which can be
used to get an IRQ when the count exceeds a certain value
+config ARM_MEMLAT_MON
+ tristate "ARM CPU Memory Latency monitor hardware"
+ depends on ARCH_MSM
+ help
+ The PMU present on these ARM cores allow for the use of counters to
+ monitor the memory latency characteristics of an ARM CPU workload.
+ This driver uses these counters to implement the APIs needed by
+ the mem_latency devfreq governor.
+
config MSMCCI_HWMON
tristate "MSM CCI Cache monitor hardware"
depends on ARCH_MSM
@@ -144,6 +153,16 @@ config DEVFREQ_GOV_SPDM_HYP
Sets the frequency using a "on-demand" algorithm.
This governor is unlikely to be useful for other devices.
+config DEVFREQ_GOV_MEMLAT
+ tristate "HW monitor based governor for device BW"
+ depends on ARM_MEMLAT_MON
+ help
+ HW monitor based governor for device to DDR bandwidth voting.
+ This governor sets the CPU BW vote based on stats obtained from memalat
+ monitor if it determines that a workload is memory latency bound. Since
+ this uses target specific counters it can conflict with existing profiling
+ tools.
+
comment "DEVFREQ Drivers"
config ARM_EXYNOS4_BUS_DEVFREQ
diff --git a/drivers/devfreq/Makefile b/drivers/devfreq/Makefile
index 166c3d220b26..5adb9492c5e1 100644
--- a/drivers/devfreq/Makefile
+++ b/drivers/devfreq/Makefile
@@ -8,11 +8,13 @@ obj-$(CONFIG_DEVFREQ_GOV_QCOM_ADRENO_TZ) += governor_msm_adreno_tz.o
obj-$(CONFIG_DEVFREQ_GOV_CPUFREQ) += governor_cpufreq.o
obj-$(CONFIG_MSM_BIMC_BWMON) += bimc-bwmon.o
obj-$(CONFIG_ARMBW_HWMON) += armbw-pm.o
+obj-$(CONFIG_ARM_MEMLAT_MON) += arm-memlat-mon.o
obj-$(CONFIG_MSMCCI_HWMON) += msmcci-hwmon.o
obj-$(CONFIG_MSM_M4M_HWMON) += m4m-hwmon.o
obj-$(CONFIG_DEVFREQ_GOV_MSM_BW_HWMON) += governor_bw_hwmon.o
obj-$(CONFIG_DEVFREQ_GOV_MSM_CACHE_HWMON) += governor_cache_hwmon.o
obj-$(CONFIG_DEVFREQ_GOV_SPDM_HYP) += governor_spdm_bw_hyp.o
+obj-$(CONFIG_DEVFREQ_GOV_MEMLAT) += governor_memlat.o
# DEVFREQ Drivers
obj-$(CONFIG_ARM_EXYNOS4_BUS_DEVFREQ) += exynos/
diff --git a/drivers/devfreq/arm-memlat-mon.c b/drivers/devfreq/arm-memlat-mon.c
new file mode 100644
index 000000000000..a13cb1995329
--- /dev/null
+++ b/drivers/devfreq/arm-memlat-mon.c
@@ -0,0 +1,316 @@
+/*
+ * Copyright (c) 2014-2015, The Linux Foundation. All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License version 2 and
+ * only version 2 as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ */
+
+#define pr_fmt(fmt) "arm-memlat-mon: " fmt
+
+#include <linux/kernel.h>
+#include <linux/module.h>
+#include <linux/init.h>
+#include <linux/io.h>
+#include <linux/delay.h>
+#include <linux/err.h>
+#include <linux/errno.h>
+#include <linux/interrupt.h>
+#include <linux/platform_device.h>
+#include <linux/of.h>
+#include <linux/of_irq.h>
+#include <linux/slab.h>
+#include <linux/irq.h>
+#include <linux/cpu_pm.h>
+#include <linux/cpu.h>
+#include "governor.h"
+#include "governor_memlat.h"
+#include <linux/perf_event.h>
+
+enum ev_index {
+ INST_IDX,
+ L2DM_IDX,
+ CYC_IDX,
+ NUM_EVENTS
+};
+#define INST_EV 0x08
+#define L2DM_EV 0x17
+#define CYC_EV 0x11
+
+struct event_data {
+ struct perf_event *pevent;
+ unsigned long prev_count;
+ bool overflow;
+};
+
+struct memlat_hwmon_data {
+ struct event_data events[NUM_EVENTS];
+ ktime_t prev_ts;
+};
+static DEFINE_PER_CPU(struct memlat_hwmon_data, pm_data);
+
+struct cpu_grp_info {
+ cpumask_t cpus;
+ struct memlat_hwmon hw;
+};
+
+static unsigned long compute_freq(struct memlat_hwmon_data *hw_data,
+ unsigned long cyc_cnt)
+{
+ ktime_t ts;
+ unsigned int diff;
+ unsigned long freq = 0;
+
+ ts = ktime_get();
+ diff = ktime_to_us(ktime_sub(ts, hw_data->prev_ts));
+ if (!diff)
+ diff = 1;
+ hw_data->prev_ts = ts;
+ freq = cyc_cnt;
+ do_div(freq, diff);
+
+ return freq;
+}
+
+#define MAX_COUNT_LIM 0xFFFFFFFFFFFFFFFF
+static inline unsigned long read_event(struct event_data *event)
+{
+ unsigned long ev_count;
+ u64 total, enabled, running;
+
+ total = perf_event_read_value(event->pevent, &enabled, &running);
+ if (total >= event->prev_count)
+ ev_count = total - event->prev_count;
+ else
+ ev_count = (MAX_COUNT_LIM - event->prev_count) + total;
+
+ event->prev_count = total;
+
+ return ev_count;
+}
+
+static void read_perf_counters(int cpu, struct cpu_grp_info *cpu_grp)
+{
+ int cpu_idx;
+ struct memlat_hwmon_data *hw_data = &per_cpu(pm_data, cpu);
+ struct memlat_hwmon *hw = &cpu_grp->hw;
+ unsigned long cyc_cnt;
+
+ cpu_idx = cpu - cpumask_first(&cpu_grp->cpus);
+
+ hw->core_stats[cpu_idx].inst_count =
+ read_event(&hw_data->events[INST_IDX]);
+
+ hw->core_stats[cpu_idx].mem_count =
+ read_event(&hw_data->events[L2DM_IDX]);
+
+ cyc_cnt = read_event(&hw_data->events[CYC_IDX]);
+ hw->core_stats[cpu_idx].freq = compute_freq(hw_data, cyc_cnt);
+}
+
+static unsigned long get_cnt(struct memlat_hwmon *hw)
+{
+ int cpu;
+ struct cpu_grp_info *cpu_grp = container_of(hw,
+ struct cpu_grp_info, hw);
+
+ for_each_cpu(cpu, &cpu_grp->cpus)
+ read_perf_counters(cpu, cpu_grp);
+
+ return 0;
+}
+
+static void delete_events(struct memlat_hwmon_data *hw_data)
+{
+ perf_event_release_kernel(hw_data->events[INST_IDX].pevent);
+ perf_event_release_kernel(hw_data->events[L2DM_IDX].pevent);
+ perf_event_release_kernel(hw_data->events[CYC_IDX].pevent);
+}
+
+static void stop_hwmon(struct memlat_hwmon *hw)
+{
+ int cpu;
+ struct memlat_hwmon_data *hw_data;
+ struct cpu_grp_info *cpu_grp = container_of(hw,
+ struct cpu_grp_info, hw);
+
+ get_online_cpus();
+ for_each_cpu(cpu, &cpu_grp->cpus) {
+ hw_data = &per_cpu(pm_data, cpu);
+ delete_events(hw_data);
+ }
+ put_online_cpus();
+
+}
+
+struct perf_event *create_event(int cpu, unsigned long event)
+{
+ struct perf_event *pevent;
+ struct perf_event_attr *attr;
+
+ attr = kzalloc(sizeof(struct perf_event_attr), GFP_KERNEL);
+ if (!attr)
+ return ERR_PTR(-ENOMEM);
+
+ attr->config = event;
+ attr->type = PERF_TYPE_RAW;
+ attr->size = sizeof(struct perf_event_attr);
+ attr->pinned = 1;
+ attr->exclude_idle = 1;
+
+ pevent = perf_event_create_kernel_counter(attr, cpu, NULL, NULL, NULL);
+
+ return pevent;
+}
+
+static int set_events(struct memlat_hwmon_data *hw_data, int cpu)
+{
+ struct perf_event *pevent;
+ int err;
+
+ pevent = create_event(cpu, INST_EV);
+ if (IS_ERR(pevent))
+ goto err_out;
+ hw_data->events[INST_IDX].pevent = pevent;
+ perf_event_enable(hw_data->events[INST_IDX].pevent);
+
+ pevent = create_event(cpu, L2DM_EV);
+ if (IS_ERR(pevent))
+ goto err_out;
+ hw_data->events[L2DM_IDX].pevent = pevent;
+ perf_event_enable(hw_data->events[L2DM_IDX].pevent);
+
+ pevent = create_event(cpu, CYC_EV);
+ if (IS_ERR(pevent))
+ goto err_out;
+ hw_data->events[CYC_IDX].pevent = pevent;
+ perf_event_enable(hw_data->events[CYC_IDX].pevent);
+
+ return 0;
+
+err_out:
+ err = PTR_ERR(pevent);
+ return err;
+}
+
+static int start_hwmon(struct memlat_hwmon *hw)
+{
+ int cpu, ret = 0;
+ struct memlat_hwmon_data *hw_data;
+ struct cpu_grp_info *cpu_grp = container_of(hw,
+ struct cpu_grp_info, hw);
+
+ get_online_cpus();
+ for_each_cpu(cpu, &cpu_grp->cpus) {
+ hw_data = &per_cpu(pm_data, cpu);
+ ret = set_events(hw_data, cpu);
+ if (ret)
+ goto err;
+ }
+ pr_info("Group %d events created\n", cpumask_first(&cpu_grp->cpus));
+
+err:
+ put_online_cpus();
+ return ret;
+}
+
+static int get_mask_from_dev_handle(struct platform_device *pdev,
+ cpumask_t *mask)
+{
+ struct device_node *dev_phandle;
+ int cpu = 0;
+
+ dev_phandle = of_parse_phandle(pdev->dev.of_node, "qcom,firstcpu", 0);
+ if (!dev_phandle)
+ return -ENOENT;
+
+ for_each_possible_cpu(cpu) {
+ if (arch_find_n_match_cpu_physical_id(dev_phandle, cpu, NULL)) {
+ cpumask_copy(mask, cpu_coregroup_mask(cpu));
+ return 0;
+ }
+ }
+
+ return -ENOENT;
+}
+
+static int arm_memlat_mon_driver_probe(struct platform_device *pdev)
+{
+ struct device *dev = &pdev->dev;
+ struct memlat_hwmon *hw;
+ struct cpu_grp_info *cpu_grp;
+ int cpu, ret;
+
+ cpu_grp = devm_kzalloc(dev, sizeof(*cpu_grp), GFP_KERNEL);
+ if (!cpu_grp)
+ return -ENOMEM;
+ hw = &cpu_grp->hw;
+
+ hw->dev = dev;
+ hw->of_node = of_parse_phandle(dev->of_node, "qcom,target-dev", 0);
+ if (!hw->of_node) {
+ dev_err(dev, "Couldn't find a target device\n");
+ goto err_out;
+ }
+
+ if (get_mask_from_dev_handle(pdev, &cpu_grp->cpus)) {
+ dev_err(dev, "CPU list is empty\n");
+ goto err_out;
+ }
+
+ hw->num_cores = cpumask_weight(&cpu_grp->cpus);
+ hw->core_stats = devm_kzalloc(dev, hw->num_cores *
+ sizeof(*(hw->core_stats)), GFP_KERNEL);
+ if (!hw->core_stats)
+ goto err_out;
+
+ for_each_cpu(cpu, &cpu_grp->cpus)
+ hw->core_stats[cpu - cpumask_first(&cpu_grp->cpus)].id = cpu;
+
+ hw->start_hwmon = &start_hwmon;
+ hw->stop_hwmon = &stop_hwmon;
+ hw->get_cnt = &get_cnt;
+
+ ret = register_memlat(dev, hw);
+ if (ret) {
+ pr_err("Mem Latency Gov registration failed\n");
+ goto err_out;
+ }
+
+ return 0;
+
+err_out:
+ kfree(cpu_grp);
+ return -EINVAL;
+}
+
+static struct of_device_id match_table[] = {
+ { .compatible = "qcom,arm-memlat-mon" },
+ {}
+};
+
+static struct platform_driver arm_memlat_mon_driver = {
+ .probe = arm_memlat_mon_driver_probe,
+ .driver = {
+ .name = "arm-memlat-mon",
+ .of_match_table = match_table,
+ .owner = THIS_MODULE,
+ },
+};
+
+static int __init arm_memlat_mon_init(void)
+{
+ return platform_driver_register(&arm_memlat_mon_driver);
+}
+module_init(arm_memlat_mon_init);
+
+static void __exit arm_memlat_mon_exit(void)
+{
+ platform_driver_unregister(&arm_memlat_mon_driver);
+}
+module_exit(arm_memlat_mon_exit);
diff --git a/drivers/devfreq/governor_memlat.c b/drivers/devfreq/governor_memlat.c
new file mode 100644
index 000000000000..90c92f38053c
--- /dev/null
+++ b/drivers/devfreq/governor_memlat.c
@@ -0,0 +1,338 @@
+/*
+ * Copyright (c) 2015, The Linux Foundation. All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License version 2 and
+ * only version 2 as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ */
+
+#define pr_fmt(fmt) "mem_lat: " fmt
+
+#include <linux/kernel.h>
+#include <linux/sizes.h>
+#include <linux/module.h>
+#include <linux/init.h>
+#include <linux/io.h>
+#include <linux/delay.h>
+#include <linux/ktime.h>
+#include <linux/time.h>
+#include <linux/err.h>
+#include <linux/errno.h>
+#include <linux/mutex.h>
+#include <linux/interrupt.h>
+#include <linux/platform_device.h>
+#include <linux/of.h>
+#include <linux/devfreq.h>
+#include "governor.h"
+#include "governor_memlat.h"
+
+#include <trace/events/power.h>
+
+struct memlat_node {
+ unsigned int ratio_ceil;
+ unsigned int freq_thresh_mhz;
+ unsigned int mult_factor;
+ bool mon_started;
+ struct list_head list;
+ void *orig_data;
+ struct memlat_hwmon *hw;
+ struct devfreq_governor *gov;
+ struct attribute_group *attr_grp;
+};
+
+static LIST_HEAD(memlat_list);
+static DEFINE_MUTEX(list_lock);
+
+static int use_cnt;
+static DEFINE_MUTEX(state_lock);
+
+#define show_attr(name) \
+static ssize_t show_##name(struct device *dev, \
+ struct device_attribute *attr, char *buf) \
+{ \
+ struct devfreq *df = to_devfreq(dev); \
+ struct memlat_node *hw = df->data; \
+ return snprintf(buf, PAGE_SIZE, "%u\n", hw->name); \
+}
+
+#define store_attr(name, _min, _max) \
+static ssize_t store_##name(struct device *dev, \
+ struct device_attribute *attr, const char *buf, \
+ size_t count) \
+{ \
+ struct devfreq *df = to_devfreq(dev); \
+ struct memlat_node *hw = df->data; \
+ int ret; \
+ unsigned int val; \
+ ret = kstrtouint(buf, 10, &val); \
+ if (ret != 1) \
+ return -EINVAL; \
+ val = max(val, _min); \
+ val = min(val, _max); \
+ hw->name = val; \
+ return count; \
+}
+
+#define gov_attr(__attr, min, max) \
+show_attr(__attr) \
+store_attr(__attr, min, max) \
+static DEVICE_ATTR(__attr, 0644, show_##__attr, store_##__attr)
+
+static unsigned long compute_dev_vote(struct devfreq *df)
+{
+ int i, lat_dev;
+ struct memlat_node *node = df->data;
+ struct memlat_hwmon *hw = node->hw;
+ unsigned long max_freq = 0;
+ unsigned int ratio;
+
+ hw->get_cnt(hw);
+
+ for (i = 0; i < hw->num_cores; i++) {
+ ratio = hw->core_stats[i].inst_count;
+
+ if (hw->core_stats[i].mem_count)
+ ratio /= hw->core_stats[i].mem_count;
+
+ trace_memlat_dev_meas(dev_name(df->dev.parent),
+ hw->core_stats[i].id,
+ hw->core_stats[i].inst_count,
+ hw->core_stats[i].mem_count,
+ hw->core_stats[i].freq, ratio);
+
+ if (ratio && ratio <= node->ratio_ceil
+ && hw->core_stats[i].freq >= node->freq_thresh_mhz
+ && hw->core_stats[i].freq > max_freq) {
+ lat_dev = i;
+ max_freq = hw->core_stats[i].freq;
+ }
+ }
+
+ if (max_freq)
+ trace_memlat_dev_update(dev_name(df->dev.parent),
+ hw->core_stats[lat_dev].id,
+ hw->core_stats[lat_dev].inst_count,
+ hw->core_stats[lat_dev].mem_count,
+ hw->core_stats[lat_dev].freq,
+ max_freq * node->mult_factor);
+
+ return max_freq;
+}
+
+static struct memlat_node *find_memlat_node(struct devfreq *df)
+{
+ struct memlat_node *node, *found = NULL;
+
+ mutex_lock(&list_lock);
+ list_for_each_entry(node, &memlat_list, list)
+ if (node->hw->dev == df->dev.parent ||
+ node->hw->of_node == df->dev.parent->of_node) {
+ found = node;
+ break;
+ }
+ mutex_unlock(&list_lock);
+
+ return found;
+}
+
+static int start_monitor(struct devfreq *df)
+{
+ struct memlat_node *node = df->data;
+ struct memlat_hwmon *hw = node->hw;
+ struct device *dev = df->dev.parent;
+ int ret;
+
+ ret = hw->start_hwmon(hw);
+
+ if (ret) {
+ dev_err(dev, "Unable to start HW monitor! (%d)\n", ret);
+ return ret;
+ }
+
+ devfreq_monitor_start(df);
+
+ node->mon_started = true;
+
+ return 0;
+}
+
+static void stop_monitor(struct devfreq *df)
+{
+ struct memlat_node *node = df->data;
+ struct memlat_hwmon *hw = node->hw;
+
+ node->mon_started = false;
+
+ devfreq_monitor_stop(df);
+ hw->stop_hwmon(hw);
+}
+
+static int gov_start(struct devfreq *df)
+{
+ int ret = 0;
+ struct device *dev = df->dev.parent;
+ struct memlat_node *node;
+ struct memlat_hwmon *hw;
+
+ node = find_memlat_node(df);
+ if (!node) {
+ dev_err(dev, "Unable to find HW monitor!\n");
+ return -ENODEV;
+ }
+ hw = node->hw;
+
+ hw->df = df;
+ node->orig_data = df->data;
+ df->data = node;
+
+ if (start_monitor(df))
+ goto err_start;
+
+ ret = sysfs_create_group(&df->dev.kobj, node->attr_grp);
+ if (ret)
+ goto err_sysfs;
+
+ return 0;
+
+err_sysfs:
+ stop_monitor(df);
+err_start:
+ df->data = node->orig_data;
+ node->orig_data = NULL;
+ hw->df = NULL;
+ return ret;
+}
+
+static void gov_stop(struct devfreq *df)
+{
+ struct memlat_node *node = df->data;
+ struct memlat_hwmon *hw = node->hw;
+
+ sysfs_remove_group(&df->dev.kobj, node->attr_grp);
+ stop_monitor(df);
+ df->data = node->orig_data;
+ node->orig_data = NULL;
+ hw->df = NULL;
+}
+
+static int devfreq_memlat_get_freq(struct devfreq *df,
+ unsigned long *freq,
+ u32 *flag)
+{
+ unsigned long mhz;
+ struct memlat_node *node = df->data;
+
+ mhz = compute_dev_vote(df);
+ *freq = mhz ? (mhz * node->mult_factor) : 0;
+
+ return 0;
+}
+
+gov_attr(ratio_ceil, 1U, 1000U);
+gov_attr(freq_thresh_mhz, 300U, 5000U);
+gov_attr(mult_factor, 1U, 10U);
+
+static struct attribute *dev_attr[] = {
+ &dev_attr_ratio_ceil.attr,
+ &dev_attr_freq_thresh_mhz.attr,
+ &dev_attr_mult_factor.attr,
+ NULL,
+};
+
+static struct attribute_group dev_attr_group = {
+ .name = "mem_latency",
+ .attrs = dev_attr,
+};
+
+#define MIN_MS 10U
+#define MAX_MS 500U
+static int devfreq_memlat_ev_handler(struct devfreq *df,
+ unsigned int event, void *data)
+{
+ int ret;
+ unsigned int sample_ms;
+
+ switch (event) {
+ case DEVFREQ_GOV_START:
+ sample_ms = df->profile->polling_ms;
+ sample_ms = max(MIN_MS, sample_ms);
+ sample_ms = min(MAX_MS, sample_ms);
+ df->profile->polling_ms = sample_ms;
+
+ ret = gov_start(df);
+ if (ret)
+ return ret;
+
+ dev_dbg(df->dev.parent,
+ "Enabled Memory Latency governor\n");
+ break;
+
+ case DEVFREQ_GOV_STOP:
+ gov_stop(df);
+ dev_dbg(df->dev.parent,
+ "Disabled Memory Latency governor\n");
+ break;
+
+ case DEVFREQ_GOV_INTERVAL:
+ sample_ms = *(unsigned int *)data;
+ sample_ms = max(MIN_MS, sample_ms);
+ sample_ms = min(MAX_MS, sample_ms);
+ devfreq_interval_update(df, &sample_ms);
+ break;
+ }
+
+ return 0;
+}
+
+static struct devfreq_governor devfreq_gov_memlat = {
+ .name = "mem_latency",
+ .get_target_freq = devfreq_memlat_get_freq,
+ .event_handler = devfreq_memlat_ev_handler,
+};
+
+int register_memlat(struct device *dev, struct memlat_hwmon *hw)
+{
+ int ret = 0;
+ struct memlat_node *node;
+
+ if (!hw->dev && !hw->of_node)
+ return -EINVAL;
+
+ node = devm_kzalloc(dev, sizeof(*node), GFP_KERNEL);
+ if (!node)
+ return -ENOMEM;
+
+ node->gov = &devfreq_gov_memlat;
+ node->attr_grp = &dev_attr_group;
+
+ node->ratio_ceil = 10;
+ node->freq_thresh_mhz = 900;
+ node->mult_factor = 8;
+ node->hw = hw;
+
+ mutex_lock(&list_lock);
+ list_add_tail(&node->list, &memlat_list);
+ mutex_unlock(&list_lock);
+
+ mutex_lock(&state_lock);
+ if (!use_cnt)
+ ret = devfreq_add_governor(&devfreq_gov_memlat);
+ if (!ret)
+ use_cnt++;
+ mutex_unlock(&state_lock);
+
+ if (!ret)
+ dev_info(dev, "Memory Latency governor registered.\n");
+ else
+ dev_err(dev, "Memory Latency governor registration failed!\n");
+
+ return ret;
+}
+
+MODULE_DESCRIPTION("HW monitor based dev DDR bandwidth voting driver");
+MODULE_LICENSE("GPL v2");
diff --git a/drivers/devfreq/governor_memlat.h b/drivers/devfreq/governor_memlat.h
new file mode 100644
index 000000000000..19a35009a4a0
--- /dev/null
+++ b/drivers/devfreq/governor_memlat.h
@@ -0,0 +1,83 @@
+/*
+ * Copyright (c) 2015, The Linux Foundation. All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License version 2 and
+ * only version 2 as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ */
+
+#ifndef _GOVERNOR_BW_HWMON_H
+#define _GOVERNOR_BW_HWMON_H
+
+#include <linux/kernel.h>
+#include <linux/devfreq.h>
+
+/**
+ * struct dev_stats - Device stats
+ * @inst_count: Number of instructions executed.
+ * @mem_count: Number of memory accesses made.
+ * @freq: Effective frequency of the device in the
+ * last interval.
+ */
+struct dev_stats {
+ int id;
+ unsigned long inst_count;
+ unsigned long mem_count;
+ unsigned long freq;
+};
+
+/**
+ * struct memlat_hwmon - Memory Latency HW monitor info
+ * @start_hwmon: Start the HW monitoring
+ * @stop_hwmon: Stop the HW monitoring
+ * @get_cnt: Return the number of intructions executed,
+ * memory accesses and effective frequency
+ * @dev: Pointer to device that this HW monitor can
+ * monitor.
+ * @of_node: OF node of device that this HW monitor can
+ * monitor.
+ * @df: Devfreq node that this HW monitor is being
+ * used for. NULL when not actively in use and
+ * non-NULL when in use.
+ * @num_cores: Number of cores that are monitored by the
+ * hardware monitor.
+ * @core_stats: Array containing instruction count, memory
+ * accesses and effective frequency for each core.
+ *
+ * One of dev or of_node needs to be specified for a successful registration.
+ *
+ */
+struct memlat_hwmon {
+ int (*start_hwmon)(struct memlat_hwmon *hw);
+ void (*stop_hwmon)(struct memlat_hwmon *hw);
+ unsigned long (*get_cnt)(struct memlat_hwmon *hw);
+ struct device *dev;
+ struct device_node *of_node;
+
+ unsigned int num_cores;
+ struct dev_stats *core_stats;
+
+ struct devfreq *df;
+};
+
+#ifdef CONFIG_DEVFREQ_GOV_MEMLAT
+int register_memlat(struct device *dev, struct memlat_hwmon *hw);
+int update_memlat(struct memlat_hwmon *hw);
+#else
+static inline int register_memlat(struct device *dev,
+ struct memlat_hwmon *hw)
+{
+ return 0;
+}
+static inline int update_memlat(struct memlat_hwmon *hw)
+{
+ return 0;
+}
+#endif
+
+#endif /* _GOVERNOR_BW_HWMON_H */