1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved
4*4882a593Smuzhiyun */
5*4882a593Smuzhiyun
6*4882a593Smuzhiyun #include <linux/cpufreq.h>
7*4882a593Smuzhiyun #include <linux/dma-mapping.h>
8*4882a593Smuzhiyun #include <linux/module.h>
9*4882a593Smuzhiyun #include <linux/of.h>
10*4882a593Smuzhiyun #include <linux/platform_device.h>
11*4882a593Smuzhiyun
12*4882a593Smuzhiyun #include <soc/tegra/bpmp.h>
13*4882a593Smuzhiyun #include <soc/tegra/bpmp-abi.h>
14*4882a593Smuzhiyun
15*4882a593Smuzhiyun #define EDVD_CORE_VOLT_FREQ(core) (0x20 + (core) * 0x4)
16*4882a593Smuzhiyun #define EDVD_CORE_VOLT_FREQ_F_SHIFT 0
17*4882a593Smuzhiyun #define EDVD_CORE_VOLT_FREQ_F_MASK 0xffff
18*4882a593Smuzhiyun #define EDVD_CORE_VOLT_FREQ_V_SHIFT 16
19*4882a593Smuzhiyun
20*4882a593Smuzhiyun struct tegra186_cpufreq_cluster_info {
21*4882a593Smuzhiyun unsigned long offset;
22*4882a593Smuzhiyun int cpus[4];
23*4882a593Smuzhiyun unsigned int bpmp_cluster_id;
24*4882a593Smuzhiyun };
25*4882a593Smuzhiyun
26*4882a593Smuzhiyun #define NO_CPU -1
27*4882a593Smuzhiyun static const struct tegra186_cpufreq_cluster_info tegra186_clusters[] = {
28*4882a593Smuzhiyun /* Denver cluster */
29*4882a593Smuzhiyun {
30*4882a593Smuzhiyun .offset = SZ_64K * 7,
31*4882a593Smuzhiyun .cpus = { 1, 2, NO_CPU, NO_CPU },
32*4882a593Smuzhiyun .bpmp_cluster_id = 0,
33*4882a593Smuzhiyun },
34*4882a593Smuzhiyun /* A57 cluster */
35*4882a593Smuzhiyun {
36*4882a593Smuzhiyun .offset = SZ_64K * 6,
37*4882a593Smuzhiyun .cpus = { 0, 3, 4, 5 },
38*4882a593Smuzhiyun .bpmp_cluster_id = 1,
39*4882a593Smuzhiyun },
40*4882a593Smuzhiyun };
41*4882a593Smuzhiyun
42*4882a593Smuzhiyun struct tegra186_cpufreq_cluster {
43*4882a593Smuzhiyun const struct tegra186_cpufreq_cluster_info *info;
44*4882a593Smuzhiyun struct cpufreq_frequency_table *table;
45*4882a593Smuzhiyun u32 ref_clk_khz;
46*4882a593Smuzhiyun u32 div;
47*4882a593Smuzhiyun };
48*4882a593Smuzhiyun
49*4882a593Smuzhiyun struct tegra186_cpufreq_data {
50*4882a593Smuzhiyun void __iomem *regs;
51*4882a593Smuzhiyun
52*4882a593Smuzhiyun size_t num_clusters;
53*4882a593Smuzhiyun struct tegra186_cpufreq_cluster *clusters;
54*4882a593Smuzhiyun };
55*4882a593Smuzhiyun
tegra186_cpufreq_init(struct cpufreq_policy * policy)56*4882a593Smuzhiyun static int tegra186_cpufreq_init(struct cpufreq_policy *policy)
57*4882a593Smuzhiyun {
58*4882a593Smuzhiyun struct tegra186_cpufreq_data *data = cpufreq_get_driver_data();
59*4882a593Smuzhiyun unsigned int i;
60*4882a593Smuzhiyun
61*4882a593Smuzhiyun for (i = 0; i < data->num_clusters; i++) {
62*4882a593Smuzhiyun struct tegra186_cpufreq_cluster *cluster = &data->clusters[i];
63*4882a593Smuzhiyun const struct tegra186_cpufreq_cluster_info *info =
64*4882a593Smuzhiyun cluster->info;
65*4882a593Smuzhiyun int core;
66*4882a593Smuzhiyun
67*4882a593Smuzhiyun for (core = 0; core < ARRAY_SIZE(info->cpus); core++) {
68*4882a593Smuzhiyun if (info->cpus[core] == policy->cpu)
69*4882a593Smuzhiyun break;
70*4882a593Smuzhiyun }
71*4882a593Smuzhiyun if (core == ARRAY_SIZE(info->cpus))
72*4882a593Smuzhiyun continue;
73*4882a593Smuzhiyun
74*4882a593Smuzhiyun policy->driver_data =
75*4882a593Smuzhiyun data->regs + info->offset + EDVD_CORE_VOLT_FREQ(core);
76*4882a593Smuzhiyun policy->freq_table = cluster->table;
77*4882a593Smuzhiyun break;
78*4882a593Smuzhiyun }
79*4882a593Smuzhiyun
80*4882a593Smuzhiyun policy->cpuinfo.transition_latency = 300 * 1000;
81*4882a593Smuzhiyun
82*4882a593Smuzhiyun return 0;
83*4882a593Smuzhiyun }
84*4882a593Smuzhiyun
tegra186_cpufreq_set_target(struct cpufreq_policy * policy,unsigned int index)85*4882a593Smuzhiyun static int tegra186_cpufreq_set_target(struct cpufreq_policy *policy,
86*4882a593Smuzhiyun unsigned int index)
87*4882a593Smuzhiyun {
88*4882a593Smuzhiyun struct cpufreq_frequency_table *tbl = policy->freq_table + index;
89*4882a593Smuzhiyun void __iomem *edvd_reg = policy->driver_data;
90*4882a593Smuzhiyun u32 edvd_val = tbl->driver_data;
91*4882a593Smuzhiyun
92*4882a593Smuzhiyun writel(edvd_val, edvd_reg);
93*4882a593Smuzhiyun
94*4882a593Smuzhiyun return 0;
95*4882a593Smuzhiyun }
96*4882a593Smuzhiyun
tegra186_cpufreq_get(unsigned int cpu)97*4882a593Smuzhiyun static unsigned int tegra186_cpufreq_get(unsigned int cpu)
98*4882a593Smuzhiyun {
99*4882a593Smuzhiyun struct tegra186_cpufreq_data *data = cpufreq_get_driver_data();
100*4882a593Smuzhiyun struct cpufreq_policy *policy;
101*4882a593Smuzhiyun void __iomem *edvd_reg;
102*4882a593Smuzhiyun unsigned int i, freq = 0;
103*4882a593Smuzhiyun u32 ndiv;
104*4882a593Smuzhiyun
105*4882a593Smuzhiyun policy = cpufreq_cpu_get(cpu);
106*4882a593Smuzhiyun if (!policy)
107*4882a593Smuzhiyun return 0;
108*4882a593Smuzhiyun
109*4882a593Smuzhiyun edvd_reg = policy->driver_data;
110*4882a593Smuzhiyun ndiv = readl(edvd_reg) & EDVD_CORE_VOLT_FREQ_F_MASK;
111*4882a593Smuzhiyun
112*4882a593Smuzhiyun for (i = 0; i < data->num_clusters; i++) {
113*4882a593Smuzhiyun struct tegra186_cpufreq_cluster *cluster = &data->clusters[i];
114*4882a593Smuzhiyun int core;
115*4882a593Smuzhiyun
116*4882a593Smuzhiyun for (core = 0; core < ARRAY_SIZE(cluster->info->cpus); core++) {
117*4882a593Smuzhiyun if (cluster->info->cpus[core] != policy->cpu)
118*4882a593Smuzhiyun continue;
119*4882a593Smuzhiyun
120*4882a593Smuzhiyun freq = (cluster->ref_clk_khz * ndiv) / cluster->div;
121*4882a593Smuzhiyun goto out;
122*4882a593Smuzhiyun }
123*4882a593Smuzhiyun }
124*4882a593Smuzhiyun
125*4882a593Smuzhiyun out:
126*4882a593Smuzhiyun cpufreq_cpu_put(policy);
127*4882a593Smuzhiyun
128*4882a593Smuzhiyun return freq;
129*4882a593Smuzhiyun }
130*4882a593Smuzhiyun
131*4882a593Smuzhiyun static struct cpufreq_driver tegra186_cpufreq_driver = {
132*4882a593Smuzhiyun .name = "tegra186",
133*4882a593Smuzhiyun .flags = CPUFREQ_STICKY | CPUFREQ_HAVE_GOVERNOR_PER_POLICY |
134*4882a593Smuzhiyun CPUFREQ_NEED_INITIAL_FREQ_CHECK,
135*4882a593Smuzhiyun .get = tegra186_cpufreq_get,
136*4882a593Smuzhiyun .verify = cpufreq_generic_frequency_table_verify,
137*4882a593Smuzhiyun .target_index = tegra186_cpufreq_set_target,
138*4882a593Smuzhiyun .init = tegra186_cpufreq_init,
139*4882a593Smuzhiyun .attr = cpufreq_generic_attr,
140*4882a593Smuzhiyun };
141*4882a593Smuzhiyun
init_vhint_table(struct platform_device * pdev,struct tegra_bpmp * bpmp,struct tegra186_cpufreq_cluster * cluster)142*4882a593Smuzhiyun static struct cpufreq_frequency_table *init_vhint_table(
143*4882a593Smuzhiyun struct platform_device *pdev, struct tegra_bpmp *bpmp,
144*4882a593Smuzhiyun struct tegra186_cpufreq_cluster *cluster)
145*4882a593Smuzhiyun {
146*4882a593Smuzhiyun struct cpufreq_frequency_table *table;
147*4882a593Smuzhiyun struct mrq_cpu_vhint_request req;
148*4882a593Smuzhiyun struct tegra_bpmp_message msg;
149*4882a593Smuzhiyun struct cpu_vhint_data *data;
150*4882a593Smuzhiyun int err, i, j, num_rates = 0;
151*4882a593Smuzhiyun dma_addr_t phys;
152*4882a593Smuzhiyun void *virt;
153*4882a593Smuzhiyun
154*4882a593Smuzhiyun virt = dma_alloc_coherent(bpmp->dev, sizeof(*data), &phys,
155*4882a593Smuzhiyun GFP_KERNEL);
156*4882a593Smuzhiyun if (!virt)
157*4882a593Smuzhiyun return ERR_PTR(-ENOMEM);
158*4882a593Smuzhiyun
159*4882a593Smuzhiyun data = (struct cpu_vhint_data *)virt;
160*4882a593Smuzhiyun
161*4882a593Smuzhiyun memset(&req, 0, sizeof(req));
162*4882a593Smuzhiyun req.addr = phys;
163*4882a593Smuzhiyun req.cluster_id = cluster->info->bpmp_cluster_id;
164*4882a593Smuzhiyun
165*4882a593Smuzhiyun memset(&msg, 0, sizeof(msg));
166*4882a593Smuzhiyun msg.mrq = MRQ_CPU_VHINT;
167*4882a593Smuzhiyun msg.tx.data = &req;
168*4882a593Smuzhiyun msg.tx.size = sizeof(req);
169*4882a593Smuzhiyun
170*4882a593Smuzhiyun err = tegra_bpmp_transfer(bpmp, &msg);
171*4882a593Smuzhiyun if (err) {
172*4882a593Smuzhiyun table = ERR_PTR(err);
173*4882a593Smuzhiyun goto free;
174*4882a593Smuzhiyun }
175*4882a593Smuzhiyun
176*4882a593Smuzhiyun for (i = data->vfloor; i <= data->vceil; i++) {
177*4882a593Smuzhiyun u16 ndiv = data->ndiv[i];
178*4882a593Smuzhiyun
179*4882a593Smuzhiyun if (ndiv < data->ndiv_min || ndiv > data->ndiv_max)
180*4882a593Smuzhiyun continue;
181*4882a593Smuzhiyun
182*4882a593Smuzhiyun /* Only store lowest voltage index for each rate */
183*4882a593Smuzhiyun if (i > 0 && ndiv == data->ndiv[i - 1])
184*4882a593Smuzhiyun continue;
185*4882a593Smuzhiyun
186*4882a593Smuzhiyun num_rates++;
187*4882a593Smuzhiyun }
188*4882a593Smuzhiyun
189*4882a593Smuzhiyun table = devm_kcalloc(&pdev->dev, num_rates + 1, sizeof(*table),
190*4882a593Smuzhiyun GFP_KERNEL);
191*4882a593Smuzhiyun if (!table) {
192*4882a593Smuzhiyun table = ERR_PTR(-ENOMEM);
193*4882a593Smuzhiyun goto free;
194*4882a593Smuzhiyun }
195*4882a593Smuzhiyun
196*4882a593Smuzhiyun cluster->ref_clk_khz = data->ref_clk_hz / 1000;
197*4882a593Smuzhiyun cluster->div = data->pdiv * data->mdiv;
198*4882a593Smuzhiyun
199*4882a593Smuzhiyun for (i = data->vfloor, j = 0; i <= data->vceil; i++) {
200*4882a593Smuzhiyun struct cpufreq_frequency_table *point;
201*4882a593Smuzhiyun u16 ndiv = data->ndiv[i];
202*4882a593Smuzhiyun u32 edvd_val = 0;
203*4882a593Smuzhiyun
204*4882a593Smuzhiyun if (ndiv < data->ndiv_min || ndiv > data->ndiv_max)
205*4882a593Smuzhiyun continue;
206*4882a593Smuzhiyun
207*4882a593Smuzhiyun /* Only store lowest voltage index for each rate */
208*4882a593Smuzhiyun if (i > 0 && ndiv == data->ndiv[i - 1])
209*4882a593Smuzhiyun continue;
210*4882a593Smuzhiyun
211*4882a593Smuzhiyun edvd_val |= i << EDVD_CORE_VOLT_FREQ_V_SHIFT;
212*4882a593Smuzhiyun edvd_val |= ndiv << EDVD_CORE_VOLT_FREQ_F_SHIFT;
213*4882a593Smuzhiyun
214*4882a593Smuzhiyun point = &table[j++];
215*4882a593Smuzhiyun point->driver_data = edvd_val;
216*4882a593Smuzhiyun point->frequency = (cluster->ref_clk_khz * ndiv) / cluster->div;
217*4882a593Smuzhiyun }
218*4882a593Smuzhiyun
219*4882a593Smuzhiyun table[j].frequency = CPUFREQ_TABLE_END;
220*4882a593Smuzhiyun
221*4882a593Smuzhiyun free:
222*4882a593Smuzhiyun dma_free_coherent(bpmp->dev, sizeof(*data), virt, phys);
223*4882a593Smuzhiyun
224*4882a593Smuzhiyun return table;
225*4882a593Smuzhiyun }
226*4882a593Smuzhiyun
tegra186_cpufreq_probe(struct platform_device * pdev)227*4882a593Smuzhiyun static int tegra186_cpufreq_probe(struct platform_device *pdev)
228*4882a593Smuzhiyun {
229*4882a593Smuzhiyun struct tegra186_cpufreq_data *data;
230*4882a593Smuzhiyun struct tegra_bpmp *bpmp;
231*4882a593Smuzhiyun unsigned int i = 0, err;
232*4882a593Smuzhiyun
233*4882a593Smuzhiyun data = devm_kzalloc(&pdev->dev, sizeof(*data), GFP_KERNEL);
234*4882a593Smuzhiyun if (!data)
235*4882a593Smuzhiyun return -ENOMEM;
236*4882a593Smuzhiyun
237*4882a593Smuzhiyun data->clusters = devm_kcalloc(&pdev->dev, ARRAY_SIZE(tegra186_clusters),
238*4882a593Smuzhiyun sizeof(*data->clusters), GFP_KERNEL);
239*4882a593Smuzhiyun if (!data->clusters)
240*4882a593Smuzhiyun return -ENOMEM;
241*4882a593Smuzhiyun
242*4882a593Smuzhiyun data->num_clusters = ARRAY_SIZE(tegra186_clusters);
243*4882a593Smuzhiyun
244*4882a593Smuzhiyun bpmp = tegra_bpmp_get(&pdev->dev);
245*4882a593Smuzhiyun if (IS_ERR(bpmp))
246*4882a593Smuzhiyun return PTR_ERR(bpmp);
247*4882a593Smuzhiyun
248*4882a593Smuzhiyun data->regs = devm_platform_ioremap_resource(pdev, 0);
249*4882a593Smuzhiyun if (IS_ERR(data->regs)) {
250*4882a593Smuzhiyun err = PTR_ERR(data->regs);
251*4882a593Smuzhiyun goto put_bpmp;
252*4882a593Smuzhiyun }
253*4882a593Smuzhiyun
254*4882a593Smuzhiyun for (i = 0; i < data->num_clusters; i++) {
255*4882a593Smuzhiyun struct tegra186_cpufreq_cluster *cluster = &data->clusters[i];
256*4882a593Smuzhiyun
257*4882a593Smuzhiyun cluster->info = &tegra186_clusters[i];
258*4882a593Smuzhiyun cluster->table = init_vhint_table(pdev, bpmp, cluster);
259*4882a593Smuzhiyun if (IS_ERR(cluster->table)) {
260*4882a593Smuzhiyun err = PTR_ERR(cluster->table);
261*4882a593Smuzhiyun goto put_bpmp;
262*4882a593Smuzhiyun }
263*4882a593Smuzhiyun }
264*4882a593Smuzhiyun
265*4882a593Smuzhiyun tegra186_cpufreq_driver.driver_data = data;
266*4882a593Smuzhiyun
267*4882a593Smuzhiyun err = cpufreq_register_driver(&tegra186_cpufreq_driver);
268*4882a593Smuzhiyun
269*4882a593Smuzhiyun put_bpmp:
270*4882a593Smuzhiyun tegra_bpmp_put(bpmp);
271*4882a593Smuzhiyun
272*4882a593Smuzhiyun return err;
273*4882a593Smuzhiyun }
274*4882a593Smuzhiyun
tegra186_cpufreq_remove(struct platform_device * pdev)275*4882a593Smuzhiyun static int tegra186_cpufreq_remove(struct platform_device *pdev)
276*4882a593Smuzhiyun {
277*4882a593Smuzhiyun cpufreq_unregister_driver(&tegra186_cpufreq_driver);
278*4882a593Smuzhiyun
279*4882a593Smuzhiyun return 0;
280*4882a593Smuzhiyun }
281*4882a593Smuzhiyun
282*4882a593Smuzhiyun static const struct of_device_id tegra186_cpufreq_of_match[] = {
283*4882a593Smuzhiyun { .compatible = "nvidia,tegra186-ccplex-cluster", },
284*4882a593Smuzhiyun { }
285*4882a593Smuzhiyun };
286*4882a593Smuzhiyun MODULE_DEVICE_TABLE(of, tegra186_cpufreq_of_match);
287*4882a593Smuzhiyun
288*4882a593Smuzhiyun static struct platform_driver tegra186_cpufreq_platform_driver = {
289*4882a593Smuzhiyun .driver = {
290*4882a593Smuzhiyun .name = "tegra186-cpufreq",
291*4882a593Smuzhiyun .of_match_table = tegra186_cpufreq_of_match,
292*4882a593Smuzhiyun },
293*4882a593Smuzhiyun .probe = tegra186_cpufreq_probe,
294*4882a593Smuzhiyun .remove = tegra186_cpufreq_remove,
295*4882a593Smuzhiyun };
296*4882a593Smuzhiyun module_platform_driver(tegra186_cpufreq_platform_driver);
297*4882a593Smuzhiyun
298*4882a593Smuzhiyun MODULE_AUTHOR("Mikko Perttunen <mperttunen@nvidia.com>");
299*4882a593Smuzhiyun MODULE_DESCRIPTION("NVIDIA Tegra186 cpufreq driver");
300*4882a593Smuzhiyun MODULE_LICENSE("GPL v2");
301