percpu, x86: don't use PMD_SIZE as embedded atom_size on 32bit
[zen-stable.git] / drivers / gpu / drm / nouveau / nvc0_pm.c
blobe9992f62c1c0f97da00b8c04c5fdaca6d5c0f13b
1 /*
2 * Copyright 2011 Red Hat Inc.
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
22 * Authors: Ben Skeggs
25 #include "drmP.h"
26 #include "nouveau_drv.h"
27 #include "nouveau_bios.h"
28 #include "nouveau_pm.h"
30 static u32 read_div(struct drm_device *, int, u32, u32);
31 static u32 read_pll(struct drm_device *, u32);
33 static u32
34 read_vco(struct drm_device *dev, u32 dsrc)
36 u32 ssrc = nv_rd32(dev, dsrc);
37 if (!(ssrc & 0x00000100))
38 return read_pll(dev, 0x00e800);
39 return read_pll(dev, 0x00e820);
42 static u32
43 read_pll(struct drm_device *dev, u32 pll)
45 u32 ctrl = nv_rd32(dev, pll + 0);
46 u32 coef = nv_rd32(dev, pll + 4);
47 u32 P = (coef & 0x003f0000) >> 16;
48 u32 N = (coef & 0x0000ff00) >> 8;
49 u32 M = (coef & 0x000000ff) >> 0;
50 u32 sclk, doff;
52 if (!(ctrl & 0x00000001))
53 return 0;
55 switch (pll & 0xfff000) {
56 case 0x00e000:
57 sclk = 27000;
58 P = 1;
59 break;
60 case 0x137000:
61 doff = (pll - 0x137000) / 0x20;
62 sclk = read_div(dev, doff, 0x137120, 0x137140);
63 break;
64 case 0x132000:
65 switch (pll) {
66 case 0x132000:
67 sclk = read_pll(dev, 0x132020);
68 break;
69 case 0x132020:
70 sclk = read_div(dev, 0, 0x137320, 0x137330);
71 break;
72 default:
73 return 0;
75 break;
76 default:
77 return 0;
80 return sclk * N / M / P;
83 static u32
84 read_div(struct drm_device *dev, int doff, u32 dsrc, u32 dctl)
86 u32 ssrc = nv_rd32(dev, dsrc + (doff * 4));
87 u32 sctl = nv_rd32(dev, dctl + (doff * 4));
89 switch (ssrc & 0x00000003) {
90 case 0:
91 if ((ssrc & 0x00030000) != 0x00030000)
92 return 27000;
93 return 108000;
94 case 2:
95 return 100000;
96 case 3:
97 if (sctl & 0x80000000) {
98 u32 sclk = read_vco(dev, dsrc + (doff * 4));
99 u32 sdiv = (sctl & 0x0000003f) + 2;
100 return (sclk * 2) / sdiv;
103 return read_vco(dev, dsrc + (doff * 4));
104 default:
105 return 0;
109 static u32
110 read_mem(struct drm_device *dev)
112 u32 ssel = nv_rd32(dev, 0x1373f0);
113 if (ssel & 0x00000001)
114 return read_div(dev, 0, 0x137300, 0x137310);
115 return read_pll(dev, 0x132000);
118 static u32
119 read_clk(struct drm_device *dev, int clk)
121 u32 sctl = nv_rd32(dev, 0x137250 + (clk * 4));
122 u32 ssel = nv_rd32(dev, 0x137100);
123 u32 sclk, sdiv;
125 if (ssel & (1 << clk)) {
126 if (clk < 7)
127 sclk = read_pll(dev, 0x137000 + (clk * 0x20));
128 else
129 sclk = read_pll(dev, 0x1370e0);
130 sdiv = ((sctl & 0x00003f00) >> 8) + 2;
131 } else {
132 sclk = read_div(dev, clk, 0x137160, 0x1371d0);
133 sdiv = ((sctl & 0x0000003f) >> 0) + 2;
136 if (sctl & 0x80000000)
137 return (sclk * 2) / sdiv;
138 return sclk;
142 nvc0_pm_clocks_get(struct drm_device *dev, struct nouveau_pm_level *perflvl)
144 perflvl->shader = read_clk(dev, 0x00);
145 perflvl->core = perflvl->shader / 2;
146 perflvl->memory = read_mem(dev);
147 perflvl->rop = read_clk(dev, 0x01);
148 perflvl->hub07 = read_clk(dev, 0x02);
149 perflvl->hub06 = read_clk(dev, 0x07);
150 perflvl->hub01 = read_clk(dev, 0x08);
151 perflvl->copy = read_clk(dev, 0x09);
152 perflvl->daemon = read_clk(dev, 0x0c);
153 perflvl->vdec = read_clk(dev, 0x0e);
154 return 0;
157 struct nvc0_pm_clock {
158 u32 freq;
159 u32 ssel;
160 u32 mdiv;
161 u32 dsrc;
162 u32 ddiv;
163 u32 coef;
166 struct nvc0_pm_state {
167 struct nvc0_pm_clock eng[16];
170 static u32
171 calc_div(struct drm_device *dev, int clk, u32 ref, u32 freq, u32 *ddiv)
173 u32 div = min((ref * 2) / freq, (u32)65);
174 if (div < 2)
175 div = 2;
177 *ddiv = div - 2;
178 return (ref * 2) / div;
181 static u32
182 calc_src(struct drm_device *dev, int clk, u32 freq, u32 *dsrc, u32 *ddiv)
184 u32 sclk;
186 /* use one of the fixed frequencies if possible */
187 *ddiv = 0x00000000;
188 switch (freq) {
189 case 27000:
190 case 108000:
191 *dsrc = 0x00000000;
192 if (freq == 108000)
193 *dsrc |= 0x00030000;
194 return freq;
195 case 100000:
196 *dsrc = 0x00000002;
197 return freq;
198 default:
199 *dsrc = 0x00000003;
200 break;
203 /* otherwise, calculate the closest divider */
204 sclk = read_vco(dev, clk);
205 if (clk < 7)
206 sclk = calc_div(dev, clk, sclk, freq, ddiv);
207 return sclk;
210 static u32
211 calc_pll(struct drm_device *dev, int clk, u32 freq, u32 *coef)
213 struct pll_lims limits;
214 int N, M, P, ret;
216 ret = get_pll_limits(dev, 0x137000 + (clk * 0x20), &limits);
217 if (ret)
218 return 0;
220 limits.refclk = read_div(dev, clk, 0x137120, 0x137140);
221 if (!limits.refclk)
222 return 0;
224 ret = nva3_calc_pll(dev, &limits, freq, &N, NULL, &M, &P);
225 if (ret <= 0)
226 return 0;
228 *coef = (P << 16) | (N << 8) | M;
229 return ret;
232 /* A (likely rather simplified and incomplete) view of the clock tree
234 * Key:
236 * S: source select
237 * D: divider
238 * P: pll
239 * F: switch
241 * Engine clocks:
243 * 137250(D) ---- 137100(F0) ---- 137160(S)/1371d0(D) ------------------- ref
244 * (F1) ---- 1370X0(P) ---- 137120(S)/137140(D) ---- ref
246 * Not all registers exist for all clocks. For example: clocks >= 8 don't
247 * have their own PLL (all tied to clock 7's PLL when in PLL mode), nor do
248 * they have the divider at 1371d0, though the source selection at 137160
249 * still exists. You must use the divider at 137250 for these instead.
251 * Memory clock:
253 * TBD, read_mem() above is likely very wrong...
257 static int
258 calc_clk(struct drm_device *dev, int clk, struct nvc0_pm_clock *info, u32 freq)
260 u32 src0, div0, div1D, div1P = 0;
261 u32 clk0, clk1 = 0;
263 /* invalid clock domain */
264 if (!freq)
265 return 0;
267 /* first possible path, using only dividers */
268 clk0 = calc_src(dev, clk, freq, &src0, &div0);
269 clk0 = calc_div(dev, clk, clk0, freq, &div1D);
271 /* see if we can get any closer using PLLs */
272 if (clk0 != freq) {
273 if (clk < 7)
274 clk1 = calc_pll(dev, clk, freq, &info->coef);
275 else
276 clk1 = read_pll(dev, 0x1370e0);
277 clk1 = calc_div(dev, clk, clk1, freq, &div1P);
280 /* select the method which gets closest to target freq */
281 if (abs((int)freq - clk0) <= abs((int)freq - clk1)) {
282 info->dsrc = src0;
283 if (div0) {
284 info->ddiv |= 0x80000000;
285 info->ddiv |= div0 << 8;
286 info->ddiv |= div0;
288 if (div1D) {
289 info->mdiv |= 0x80000000;
290 info->mdiv |= div1D;
292 info->ssel = 0;
293 info->freq = clk0;
294 } else {
295 if (div1P) {
296 info->mdiv |= 0x80000000;
297 info->mdiv |= div1P << 8;
299 info->ssel = (1 << clk);
300 info->freq = clk1;
303 return 0;
306 void *
307 nvc0_pm_clocks_pre(struct drm_device *dev, struct nouveau_pm_level *perflvl)
309 struct drm_nouveau_private *dev_priv = dev->dev_private;
310 struct nvc0_pm_state *info;
311 int ret;
313 info = kzalloc(sizeof(*info), GFP_KERNEL);
314 if (!info)
315 return ERR_PTR(-ENOMEM);
317 /* NFI why this is still in the performance table, the ROPCs appear
318 * to get their clock from clock 2 ("hub07", actually hub05 on this
319 * chip, but, anyway...) as well. nvatiming confirms hub05 and ROP
320 * are always the same freq with the binary driver even when the
321 * performance table says they should differ.
323 if (dev_priv->chipset == 0xd9)
324 perflvl->rop = 0;
326 if ((ret = calc_clk(dev, 0x00, &info->eng[0x00], perflvl->shader)) ||
327 (ret = calc_clk(dev, 0x01, &info->eng[0x01], perflvl->rop)) ||
328 (ret = calc_clk(dev, 0x02, &info->eng[0x02], perflvl->hub07)) ||
329 (ret = calc_clk(dev, 0x07, &info->eng[0x07], perflvl->hub06)) ||
330 (ret = calc_clk(dev, 0x08, &info->eng[0x08], perflvl->hub01)) ||
331 (ret = calc_clk(dev, 0x09, &info->eng[0x09], perflvl->copy)) ||
332 (ret = calc_clk(dev, 0x0c, &info->eng[0x0c], perflvl->daemon)) ||
333 (ret = calc_clk(dev, 0x0e, &info->eng[0x0e], perflvl->vdec))) {
334 kfree(info);
335 return ERR_PTR(ret);
338 return info;
341 static void
342 prog_clk(struct drm_device *dev, int clk, struct nvc0_pm_clock *info)
344 /* program dividers at 137160/1371d0 first */
345 if (clk < 7 && !info->ssel) {
346 nv_mask(dev, 0x1371d0 + (clk * 0x04), 0x80003f3f, info->ddiv);
347 nv_wr32(dev, 0x137160 + (clk * 0x04), info->dsrc);
350 /* switch clock to non-pll mode */
351 nv_mask(dev, 0x137100, (1 << clk), 0x00000000);
352 nv_wait(dev, 0x137100, (1 << clk), 0x00000000);
354 /* reprogram pll */
355 if (clk < 7) {
356 /* make sure it's disabled first... */
357 u32 base = 0x137000 + (clk * 0x20);
358 u32 ctrl = nv_rd32(dev, base + 0x00);
359 if (ctrl & 0x00000001) {
360 nv_mask(dev, base + 0x00, 0x00000004, 0x00000000);
361 nv_mask(dev, base + 0x00, 0x00000001, 0x00000000);
363 /* program it to new values, if necessary */
364 if (info->ssel) {
365 nv_wr32(dev, base + 0x04, info->coef);
366 nv_mask(dev, base + 0x00, 0x00000001, 0x00000001);
367 nv_wait(dev, base + 0x00, 0x00020000, 0x00020000);
368 nv_mask(dev, base + 0x00, 0x00020004, 0x00000004);
372 /* select pll/non-pll mode, and program final clock divider */
373 nv_mask(dev, 0x137100, (1 << clk), info->ssel);
374 nv_wait(dev, 0x137100, (1 << clk), info->ssel);
375 nv_mask(dev, 0x137250 + (clk * 0x04), 0x00003f3f, info->mdiv);
379 nvc0_pm_clocks_set(struct drm_device *dev, void *data)
381 struct nvc0_pm_state *info = data;
382 int i;
384 for (i = 0; i < 16; i++) {
385 if (!info->eng[i].freq)
386 continue;
387 prog_clk(dev, i, &info->eng[i]);
390 kfree(info);
391 return 0;