xref: /linux/drivers/gpu/drm/nouveau/nvkm/subdev/fb/ramgt215.c (revision e0a37f85fc95e3f2550446316bc4a27d00d75993)
1 /*
2  * Copyright 2013 Red Hat Inc.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice shall be included in
12  * all copies or substantial portions of the Software.
13  *
14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20  * OTHER DEALINGS IN THE SOFTWARE.
21  *
22  * Authors: Ben Skeggs
23  * 	    Roy Spliet <rspliet@eclipso.eu>
24  */
25 #define gt215_ram(p) container_of((p), struct gt215_ram, base)
26 #include "ram.h"
27 #include "ramfuc.h"
28 
29 #include <core/option.h>
30 #include <subdev/bios.h>
31 #include <subdev/bios/M0205.h>
32 #include <subdev/bios/rammap.h>
33 #include <subdev/bios/timing.h>
34 #include <subdev/clk/gt215.h>
35 #include <subdev/gpio.h>
36 
37 struct gt215_ramfuc {
38 	struct ramfuc base;
39 	struct ramfuc_reg r_0x001610;
40 	struct ramfuc_reg r_0x001700;
41 	struct ramfuc_reg r_0x002504;
42 	struct ramfuc_reg r_0x004000;
43 	struct ramfuc_reg r_0x004004;
44 	struct ramfuc_reg r_0x004018;
45 	struct ramfuc_reg r_0x004128;
46 	struct ramfuc_reg r_0x004168;
47 	struct ramfuc_reg r_0x100080;
48 	struct ramfuc_reg r_0x100200;
49 	struct ramfuc_reg r_0x100210;
50 	struct ramfuc_reg r_0x100220[9];
51 	struct ramfuc_reg r_0x100264;
52 	struct ramfuc_reg r_0x1002d0;
53 	struct ramfuc_reg r_0x1002d4;
54 	struct ramfuc_reg r_0x1002dc;
55 	struct ramfuc_reg r_0x10053c;
56 	struct ramfuc_reg r_0x1005a0;
57 	struct ramfuc_reg r_0x1005a4;
58 	struct ramfuc_reg r_0x100700;
59 	struct ramfuc_reg r_0x100714;
60 	struct ramfuc_reg r_0x100718;
61 	struct ramfuc_reg r_0x10071c;
62 	struct ramfuc_reg r_0x100720;
63 	struct ramfuc_reg r_0x100760;
64 	struct ramfuc_reg r_0x1007a0;
65 	struct ramfuc_reg r_0x1007e0;
66 	struct ramfuc_reg r_0x100da0;
67 	struct ramfuc_reg r_0x10f804;
68 	struct ramfuc_reg r_0x1110e0;
69 	struct ramfuc_reg r_0x111100;
70 	struct ramfuc_reg r_0x111104;
71 	struct ramfuc_reg r_0x1111e0;
72 	struct ramfuc_reg r_0x111400;
73 	struct ramfuc_reg r_0x611200;
74 	struct ramfuc_reg r_mr[4];
75 	struct ramfuc_reg r_gpio[4];
76 };
77 
78 struct gt215_ltrain {
79 	enum {
80 		NVA3_TRAIN_UNKNOWN,
81 		NVA3_TRAIN_UNSUPPORTED,
82 		NVA3_TRAIN_ONCE,
83 		NVA3_TRAIN_EXEC,
84 		NVA3_TRAIN_DONE
85 	} state;
86 	u32 r_100720;
87 	u32 r_1111e0;
88 	u32 r_111400;
89 	struct nvkm_mem *mem;
90 };
91 
92 struct gt215_ram {
93 	struct nvkm_ram base;
94 	struct gt215_ramfuc fuc;
95 	struct gt215_ltrain ltrain;
96 };
97 
98 void
99 gt215_link_train_calc(u32 *vals, struct gt215_ltrain *train)
100 {
101 	int i, lo, hi;
102 	u8 median[8], bins[4] = {0, 0, 0, 0}, bin = 0, qty = 0;
103 
104 	for (i = 0; i < 8; i++) {
105 		for (lo = 0; lo < 0x40; lo++) {
106 			if (!(vals[lo] & 0x80000000))
107 				continue;
108 			if (vals[lo] & (0x101 << i))
109 				break;
110 		}
111 
112 		if (lo == 0x40)
113 			return;
114 
115 		for (hi = lo + 1; hi < 0x40; hi++) {
116 			if (!(vals[lo] & 0x80000000))
117 				continue;
118 			if (!(vals[hi] & (0x101 << i))) {
119 				hi--;
120 				break;
121 			}
122 		}
123 
124 		median[i] = ((hi - lo) >> 1) + lo;
125 		bins[(median[i] & 0xf0) >> 4]++;
126 		median[i] += 0x30;
127 	}
128 
129 	/* Find the best value for 0x1111e0 */
130 	for (i = 0; i < 4; i++) {
131 		if (bins[i] > qty) {
132 			bin = i + 3;
133 			qty = bins[i];
134 		}
135 	}
136 
137 	train->r_100720 = 0;
138 	for (i = 0; i < 8; i++) {
139 		median[i] = max(median[i], (u8) (bin << 4));
140 		median[i] = min(median[i], (u8) ((bin << 4) | 0xf));
141 
142 		train->r_100720 |= ((median[i] & 0x0f) << (i << 2));
143 	}
144 
145 	train->r_1111e0 = 0x02000000 | (bin * 0x101);
146 	train->r_111400 = 0x0;
147 }
148 
149 /*
150  * Link training for (at least) DDR3
151  */
152 int
153 gt215_link_train(struct gt215_ram *ram)
154 {
155 	struct gt215_ltrain *train = &ram->ltrain;
156 	struct gt215_ramfuc *fuc = &ram->fuc;
157 	struct nvkm_subdev *subdev = &ram->base.fb->subdev;
158 	struct nvkm_device *device = subdev->device;
159 	struct nvkm_bios *bios = device->bios;
160 	struct nvkm_clk *clk = device->clk;
161 	u32 *result, r1700;
162 	int ret, i;
163 	struct nvbios_M0205T M0205T = { 0 };
164 	u8 ver, hdr, cnt, len, snr, ssz;
165 	unsigned int clk_current;
166 	unsigned long flags;
167 	unsigned long *f = &flags;
168 
169 	if (nvkm_boolopt(device->cfgopt, "NvMemExec", true) != true)
170 		return -ENOSYS;
171 
172 	/* XXX: Multiple partitions? */
173 	result = kmalloc(64 * sizeof(u32), GFP_KERNEL);
174 	if (!result)
175 		return -ENOMEM;
176 
177 	train->state = NVA3_TRAIN_EXEC;
178 
179 	/* Clock speeds for training and back */
180 	nvbios_M0205Tp(bios, &ver, &hdr, &cnt, &len, &snr, &ssz, &M0205T);
181 	if (M0205T.freq == 0) {
182 		kfree(result);
183 		return -ENOENT;
184 	}
185 
186 	clk_current = nvkm_clk_read(clk, nv_clk_src_mem);
187 
188 	ret = gt215_clk_pre(clk, f);
189 	if (ret)
190 		goto out;
191 
192 	/* First: clock up/down */
193 	ret = ram->base.func->calc(&ram->base, (u32) M0205T.freq * 1000);
194 	if (ret)
195 		goto out;
196 
197 	/* Do this *after* calc, eliminates write in script */
198 	nvkm_wr32(device, 0x111400, 0x00000000);
199 	/* XXX: Magic writes that improve train reliability? */
200 	nvkm_mask(device, 0x100674, 0x0000ffff, 0x00000000);
201 	nvkm_mask(device, 0x1005e4, 0x0000ffff, 0x00000000);
202 	nvkm_mask(device, 0x100b0c, 0x000000ff, 0x00000000);
203 	nvkm_wr32(device, 0x100c04, 0x00000400);
204 
205 	/* Now the training script */
206 	r1700 = ram_rd32(fuc, 0x001700);
207 
208 	ram_mask(fuc, 0x100200, 0x00000800, 0x00000000);
209 	ram_wr32(fuc, 0x611200, 0x3300);
210 	ram_wait_vblank(fuc);
211 	ram_wait(fuc, 0x611200, 0x00000003, 0x00000000, 500000);
212 	ram_mask(fuc, 0x001610, 0x00000083, 0x00000003);
213 	ram_mask(fuc, 0x100080, 0x00000020, 0x00000000);
214 	ram_mask(fuc, 0x10f804, 0x80000000, 0x00000000);
215 	ram_wr32(fuc, 0x001700, 0x00000000);
216 
217 	ram_train(fuc);
218 
219 	/* Reset */
220 	ram_mask(fuc, 0x10f804, 0x80000000, 0x80000000);
221 	ram_wr32(fuc, 0x10053c, 0x0);
222 	ram_wr32(fuc, 0x100720, train->r_100720);
223 	ram_wr32(fuc, 0x1111e0, train->r_1111e0);
224 	ram_wr32(fuc, 0x111400, train->r_111400);
225 	ram_nuke(fuc, 0x100080);
226 	ram_mask(fuc, 0x100080, 0x00000020, 0x00000020);
227 	ram_nsec(fuc, 1000);
228 
229 	ram_wr32(fuc, 0x001700, r1700);
230 	ram_mask(fuc, 0x001610, 0x00000083, 0x00000080);
231 	ram_wr32(fuc, 0x611200, 0x3330);
232 	ram_mask(fuc, 0x100200, 0x00000800, 0x00000800);
233 
234 	ram_exec(fuc, true);
235 
236 	ram->base.func->calc(&ram->base, clk_current);
237 	ram_exec(fuc, true);
238 
239 	/* Post-processing, avoids flicker */
240 	nvkm_mask(device, 0x616308, 0x10, 0x10);
241 	nvkm_mask(device, 0x616b08, 0x10, 0x10);
242 
243 	gt215_clk_post(clk, f);
244 
245 	ram_train_result(ram->base.fb, result, 64);
246 	for (i = 0; i < 64; i++)
247 		nvkm_debug(subdev, "Train: %08x", result[i]);
248 	gt215_link_train_calc(result, train);
249 
250 	nvkm_debug(subdev, "Train: %08x %08x %08x", train->r_100720,
251 		   train->r_1111e0, train->r_111400);
252 
253 	kfree(result);
254 
255 	train->state = NVA3_TRAIN_DONE;
256 
257 	return ret;
258 
259 out:
260 	if(ret == -EBUSY)
261 		f = NULL;
262 
263 	train->state = NVA3_TRAIN_UNSUPPORTED;
264 
265 	gt215_clk_post(clk, f);
266 	kfree(result);
267 	return ret;
268 }
269 
270 int
271 gt215_link_train_init(struct gt215_ram *ram)
272 {
273 	static const u32 pattern[16] = {
274 		0xaaaaaaaa, 0xcccccccc, 0xdddddddd, 0xeeeeeeee,
275 		0x00000000, 0x11111111, 0x44444444, 0xdddddddd,
276 		0x33333333, 0x55555555, 0x77777777, 0x66666666,
277 		0x99999999, 0x88888888, 0xeeeeeeee, 0xbbbbbbbb,
278 	};
279 	struct gt215_ltrain *train = &ram->ltrain;
280 	struct nvkm_device *device = ram->base.fb->subdev.device;
281 	struct nvkm_bios *bios = device->bios;
282 	struct nvkm_mem *mem;
283 	struct nvbios_M0205E M0205E;
284 	u8 ver, hdr, cnt, len;
285 	u32 r001700;
286 	int ret, i = 0;
287 
288 	train->state = NVA3_TRAIN_UNSUPPORTED;
289 
290 	/* We support type "5"
291 	 * XXX: training pattern table appears to be unused for this routine */
292 	if (!nvbios_M0205Ep(bios, i, &ver, &hdr, &cnt, &len, &M0205E))
293 		return -ENOENT;
294 
295 	if (M0205E.type != 5)
296 		return 0;
297 
298 	train->state = NVA3_TRAIN_ONCE;
299 
300 	ret = ram->base.func->get(&ram->base, 0x8000, 0x10000, 0, 0x800,
301 				  &ram->ltrain.mem);
302 	if (ret)
303 		return ret;
304 
305 	mem = ram->ltrain.mem;
306 
307 	nvkm_wr32(device, 0x100538, 0x10000000 | (mem->offset >> 16));
308 	nvkm_wr32(device, 0x1005a8, 0x0000ffff);
309 	nvkm_mask(device, 0x10f800, 0x00000001, 0x00000001);
310 
311 	for (i = 0; i < 0x30; i++) {
312 		nvkm_wr32(device, 0x10f8c0, (i << 8) | i);
313 		nvkm_wr32(device, 0x10f900, pattern[i % 16]);
314 	}
315 
316 	for (i = 0; i < 0x30; i++) {
317 		nvkm_wr32(device, 0x10f8e0, (i << 8) | i);
318 		nvkm_wr32(device, 0x10f920, pattern[i % 16]);
319 	}
320 
321 	/* And upload the pattern */
322 	r001700 = nvkm_rd32(device, 0x1700);
323 	nvkm_wr32(device, 0x1700, mem->offset >> 16);
324 	for (i = 0; i < 16; i++)
325 		nvkm_wr32(device, 0x700000 + (i << 2), pattern[i]);
326 	for (i = 0; i < 16; i++)
327 		nvkm_wr32(device, 0x700100 + (i << 2), pattern[i]);
328 	nvkm_wr32(device, 0x1700, r001700);
329 
330 	train->r_100720 = nvkm_rd32(device, 0x100720);
331 	train->r_1111e0 = nvkm_rd32(device, 0x1111e0);
332 	train->r_111400 = nvkm_rd32(device, 0x111400);
333 	return 0;
334 }
335 
336 void
337 gt215_link_train_fini(struct gt215_ram *ram)
338 {
339 	if (ram->ltrain.mem)
340 		ram->base.func->put(&ram->base, &ram->ltrain.mem);
341 }
342 
343 /*
344  * RAM reclocking
345  */
346 #define T(t) cfg->timing_10_##t
347 static int
348 gt215_ram_timing_calc(struct gt215_ram *ram, u32 *timing)
349 {
350 	struct nvbios_ramcfg *cfg = &ram->base.target.bios;
351 	struct nvkm_subdev *subdev = &ram->base.fb->subdev;
352 	struct nvkm_device *device = subdev->device;
353 	int tUNK_base, tUNK_40_0, prevCL;
354 	u32 cur2, cur3, cur7, cur8;
355 
356 	cur2 = nvkm_rd32(device, 0x100228);
357 	cur3 = nvkm_rd32(device, 0x10022c);
358 	cur7 = nvkm_rd32(device, 0x10023c);
359 	cur8 = nvkm_rd32(device, 0x100240);
360 
361 
362 	switch ((!T(CWL)) * ram->base.type) {
363 	case NVKM_RAM_TYPE_DDR2:
364 		T(CWL) = T(CL) - 1;
365 		break;
366 	case NVKM_RAM_TYPE_GDDR3:
367 		T(CWL) = ((cur2 & 0xff000000) >> 24) + 1;
368 		break;
369 	}
370 
371 	prevCL = (cur3 & 0x000000ff) + 1;
372 	tUNK_base = ((cur7 & 0x00ff0000) >> 16) - prevCL;
373 
374 	timing[0] = (T(RP) << 24 | T(RAS) << 16 | T(RFC) << 8 | T(RC));
375 	timing[1] = (T(WR) + 1 + T(CWL)) << 24 |
376 		    max_t(u8,T(18), 1) << 16 |
377 		    (T(WTR) + 1 + T(CWL)) << 8 |
378 		    (5 + T(CL) - T(CWL));
379 	timing[2] = (T(CWL) - 1) << 24 |
380 		    (T(RRD) << 16) |
381 		    (T(RCDWR) << 8) |
382 		    T(RCDRD);
383 	timing[3] = (cur3 & 0x00ff0000) |
384 		    (0x30 + T(CL)) << 24 |
385 		    (0xb + T(CL)) << 8 |
386 		    (T(CL) - 1);
387 	timing[4] = T(20) << 24 |
388 		    T(21) << 16 |
389 		    T(13) << 8 |
390 		    T(13);
391 	timing[5] = T(RFC) << 24 |
392 		    max_t(u8,T(RCDRD), T(RCDWR)) << 16 |
393 		    max_t(u8, (T(CWL) + 6), (T(CL) + 2)) << 8 |
394 		    T(RP);
395 	timing[6] = (0x5a + T(CL)) << 16 |
396 		    max_t(u8, 1, (6 - T(CL) + T(CWL))) << 8 |
397 		    (0x50 + T(CL) - T(CWL));
398 	timing[7] = (cur7 & 0xff000000) |
399 		    ((tUNK_base + T(CL)) << 16) |
400 		    0x202;
401 	timing[8] = cur8 & 0xffffff00;
402 
403 	switch (ram->base.type) {
404 	case NVKM_RAM_TYPE_DDR2:
405 	case NVKM_RAM_TYPE_GDDR3:
406 		tUNK_40_0 = prevCL - (cur8 & 0xff);
407 		if (tUNK_40_0 > 0)
408 			timing[8] |= T(CL);
409 		break;
410 	default:
411 		break;
412 	}
413 
414 	nvkm_debug(subdev, "Entry: 220: %08x %08x %08x %08x\n",
415 		   timing[0], timing[1], timing[2], timing[3]);
416 	nvkm_debug(subdev, "  230: %08x %08x %08x %08x\n",
417 		   timing[4], timing[5], timing[6], timing[7]);
418 	nvkm_debug(subdev, "  240: %08x\n", timing[8]);
419 	return 0;
420 }
421 #undef T
422 
423 static void
424 nvkm_sddr2_dll_reset(struct gt215_ramfuc *fuc)
425 {
426 	ram_mask(fuc, mr[0], 0x100, 0x100);
427 	ram_nsec(fuc, 1000);
428 	ram_mask(fuc, mr[0], 0x100, 0x000);
429 	ram_nsec(fuc, 1000);
430 }
431 
432 static void
433 nvkm_sddr3_dll_disable(struct gt215_ramfuc *fuc, u32 *mr)
434 {
435 	u32 mr1_old = ram_rd32(fuc, mr[1]);
436 
437 	if (!(mr1_old & 0x1)) {
438 		ram_wr32(fuc, 0x1002d4, 0x00000001);
439 		ram_wr32(fuc, mr[1], mr[1]);
440 		ram_nsec(fuc, 1000);
441 	}
442 }
443 
444 static void
445 nvkm_gddr3_dll_disable(struct gt215_ramfuc *fuc, u32 *mr)
446 {
447 	u32 mr1_old = ram_rd32(fuc, mr[1]);
448 
449 	if (!(mr1_old & 0x40)) {
450 		ram_wr32(fuc, mr[1], mr[1]);
451 		ram_nsec(fuc, 1000);
452 	}
453 }
454 
455 static void
456 gt215_ram_lock_pll(struct gt215_ramfuc *fuc, struct gt215_clk_info *mclk)
457 {
458 	ram_wr32(fuc, 0x004004, mclk->pll);
459 	ram_mask(fuc, 0x004000, 0x00000001, 0x00000001);
460 	ram_mask(fuc, 0x004000, 0x00000010, 0x00000000);
461 	ram_wait(fuc, 0x004000, 0x00020000, 0x00020000, 64000);
462 	ram_mask(fuc, 0x004000, 0x00000010, 0x00000010);
463 }
464 
465 static void
466 gt215_ram_gpio(struct gt215_ramfuc *fuc, u8 tag, u32 val)
467 {
468 	struct nvkm_gpio *gpio = fuc->base.fb->subdev.device->gpio;
469 	struct dcb_gpio_func func;
470 	u32 reg, sh, gpio_val;
471 	int ret;
472 
473 	if (nvkm_gpio_get(gpio, 0, tag, DCB_GPIO_UNUSED) != val) {
474 		ret = nvkm_gpio_find(gpio, 0, tag, DCB_GPIO_UNUSED, &func);
475 		if (ret)
476 			return;
477 
478 		reg = func.line >> 3;
479 		sh = (func.line & 0x7) << 2;
480 		gpio_val = ram_rd32(fuc, gpio[reg]);
481 		if (gpio_val & (8 << sh))
482 			val = !val;
483 		if (!(func.log[1] & 1))
484 			val = !val;
485 
486 		ram_mask(fuc, gpio[reg], (0x3 << sh), ((val | 0x2) << sh));
487 		ram_nsec(fuc, 20000);
488 	}
489 }
490 
491 static int
492 gt215_ram_calc(struct nvkm_ram *base, u32 freq)
493 {
494 	struct gt215_ram *ram = gt215_ram(base);
495 	struct gt215_ramfuc *fuc = &ram->fuc;
496 	struct gt215_ltrain *train = &ram->ltrain;
497 	struct nvkm_subdev *subdev = &ram->base.fb->subdev;
498 	struct nvkm_device *device = subdev->device;
499 	struct nvkm_bios *bios = device->bios;
500 	struct gt215_clk_info mclk;
501 	struct nvkm_ram_data *next;
502 	u8  ver, hdr, cnt, len, strap;
503 	u32 data;
504 	u32 r004018, r100760, r100da0, r111100, ctrl;
505 	u32 unk714, unk718, unk71c;
506 	int ret, i;
507 	u32 timing[9];
508 	bool pll2pll;
509 
510 	next = &ram->base.target;
511 	next->freq = freq;
512 	ram->base.next = next;
513 
514 	if (ram->ltrain.state == NVA3_TRAIN_ONCE)
515 		gt215_link_train(ram);
516 
517 	/* lookup memory config data relevant to the target frequency */
518 	data = nvbios_rammapEm(bios, freq / 1000, &ver, &hdr, &cnt, &len,
519 			       &next->bios);
520 	if (!data || ver != 0x10 || hdr < 0x05) {
521 		nvkm_error(subdev, "invalid/missing rammap entry\n");
522 		return -EINVAL;
523 	}
524 
525 	/* locate specific data set for the attached memory */
526 	strap = nvbios_ramcfg_index(subdev);
527 	if (strap >= cnt) {
528 		nvkm_error(subdev, "invalid ramcfg strap\n");
529 		return -EINVAL;
530 	}
531 
532 	data = nvbios_rammapSp(bios, data, ver, hdr, cnt, len, strap,
533 			       &ver, &hdr, &next->bios);
534 	if (!data || ver != 0x10 || hdr < 0x09) {
535 		nvkm_error(subdev, "invalid/missing ramcfg entry\n");
536 		return -EINVAL;
537 	}
538 
539 	/* lookup memory timings, if bios says they're present */
540 	if (next->bios.ramcfg_timing != 0xff) {
541 		data = nvbios_timingEp(bios, next->bios.ramcfg_timing,
542 				       &ver, &hdr, &cnt, &len,
543 				       &next->bios);
544 		if (!data || ver != 0x10 || hdr < 0x17) {
545 			nvkm_error(subdev, "invalid/missing timing entry\n");
546 			return -EINVAL;
547 		}
548 	}
549 
550 	ret = gt215_pll_info(device->clk, 0x12, 0x4000, freq, &mclk);
551 	if (ret < 0) {
552 		nvkm_error(subdev, "failed mclk calculation\n");
553 		return ret;
554 	}
555 
556 	gt215_ram_timing_calc(ram, timing);
557 
558 	ret = ram_init(fuc, ram->base.fb);
559 	if (ret)
560 		return ret;
561 
562 	/* Determine ram-specific MR values */
563 	ram->base.mr[0] = ram_rd32(fuc, mr[0]);
564 	ram->base.mr[1] = ram_rd32(fuc, mr[1]);
565 	ram->base.mr[2] = ram_rd32(fuc, mr[2]);
566 
567 	switch (ram->base.type) {
568 	case NVKM_RAM_TYPE_DDR2:
569 		ret = nvkm_sddr2_calc(&ram->base);
570 		break;
571 	case NVKM_RAM_TYPE_DDR3:
572 		ret = nvkm_sddr3_calc(&ram->base);
573 		break;
574 	case NVKM_RAM_TYPE_GDDR3:
575 		ret = nvkm_gddr3_calc(&ram->base);
576 		break;
577 	default:
578 		ret = -ENOSYS;
579 		break;
580 	}
581 
582 	if (ret)
583 		return ret;
584 
585 	/* XXX: 750MHz seems rather arbitrary */
586 	if (freq <= 750000) {
587 		r004018 = 0x10000000;
588 		r100760 = 0x22222222;
589 		r100da0 = 0x00000010;
590 	} else {
591 		r004018 = 0x00000000;
592 		r100760 = 0x00000000;
593 		r100da0 = 0x00000000;
594 	}
595 
596 	if (!next->bios.ramcfg_DLLoff)
597 		r004018 |= 0x00004000;
598 
599 	/* pll2pll requires to switch to a safe clock first */
600 	ctrl = ram_rd32(fuc, 0x004000);
601 	pll2pll = (!(ctrl & 0x00000008)) && mclk.pll;
602 
603 	/* Pre, NVIDIA does this outside the script */
604 	if (next->bios.ramcfg_10_02_10) {
605 		ram_mask(fuc, 0x111104, 0x00000600, 0x00000000);
606 	} else {
607 		ram_mask(fuc, 0x111100, 0x40000000, 0x40000000);
608 		ram_mask(fuc, 0x111104, 0x00000180, 0x00000000);
609 	}
610 	/* Always disable this bit during reclock */
611 	ram_mask(fuc, 0x100200, 0x00000800, 0x00000000);
612 
613 	/* If switching from non-pll to pll, lock before disabling FB */
614 	if (mclk.pll && !pll2pll) {
615 		ram_mask(fuc, 0x004128, 0x003f3141, mclk.clk | 0x00000101);
616 		gt215_ram_lock_pll(fuc, &mclk);
617 	}
618 
619 	/* Start with disabling some CRTCs and PFIFO? */
620 	ram_wait_vblank(fuc);
621 	ram_wr32(fuc, 0x611200, 0x3300);
622 	ram_mask(fuc, 0x002504, 0x1, 0x1);
623 	ram_nsec(fuc, 10000);
624 	ram_wait(fuc, 0x002504, 0x10, 0x10, 20000); /* XXX: or longer? */
625 	ram_block(fuc);
626 	ram_nsec(fuc, 2000);
627 
628 	if (!next->bios.ramcfg_10_02_10) {
629 		if (ram->base.type == NVKM_RAM_TYPE_GDDR3)
630 			ram_mask(fuc, 0x111100, 0x04020000, 0x00020000);
631 		else
632 			ram_mask(fuc, 0x111100, 0x04020000, 0x04020000);
633 	}
634 
635 	/* If we're disabling the DLL, do it now */
636 	switch (next->bios.ramcfg_DLLoff * ram->base.type) {
637 	case NVKM_RAM_TYPE_DDR3:
638 		nvkm_sddr3_dll_disable(fuc, ram->base.mr);
639 		break;
640 	case NVKM_RAM_TYPE_GDDR3:
641 		nvkm_gddr3_dll_disable(fuc, ram->base.mr);
642 		break;
643 	}
644 
645 	if (next->bios.timing_10_ODT)
646 		gt215_ram_gpio(fuc, 0x2e, 1);
647 
648 	/* Brace RAM for impact */
649 	ram_wr32(fuc, 0x1002d4, 0x00000001);
650 	ram_wr32(fuc, 0x1002d0, 0x00000001);
651 	ram_wr32(fuc, 0x1002d0, 0x00000001);
652 	ram_wr32(fuc, 0x100210, 0x00000000);
653 	ram_wr32(fuc, 0x1002dc, 0x00000001);
654 	ram_nsec(fuc, 2000);
655 
656 	if (device->chipset == 0xa3 && freq <= 500000)
657 		ram_mask(fuc, 0x100700, 0x00000006, 0x00000006);
658 
659 	/* Fiddle with clocks */
660 	/* There's 4 scenario's
661 	 * pll->pll: first switch to a 324MHz clock, set up new PLL, switch
662 	 * clk->pll: Set up new PLL, switch
663 	 * pll->clk: Set up clock, switch
664 	 * clk->clk: Overwrite ctrl and other bits, switch */
665 
666 	/* Switch to regular clock - 324MHz */
667 	if (pll2pll) {
668 		ram_mask(fuc, 0x004000, 0x00000004, 0x00000004);
669 		ram_mask(fuc, 0x004168, 0x003f3141, 0x00083101);
670 		ram_mask(fuc, 0x004000, 0x00000008, 0x00000008);
671 		ram_mask(fuc, 0x1110e0, 0x00088000, 0x00088000);
672 		ram_wr32(fuc, 0x004018, 0x00001000);
673 		gt215_ram_lock_pll(fuc, &mclk);
674 	}
675 
676 	if (mclk.pll) {
677 		ram_mask(fuc, 0x004000, 0x00000105, 0x00000105);
678 		ram_wr32(fuc, 0x004018, 0x00001000 | r004018);
679 		ram_wr32(fuc, 0x100da0, r100da0);
680 	} else {
681 		ram_mask(fuc, 0x004168, 0x003f3141, mclk.clk | 0x00000101);
682 		ram_mask(fuc, 0x004000, 0x00000108, 0x00000008);
683 		ram_mask(fuc, 0x1110e0, 0x00088000, 0x00088000);
684 		ram_wr32(fuc, 0x004018, 0x00009000 | r004018);
685 		ram_wr32(fuc, 0x100da0, r100da0);
686 	}
687 	ram_nsec(fuc, 20000);
688 
689 	if (next->bios.rammap_10_04_08) {
690 		ram_wr32(fuc, 0x1005a0, next->bios.ramcfg_10_06 << 16 |
691 					next->bios.ramcfg_10_05 << 8 |
692 					next->bios.ramcfg_10_05);
693 		ram_wr32(fuc, 0x1005a4, next->bios.ramcfg_10_08 << 8 |
694 					next->bios.ramcfg_10_07);
695 		ram_wr32(fuc, 0x10f804, next->bios.ramcfg_10_09_f0 << 20 |
696 					next->bios.ramcfg_10_03_0f << 16 |
697 					next->bios.ramcfg_10_09_0f |
698 					0x80000000);
699 		ram_mask(fuc, 0x10053c, 0x00001000, 0x00000000);
700 	} else {
701 		if (train->state == NVA3_TRAIN_DONE) {
702 			ram_wr32(fuc, 0x100080, 0x1020);
703 			ram_mask(fuc, 0x111400, 0xffffffff, train->r_111400);
704 			ram_mask(fuc, 0x1111e0, 0xffffffff, train->r_1111e0);
705 			ram_mask(fuc, 0x100720, 0xffffffff, train->r_100720);
706 		}
707 		ram_mask(fuc, 0x10053c, 0x00001000, 0x00001000);
708 		ram_mask(fuc, 0x10f804, 0x80000000, 0x00000000);
709 		ram_mask(fuc, 0x100760, 0x22222222, r100760);
710 		ram_mask(fuc, 0x1007a0, 0x22222222, r100760);
711 		ram_mask(fuc, 0x1007e0, 0x22222222, r100760);
712 	}
713 
714 	if (device->chipset == 0xa3 && freq > 500000) {
715 		ram_mask(fuc, 0x100700, 0x00000006, 0x00000000);
716 	}
717 
718 	/* Final switch */
719 	if (mclk.pll) {
720 		ram_mask(fuc, 0x1110e0, 0x00088000, 0x00011000);
721 		ram_mask(fuc, 0x004000, 0x00000008, 0x00000000);
722 	}
723 
724 	ram_wr32(fuc, 0x1002dc, 0x00000000);
725 	ram_wr32(fuc, 0x1002d4, 0x00000001);
726 	ram_wr32(fuc, 0x100210, 0x80000000);
727 	ram_nsec(fuc, 2000);
728 
729 	/* Set RAM MR parameters and timings */
730 	for (i = 2; i >= 0; i--) {
731 		if (ram_rd32(fuc, mr[i]) != ram->base.mr[i]) {
732 			ram_wr32(fuc, mr[i], ram->base.mr[i]);
733 			ram_nsec(fuc, 1000);
734 		}
735 	}
736 
737 	ram_wr32(fuc, 0x100220[3], timing[3]);
738 	ram_wr32(fuc, 0x100220[1], timing[1]);
739 	ram_wr32(fuc, 0x100220[6], timing[6]);
740 	ram_wr32(fuc, 0x100220[7], timing[7]);
741 	ram_wr32(fuc, 0x100220[2], timing[2]);
742 	ram_wr32(fuc, 0x100220[4], timing[4]);
743 	ram_wr32(fuc, 0x100220[5], timing[5]);
744 	ram_wr32(fuc, 0x100220[0], timing[0]);
745 	ram_wr32(fuc, 0x100220[8], timing[8]);
746 
747 	/* Misc */
748 	ram_mask(fuc, 0x100200, 0x00001000, !next->bios.ramcfg_10_02_08 << 12);
749 
750 	/* XXX: A lot of "chipset"/"ram type" specific stuff...? */
751 	unk714  = ram_rd32(fuc, 0x100714) & ~0xf0000130;
752 	unk718  = ram_rd32(fuc, 0x100718) & ~0x00000100;
753 	unk71c  = ram_rd32(fuc, 0x10071c) & ~0x00000100;
754 	r111100 = ram_rd32(fuc, 0x111100) & ~0x3a800000;
755 
756 	if (next->bios.ramcfg_10_02_04) {
757 		switch (ram->base.type) {
758 		case NVKM_RAM_TYPE_DDR3:
759 			if (device->chipset != 0xa8)
760 				r111100 |= 0x00000004;
761 			/* no break */
762 		case NVKM_RAM_TYPE_DDR2:
763 			r111100 |= 0x08000000;
764 			break;
765 		default:
766 			break;
767 		}
768 	} else {
769 		switch (ram->base.type) {
770 		case NVKM_RAM_TYPE_DDR2:
771 			r111100 |= 0x1a800000;
772 			unk714  |= 0x00000010;
773 			break;
774 		case NVKM_RAM_TYPE_DDR3:
775 			if (device->chipset == 0xa8) {
776 				r111100 |=  0x08000000;
777 			} else {
778 				r111100 &= ~0x00000004;
779 				r111100 |=  0x12800000;
780 			}
781 			unk714  |= 0x00000010;
782 			break;
783 		case NVKM_RAM_TYPE_GDDR3:
784 			r111100 |= 0x30000000;
785 			unk714  |= 0x00000020;
786 			break;
787 		default:
788 			break;
789 		}
790 	}
791 
792 	unk714 |= (next->bios.ramcfg_10_04_01) << 8;
793 
794 	if (next->bios.ramcfg_10_02_20)
795 		unk714 |= 0xf0000000;
796 	if (next->bios.ramcfg_10_02_02)
797 		unk718 |= 0x00000100;
798 	if (next->bios.ramcfg_10_02_01)
799 		unk71c |= 0x00000100;
800 	if (next->bios.timing_10_24 != 0xff) {
801 		unk718 &= ~0xf0000000;
802 		unk718 |= next->bios.timing_10_24 << 28;
803 	}
804 	if (next->bios.ramcfg_10_02_10)
805 		r111100 &= ~0x04020000;
806 
807 	ram_mask(fuc, 0x100714, 0xffffffff, unk714);
808 	ram_mask(fuc, 0x10071c, 0xffffffff, unk71c);
809 	ram_mask(fuc, 0x100718, 0xffffffff, unk718);
810 	ram_mask(fuc, 0x111100, 0xffffffff, r111100);
811 
812 	if (!next->bios.timing_10_ODT)
813 		gt215_ram_gpio(fuc, 0x2e, 0);
814 
815 	/* Reset DLL */
816 	if (!next->bios.ramcfg_DLLoff)
817 		nvkm_sddr2_dll_reset(fuc);
818 
819 	if (ram->base.type == NVKM_RAM_TYPE_GDDR3) {
820 		ram_nsec(fuc, 31000);
821 	} else {
822 		ram_nsec(fuc, 14000);
823 	}
824 
825 	if (ram->base.type == NVKM_RAM_TYPE_DDR3) {
826 		ram_wr32(fuc, 0x100264, 0x1);
827 		ram_nsec(fuc, 2000);
828 	}
829 
830 	ram_nuke(fuc, 0x100700);
831 	ram_mask(fuc, 0x100700, 0x01000000, 0x01000000);
832 	ram_mask(fuc, 0x100700, 0x01000000, 0x00000000);
833 
834 	/* Re-enable FB */
835 	ram_unblock(fuc);
836 	ram_wr32(fuc, 0x611200, 0x3330);
837 
838 	/* Post fiddlings */
839 	if (next->bios.rammap_10_04_02)
840 		ram_mask(fuc, 0x100200, 0x00000800, 0x00000800);
841 	if (next->bios.ramcfg_10_02_10) {
842 		ram_mask(fuc, 0x111104, 0x00000180, 0x00000180);
843 		ram_mask(fuc, 0x111100, 0x40000000, 0x00000000);
844 	} else {
845 		ram_mask(fuc, 0x111104, 0x00000600, 0x00000600);
846 	}
847 
848 	if (mclk.pll) {
849 		ram_mask(fuc, 0x004168, 0x00000001, 0x00000000);
850 		ram_mask(fuc, 0x004168, 0x00000100, 0x00000000);
851 	} else {
852 		ram_mask(fuc, 0x004000, 0x00000001, 0x00000000);
853 		ram_mask(fuc, 0x004128, 0x00000001, 0x00000000);
854 		ram_mask(fuc, 0x004128, 0x00000100, 0x00000000);
855 	}
856 
857 	return 0;
858 }
859 
860 static int
861 gt215_ram_prog(struct nvkm_ram *base)
862 {
863 	struct gt215_ram *ram = gt215_ram(base);
864 	struct gt215_ramfuc *fuc = &ram->fuc;
865 	struct nvkm_device *device = ram->base.fb->subdev.device;
866 	bool exec = nvkm_boolopt(device->cfgopt, "NvMemExec", true);
867 
868 	if (exec) {
869 		nvkm_mask(device, 0x001534, 0x2, 0x2);
870 
871 		ram_exec(fuc, true);
872 
873 		/* Post-processing, avoids flicker */
874 		nvkm_mask(device, 0x002504, 0x1, 0x0);
875 		nvkm_mask(device, 0x001534, 0x2, 0x0);
876 
877 		nvkm_mask(device, 0x616308, 0x10, 0x10);
878 		nvkm_mask(device, 0x616b08, 0x10, 0x10);
879 	} else {
880 		ram_exec(fuc, false);
881 	}
882 	return 0;
883 }
884 
885 static void
886 gt215_ram_tidy(struct nvkm_ram *base)
887 {
888 	struct gt215_ram *ram = gt215_ram(base);
889 	ram_exec(&ram->fuc, false);
890 }
891 
892 static int
893 gt215_ram_init(struct nvkm_ram *base)
894 {
895 	struct gt215_ram *ram = gt215_ram(base);
896 	gt215_link_train_init(ram);
897 	return 0;
898 }
899 
900 static void *
901 gt215_ram_dtor(struct nvkm_ram *base)
902 {
903 	struct gt215_ram *ram = gt215_ram(base);
904 	gt215_link_train_fini(ram);
905 	return ram;
906 }
907 
908 static const struct nvkm_ram_func
909 gt215_ram_func = {
910 	.dtor = gt215_ram_dtor,
911 	.init = gt215_ram_init,
912 	.get = nv50_ram_get,
913 	.put = nv50_ram_put,
914 	.calc = gt215_ram_calc,
915 	.prog = gt215_ram_prog,
916 	.tidy = gt215_ram_tidy,
917 };
918 
919 int
920 gt215_ram_new(struct nvkm_fb *fb, struct nvkm_ram **pram)
921 {
922 	struct gt215_ram *ram;
923 	int ret, i;
924 
925 	if (!(ram = kzalloc(sizeof(*ram), GFP_KERNEL)))
926 		return -ENOMEM;
927 	*pram = &ram->base;
928 
929 	ret = nv50_ram_ctor(&gt215_ram_func, fb, &ram->base);
930 	if (ret)
931 		return ret;
932 
933 	ram->fuc.r_0x001610 = ramfuc_reg(0x001610);
934 	ram->fuc.r_0x001700 = ramfuc_reg(0x001700);
935 	ram->fuc.r_0x002504 = ramfuc_reg(0x002504);
936 	ram->fuc.r_0x004000 = ramfuc_reg(0x004000);
937 	ram->fuc.r_0x004004 = ramfuc_reg(0x004004);
938 	ram->fuc.r_0x004018 = ramfuc_reg(0x004018);
939 	ram->fuc.r_0x004128 = ramfuc_reg(0x004128);
940 	ram->fuc.r_0x004168 = ramfuc_reg(0x004168);
941 	ram->fuc.r_0x100080 = ramfuc_reg(0x100080);
942 	ram->fuc.r_0x100200 = ramfuc_reg(0x100200);
943 	ram->fuc.r_0x100210 = ramfuc_reg(0x100210);
944 	for (i = 0; i < 9; i++)
945 		ram->fuc.r_0x100220[i] = ramfuc_reg(0x100220 + (i * 4));
946 	ram->fuc.r_0x100264 = ramfuc_reg(0x100264);
947 	ram->fuc.r_0x1002d0 = ramfuc_reg(0x1002d0);
948 	ram->fuc.r_0x1002d4 = ramfuc_reg(0x1002d4);
949 	ram->fuc.r_0x1002dc = ramfuc_reg(0x1002dc);
950 	ram->fuc.r_0x10053c = ramfuc_reg(0x10053c);
951 	ram->fuc.r_0x1005a0 = ramfuc_reg(0x1005a0);
952 	ram->fuc.r_0x1005a4 = ramfuc_reg(0x1005a4);
953 	ram->fuc.r_0x100700 = ramfuc_reg(0x100700);
954 	ram->fuc.r_0x100714 = ramfuc_reg(0x100714);
955 	ram->fuc.r_0x100718 = ramfuc_reg(0x100718);
956 	ram->fuc.r_0x10071c = ramfuc_reg(0x10071c);
957 	ram->fuc.r_0x100720 = ramfuc_reg(0x100720);
958 	ram->fuc.r_0x100760 = ramfuc_stride(0x100760, 4, ram->base.part_mask);
959 	ram->fuc.r_0x1007a0 = ramfuc_stride(0x1007a0, 4, ram->base.part_mask);
960 	ram->fuc.r_0x1007e0 = ramfuc_stride(0x1007e0, 4, ram->base.part_mask);
961 	ram->fuc.r_0x100da0 = ramfuc_stride(0x100da0, 4, ram->base.part_mask);
962 	ram->fuc.r_0x10f804 = ramfuc_reg(0x10f804);
963 	ram->fuc.r_0x1110e0 = ramfuc_stride(0x1110e0, 4, ram->base.part_mask);
964 	ram->fuc.r_0x111100 = ramfuc_reg(0x111100);
965 	ram->fuc.r_0x111104 = ramfuc_reg(0x111104);
966 	ram->fuc.r_0x1111e0 = ramfuc_reg(0x1111e0);
967 	ram->fuc.r_0x111400 = ramfuc_reg(0x111400);
968 	ram->fuc.r_0x611200 = ramfuc_reg(0x611200);
969 
970 	if (ram->base.ranks > 1) {
971 		ram->fuc.r_mr[0] = ramfuc_reg2(0x1002c0, 0x1002c8);
972 		ram->fuc.r_mr[1] = ramfuc_reg2(0x1002c4, 0x1002cc);
973 		ram->fuc.r_mr[2] = ramfuc_reg2(0x1002e0, 0x1002e8);
974 		ram->fuc.r_mr[3] = ramfuc_reg2(0x1002e4, 0x1002ec);
975 	} else {
976 		ram->fuc.r_mr[0] = ramfuc_reg(0x1002c0);
977 		ram->fuc.r_mr[1] = ramfuc_reg(0x1002c4);
978 		ram->fuc.r_mr[2] = ramfuc_reg(0x1002e0);
979 		ram->fuc.r_mr[3] = ramfuc_reg(0x1002e4);
980 	}
981 	ram->fuc.r_gpio[0] = ramfuc_reg(0x00e104);
982 	ram->fuc.r_gpio[1] = ramfuc_reg(0x00e108);
983 	ram->fuc.r_gpio[2] = ramfuc_reg(0x00e120);
984 	ram->fuc.r_gpio[3] = ramfuc_reg(0x00e124);
985 
986 	return 0;
987 }
988