blob: 3dd00fb2b6217b028423bb62d387125bddb64865 [file] [log] [blame]
Damien Zammit4b513a62015-08-20 00:37:05 +10001/*
2 * This file is part of the coreboot project.
3 *
4 * Copyright (C) 2015 Damien Zammit <damien@zamaudio.com>
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License as
8 * published by the Free Software Foundation; either version 2 of
9 * the License, or (at your option) any later version.
10 *
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
15 */
16
17#include <stdint.h>
18#include <arch/io.h>
19#include <arch/cpu.h>
20#include <console/console.h>
21#include <commonlib/helpers.h>
22#include <delay.h>
Martin Rothcbe38922016-01-05 19:40:41 -070023#include "iomap.h"
24#include "x4x.h"
Damien Zammit4b513a62015-08-20 00:37:05 +100025
Damien Zammit9fb08f52016-01-22 18:56:23 +110026#define ME_UMA_SIZEMB 0
27
Damien Zammit4b513a62015-08-20 00:37:05 +100028static inline void barrier(void)
29{
30 asm volatile("mfence":::);
31}
32
33static u32 fsb2mhz(u32 speed)
34{
35 return (speed * 267) + 800;
36}
37
38static u32 ddr2mhz(u32 speed)
39{
40 static const u16 mhz[] = { 0, 0, 667, 800, 1067, 1333 };
41
42 if (speed >= ARRAY_SIZE(mhz))
43 return 0;
44
45 return mhz[speed];
46}
47
Damien Zammitd63115d2016-01-22 19:11:44 +110048/* Find MSB bitfield location using bit scan reverse instruction */
49static u8 msbpos(u32 val)
Damien Zammit4b513a62015-08-20 00:37:05 +100050{
Damien Zammitd63115d2016-01-22 19:11:44 +110051 u32 pos;
52
53 if (val == 0) {
54 printk(BIOS_WARNING, "WARNING: Input to BSR is zero\n");
55 return 0;
Damien Zammit4b513a62015-08-20 00:37:05 +100056 }
Damien Zammitd63115d2016-01-22 19:11:44 +110057
58 asm ("bsrl %1, %0"
59 :"=r"(pos)
60 :"r"(val)
61 );
62
63 return (u8)(pos & 0xff);
Damien Zammit4b513a62015-08-20 00:37:05 +100064}
65
66static void sdram_detect_smallest_params2(struct sysinfo *s)
67{
68 u16 mult[6] = {
69 5000, // 400
70 3750, // 533
71 3000, // 667
72 2500, // 800
73 1875, // 1066
74 1500, // 1333
75 };
76
77 u8 i;
78 u32 tmp;
79 u32 maxtras = 0;
80 u32 maxtrp = 0;
81 u32 maxtrcd = 0;
82 u32 maxtwr = 0;
83 u32 maxtrfc = 0;
84 u32 maxtwtr = 0;
85 u32 maxtrrd = 0;
86 u32 maxtrtp = 0;
87
88 FOR_EACH_POPULATED_DIMM(s->dimms, i) {
89 maxtras = MAX(maxtras, s->dimms[i].spd_data[30] * 1000);
90 maxtrp = MAX(maxtrp, (s->dimms[i].spd_data[27] * 1000) >> 2);
91 maxtrcd = MAX(maxtrcd, (s->dimms[i].spd_data[29] * 1000) >> 2);
92 maxtwr = MAX(maxtwr, (s->dimms[i].spd_data[36] * 1000) >> 2);
93 maxtrfc = MAX(maxtrfc, s->dimms[i].spd_data[42] * 1000 +
94 (s->dimms[i].spd_data[40] & 0xf));
95 maxtwtr = MAX(maxtwtr, (s->dimms[i].spd_data[37] * 1000) >> 2);
96 maxtrrd = MAX(maxtrrd, (s->dimms[i].spd_data[28] * 1000) >> 2);
97 maxtrtp = MAX(maxtrtp, (s->dimms[i].spd_data[38] * 1000) >> 2);
98 }
99 for (i = 9; i < 24; i++) {
100 tmp = mult[s->selected_timings.mem_clk] * i;
101 if (tmp >= maxtras) {
102 s->selected_timings.tRAS = i;
103 break;
104 }
105 }
106 for (i = 3; i < 10; i++) {
107 tmp = mult[s->selected_timings.mem_clk] * i;
108 if (tmp >= maxtrp) {
109 s->selected_timings.tRP = i;
110 break;
111 }
112 }
113 for (i = 3; i < 10; i++) {
114 tmp = mult[s->selected_timings.mem_clk] * i;
115 if (tmp >= maxtrcd) {
116 s->selected_timings.tRCD = i;
117 break;
118 }
119 }
120 for (i = 3; i < 15; i++) {
121 tmp = mult[s->selected_timings.mem_clk] * i;
122 if (tmp >= maxtwr) {
123 s->selected_timings.tWR = i;
124 break;
125 }
126 }
127 for (i = 15; i < 78; i++) {
128 tmp = mult[s->selected_timings.mem_clk] * i;
129 if (tmp >= maxtrfc) {
130 s->selected_timings.tRFC = ((i + 16) & 0xfe) - 15;
131 break;
132 }
133 }
134 for (i = 4; i < 15; i++) {
135 tmp = mult[s->selected_timings.mem_clk] * i;
136 if (tmp >= maxtwtr) {
137 s->selected_timings.tWTR = i;
138 break;
139 }
140 }
141 for (i = 2; i < 15; i++) {
142 tmp = mult[s->selected_timings.mem_clk] * i;
143 if (tmp >= maxtrrd) {
144 s->selected_timings.tRRD = i;
145 break;
146 }
147 }
148 for (i = 4; i < 15; i++) {
149 tmp = mult[s->selected_timings.mem_clk] * i;
150 if (tmp >= maxtrtp) {
151 s->selected_timings.tRTP = i;
152 break;
153 }
154 }
155
156 s->selected_timings.fsb_clk = s->max_fsb;
157
158 printk(BIOS_DEBUG, "Selected timings:\n");
159 printk(BIOS_DEBUG, "\tFSB: %dMHz\n", fsb2mhz(s->selected_timings.fsb_clk));
160 printk(BIOS_DEBUG, "\tDDR: %dMHz\n", ddr2mhz(s->selected_timings.mem_clk));
161
162 printk(BIOS_DEBUG, "\tCAS: %d\n", s->selected_timings.CAS);
163 printk(BIOS_DEBUG, "\ttRAS: %d\n", s->selected_timings.tRAS);
164 printk(BIOS_DEBUG, "\ttRP: %d\n", s->selected_timings.tRP);
165 printk(BIOS_DEBUG, "\ttRCD: %d\n", s->selected_timings.tRCD);
166 printk(BIOS_DEBUG, "\ttWR: %d\n", s->selected_timings.tWR);
167 printk(BIOS_DEBUG, "\ttRFC: %d\n", s->selected_timings.tRFC);
168 printk(BIOS_DEBUG, "\ttWTR: %d\n", s->selected_timings.tWTR);
169 printk(BIOS_DEBUG, "\ttRRD: %d\n", s->selected_timings.tRRD);
170 printk(BIOS_DEBUG, "\ttRTP: %d\n", s->selected_timings.tRTP);
171}
172
173static void clkcross_ddr2(struct sysinfo *s)
174{
175 u8 i, j;
176 MCHBAR16(0xc1c) = MCHBAR16(0xc1c) | (1 << 15);
177
178#define TAB_M667F800 {0x1f1f1f1f, 0x1a07070b, 0x0, 0x10000000, 0x20010208, \
179 0x04080000, 0x10010002, 0x0, 0x0, 0x02000000, \
180 0x04000100, 0x08000000, 0x10200204}
181#define TAB_M800F800 {0xffffffff, 0x05030305, 0x0000ffff, 0x0, 0x08010204, \
182 0x0, 0x08010204, 0x0, 0x0, 0x0, 0x00020001, 0x0, 0x04080102}
183#define TAB_M667F1067 {0x6d5b1f1f, 0x0f0f0f0f, 0x0, 0x20000000, 0x80020410, \
184 0x02040008, 0x10000100, 0x0, 0x0, 0x04000000, \
185 0x08000102, 0x20000000, 0x40010208}
186#define TAB_M800F1067 {0x07070707, 0x06030303, 0x0, 0x0, 0x08010200, \
187 0x0, 0x04000102, 0x0, 0x0, 0x0, 0x00020001, \
188 0x0, 0x02040801}
189#define TAB_M1067F1067 {0xffffffff, 0x05030305, 0x0000ffff, 0x0, 0x04080102, \
190 0x0, 0x08010204, 0x0, 0x0, 0x0, 0x00020001, \
191 0x0, 0x02040801}
192#define TAB_M667F1333 {0x05050303, 0xffffffff, 0xffff0000, 0x0, 0x08020000, \
193 0x0, 0x00020001, 0x0, 0x0, 0x0, 0x08010204, \
194 0x0, 0x04010000}
195#define TAB_M800F1333 {0x0d0b0707, 0x3e1f1f2f, 0x01010000, 0x0, 0x10020400, \
196 0x02000000, 0x00040100, 0x0, 0x0, 0x04080000, \
197 0x00100102, 0x0, 0x08100200}
198#define TAB_M1067F1333 {0x0f0f0f0f, 0x5b1f1f6d, 0x0, 0x0, 0x08010204, \
199 0x04000000, 0x00080102, 0x0, 0x0, 0x02000408, \
200 0x00100001, 0x0, 0x04080102}
201#define TAB_M1333F1333 {0xffffffff, 0x05030305, 0x0000ffff, 0x0, 0x04080102, \
202 0x0, 0x04080102, 0x0, 0x0, 0x0, 0x0, 0x0, 0x02040801}
203
204 static const u32 clkxtab[6][3][13] = {
205 {{}, {}, {}}, // MEMCLK 400 N/A
206 {{}, {}, {}}, // MEMCLK 533 N/A
207 {TAB_M667F800, TAB_M667F1067, TAB_M667F1333, },
208 {TAB_M800F800, TAB_M800F1067, TAB_M800F1333, },
209 {{}, TAB_M1067F1067, TAB_M1067F1333, },
210 {{}, {}, TAB_M1333F1333, },
211 };
212
213 i = (u8)s->selected_timings.mem_clk;
214 j = (u8)s->selected_timings.fsb_clk;
215
216 MCHBAR32(0xc04) = clkxtab[i][j][0];
217 MCHBAR32(0xc50) = clkxtab[i][j][1];
218 MCHBAR32(0xc54) = clkxtab[i][j][2];
219 MCHBAR8(0xc08) = MCHBAR8(0xc08) | (1 << 7);
220 MCHBAR32(0x6d8) = clkxtab[i][j][3];
221 MCHBAR32(0x6e0) = clkxtab[i][j][3];
222 MCHBAR32(0x6dc) = clkxtab[i][j][4];
223 MCHBAR32(0x6e4) = clkxtab[i][j][4];
224 MCHBAR32(0x6e8) = clkxtab[i][j][5];
225 MCHBAR32(0x6f0) = clkxtab[i][j][5];
226 MCHBAR32(0x6ec) = clkxtab[i][j][6];
227 MCHBAR32(0x6f4) = clkxtab[i][j][6];
228 MCHBAR32(0x6f8) = clkxtab[i][j][7];
229 MCHBAR32(0x6fc) = clkxtab[i][j][8];
230 MCHBAR32(0x708) = clkxtab[i][j][11];
231 MCHBAR32(0x70c) = clkxtab[i][j][12];
232}
233
234static void checkreset_ddr2(struct sysinfo *s)
235{
236 u8 pmcon2;
237 u8 reset = 0;
238
239 pmcon2 = pci_read_config8(PCI_DEV(0, 0x1f, 0), 0xa2);
240 if (!(pmcon2 & 0x80)) {
241 pmcon2 |= 0x80;
242 pci_write_config8(PCI_DEV(0, 0x1f, 0), 0xa2, pmcon2);
243 reset = 1;
244
245 /* do magic 0xf0 thing. */
246 u8 reg8 = pci_read_config8(PCI_DEV(0, 0, 0), 0xf0);
247 pci_write_config8(PCI_DEV(0, 0, 0), 0xf0, reg8 & ~(1 << 2));
248 reg8 = pci_read_config8(PCI_DEV(0, 0, 0), 0xf0);
249 pci_write_config8(PCI_DEV(0, 0, 0), 0xf0, reg8 | (1 << 2));
250 }
251 if (reset) {
252 printk(BIOS_DEBUG, "Reset...\n");
253 outb(0xe, 0xcf9);
254 asm ("hlt");
255 }
256 pci_write_config8(PCI_DEV(0, 0x1f, 0), 0xa2, pmcon2 | 0x80);
257}
258
259static void setioclk_ddr2(struct sysinfo *s)
260{
261 MCHBAR32(0x1bc) = 0x08060402;
262 MCHBAR16(0x1c0) = MCHBAR16(0x1c0) | 0x200;
263 MCHBAR16(0x1c0) = MCHBAR16(0x1c0) | 0x100;
264 MCHBAR16(0x1c0) = MCHBAR16(0x1c0) | 0x20;
265 MCHBAR16(0x1c0) = MCHBAR16(0x1c0) & ~1;
266 switch (s->selected_timings.mem_clk) {
267 default:
268 case MEM_CLOCK_800MHz:
269 case MEM_CLOCK_1066MHz:
270 MCHBAR8(0x5d9) = (MCHBAR8(0x5d9) & ~0x2) | 0x2;
271 MCHBAR8(0x9d9) = (MCHBAR8(0x9d9) & ~0x2) | 0x2;
272 MCHBAR8(0x189) = (MCHBAR8(0x189) & ~0xf0) | 0xc0;
273 MCHBAR8(0x189) = (MCHBAR8(0x189) & ~0xf0) | 0xe0;
274 MCHBAR8(0x189) = (MCHBAR8(0x189) & ~0xf0) | 0xa0;
275 break;
276 case MEM_CLOCK_667MHz:
277 case MEM_CLOCK_1333MHz:
278 MCHBAR8(0x5d9) = MCHBAR8(0x5d9) & ~0x2;
279 MCHBAR8(0x9d9) = MCHBAR8(0x9d9) & ~0x2;
280 MCHBAR8(0x189) = (MCHBAR8(0x189) & ~0xf0) | 0x40;
281 break;
282 }
283 MCHBAR32(0x594) = MCHBAR32(0x594) | (1 << 31);
284 MCHBAR32(0x994) = MCHBAR32(0x994) | (1 << 31);
285}
286
287static void launch_ddr2(struct sysinfo *s)
288{
289 u8 i;
290 u32 launch1 = 0x58001117;
291 u32 launch2 = 0;
292 u32 launch3 = 0;
293
294 if (s->selected_timings.CAS == 5) {
295 launch2 = 0x00220201;
296 } else if ((s->selected_timings.mem_clk == MEM_CLOCK_800MHz) &&
297 (s->selected_timings.CAS == 6)) {
298 launch2 = 0x00230302;
299 } else {
300 die("Unsupported CAS & Frequency combination detected\n");
301 }
302
303 FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
304 MCHBAR32(0x400*i + 0x220) = launch1;
305 MCHBAR32(0x400*i + 0x224) = launch2;
306 MCHBAR32(0x400*i + 0x21c) = launch3;
307 MCHBAR32(0x400*i + 0x248) = MCHBAR32(0x400*i + 0x248) | (1 << 23);
308 }
309
310 MCHBAR32(0x2c0) = (MCHBAR32(0x2c0) & ~0x58000000) | 0x48000000;
311 MCHBAR32(0x2c0) = MCHBAR32(0x2c0) | 0x1e0;
312 MCHBAR32(0x2c4) = (MCHBAR32(0x2c4) & ~0xf) | 0xc;
313}
314
315static void clkset0(u8 ch, u8 setting[5])
316{
317 MCHBAR16(0x400*ch + 0x5a0) = (MCHBAR16(0x400*ch + 0x5a0) & ~0xc440) |
318 (setting[4] << 14) |
319 (setting[3] << 6) |
320 (setting[2] << 10);
321 MCHBAR8(0x400*ch + 0x581) = (MCHBAR8(0x400*ch + 0x581) & ~0x70) |
322 (setting[1] << 4);
323 MCHBAR8(0x400*ch + 0x581) = (MCHBAR8(0x400*ch + 0x581) & ~0xf) |
324 setting[0];
325}
326
327static void clkset1(u8 ch, u8 setting[5])
328{
329 MCHBAR32(0x400*ch + 0x5a0) = (MCHBAR32(0x400*ch + 0x5a0) & ~0x30880) |
330 (setting[4] << 16) |
331 (setting[3] << 7) |
332 (setting[2] << 11);
333 MCHBAR8(0x400*ch + 0x582) = (MCHBAR8(0x400*ch + 0x582) & ~0x70) |
334 (setting[1] << 4);
335 MCHBAR8(0x400*ch + 0x582) = (MCHBAR8(0x400*ch + 0x582) & ~0xf) |
336 setting[0];
337}
338
339static void ctrlset0(u8 ch, u8 setting[5])
340{
341 MCHBAR32(0x400*ch + 0x59c) = (MCHBAR32(0x400*ch + 0x59c) & ~0x3300000) |
342 (setting[4] << 24) |
343 (setting[3] << 20) |
344 (setting[2] << 21);
345 MCHBAR8(0x400*ch + 0x584) = (MCHBAR8(0x400*ch + 0x584) & ~0x70) |
346 (setting[1] << 4);
347 MCHBAR8(0x400*ch + 0x584) = (MCHBAR8(0x400*ch + 0x584) & ~0xf) |
348 setting[0];
349}
350
351static void ctrlset1(u8 ch, u8 setting[5])
352{
353 MCHBAR32(0x400*ch + 0x59c) = (MCHBAR32(0x400*ch + 0x59c) & ~0x18c00000) |
354 (setting[4] << 27) |
355 (setting[3] << 22) |
356 (setting[2] << 23);
357 MCHBAR8(0x400*ch + 0x585) = (MCHBAR8(0x400*ch + 0x585) & ~0x70) |
358 (setting[1] << 4);
359 MCHBAR8(0x400*ch + 0x585) = (MCHBAR8(0x400*ch + 0x585) & ~0xf) |
360 setting[0];
361}
362
363static void ctrlset2(u8 ch, u8 setting[5])
364{
365 MCHBAR32(0x400*ch + 0x598) = (MCHBAR32(0x400*ch + 0x598) & ~0x18c00000) |
366 (setting[4] << 14) |
367 (setting[3] << 12) |
368 (setting[2] << 13);
369 MCHBAR8(0x400*ch + 0x586) = (MCHBAR8(0x400*ch + 0x586) & ~0x70) |
370 (setting[1] << 4);
371 MCHBAR8(0x400*ch + 0x586) = (MCHBAR8(0x400*ch + 0x586) & ~0xf) |
372 setting[0];
373}
374
375static void ctrlset3(u8 ch, u8 setting[5])
376{
377 MCHBAR32(0x400*ch + 0x598) = (MCHBAR32(0x400*ch + 0x598) & ~0x18c00000) |
378 (setting[4] << 10) |
379 (setting[3] << 8) |
380 (setting[2] << 9);
381 MCHBAR8(0x400*ch + 0x587) = (MCHBAR8(0x400*ch + 0x587) & ~0x70) |
382 (setting[1] << 4);
383 MCHBAR8(0x400*ch + 0x587) = (MCHBAR8(0x400*ch + 0x587) & ~0xf) |
384 setting[0];
385}
386
387static void cmdset(u8 ch, u8 setting[5])
388{
389 MCHBAR8(0x400*ch + 0x598) = (MCHBAR8(0x400*ch + 0x598) & ~0x30) |
390 (setting[4] << 4);
391 MCHBAR8(0x400*ch + 0x594) = (MCHBAR8(0x400*ch + 0x594) & ~0x60) |
392 (setting[3] << 5) |
393 (setting[2] << 6);
394 MCHBAR8(0x400*ch + 0x580) = (MCHBAR8(0x400*ch + 0x580) & ~0x70) |
395 (setting[1] << 4);
396 MCHBAR8(0x400*ch + 0x580) = (MCHBAR8(0x400*ch + 0x580) & ~0xf) |
397 setting[0];
398}
399
400static void dqsset(u8 ch, u8 lane, u8 setting[5])
401{
402 MCHBAR32(0x400*ch + 0x5fc) = MCHBAR32(0x400*ch + 0x5fc) & ~(2 << (lane*4));
403
404 MCHBAR32(0x400*ch + 0x5b4) = (MCHBAR32(0x400*ch + 0x5b4) & ~(0x201 << lane)) |
405 (setting[2] << (9 + lane)) |
406 (setting[3] << lane);
407 MCHBAR32(0x400*ch + 0x5b8) = (MCHBAR32(0x400*ch + 0x5b8) & ~(0x201 << lane)) |
408 (setting[2] << (9 + lane)) |
409 (setting[3] << lane);
410 MCHBAR32(0x400*ch + 0x5bc) = (MCHBAR32(0x400*ch + 0x5bc) & ~(0x201 << lane)) |
411 (setting[2] << (9 + lane)) |
412 (setting[3] << lane);
413 MCHBAR32(0x400*ch + 0x5c0) = (MCHBAR32(0x400*ch + 0x5c0) & ~(0x201 << lane)) |
414 (setting[2] << (9 + lane)) |
415 (setting[3] << lane);
416
417 MCHBAR32(0x400*ch + 0x5c8) = (MCHBAR32(0x400*ch + 0x5c8) & ~(0x3 << (16+lane*2))) |
418 (setting[4] << (16+lane*2));
419 MCHBAR32(0x400*ch + 0x5cc) = (MCHBAR32(0x400*ch + 0x5cc) & ~(0x3 << (16+lane*2))) |
420 (setting[4] << (16+lane*2));
421 MCHBAR32(0x400*ch + 0x5d0) = (MCHBAR32(0x400*ch + 0x5d0) & ~(0x3 << (16+lane*2))) |
422 (setting[4] << (16+lane*2));
423 MCHBAR32(0x400*ch + 0x5d4) = (MCHBAR32(0x400*ch + 0x5d4) & ~(0x3 << (16+lane*2))) |
424 (setting[4] << (16+lane*2));
425
426 MCHBAR8(0x400*ch + 0x520 + lane*4) = (MCHBAR8(0x400*ch + 0x520 + lane*4) & ~0x70) |
427 (setting[1] << 4);
428 MCHBAR8(0x400*ch + 0x520 + lane*4) = (MCHBAR8(0x400*ch + 0x520 + lane*4) & ~0xf) |
429 setting[0];
430 MCHBAR8(0x400*ch + 0x521 + lane*4) = (MCHBAR8(0x400*ch + 0x521 + lane*4) & ~0x70) |
431 (setting[1] << 4);
432 MCHBAR8(0x400*ch + 0x521 + lane*4) = (MCHBAR8(0x400*ch + 0x521 + lane*4) & ~0xf) |
433 setting[0];
434 MCHBAR8(0x400*ch + 0x522 + lane*4) = (MCHBAR8(0x400*ch + 0x522 + lane*4) & ~0x70) |
435 (setting[1] << 4);
436 MCHBAR8(0x400*ch + 0x522 + lane*4) = (MCHBAR8(0x400*ch + 0x522 + lane*4) & ~0xf) |
437 setting[0];
438 MCHBAR8(0x400*ch + 0x523 + lane*4) = (MCHBAR8(0x400*ch + 0x523 + lane*4) & ~0x70) |
439 (setting[1] << 4);
440 MCHBAR8(0x400*ch + 0x523 + lane*4) = (MCHBAR8(0x400*ch + 0x523 + lane*4) & ~0xf) |
441 setting[0];
442}
443
444static void dqset(u8 ch, u8 lane, u8 setting[5])
445{
446 MCHBAR32(0x400*ch + 0x5fc) = MCHBAR32(0x400*ch + 0x5fc) & ~(1 << (lane*4));
447
448 MCHBAR32(0x400*ch + 0x5a4) = (MCHBAR32(0x400*ch + 0x5a4) & ~(0x201 << lane)) |
449 (setting[2] << (9+lane)) |
450 (setting[3] << lane);
451 MCHBAR32(0x400*ch + 0x5a8) = (MCHBAR32(0x400*ch + 0x5a8) & ~(0x201 << lane)) |
452 (setting[2] << (9+lane)) |
453 (setting[3] << lane);
454 MCHBAR32(0x400*ch + 0x5ac) = (MCHBAR32(0x400*ch + 0x5ac) & ~(0x201 << lane)) |
455 (setting[2] << (9+lane)) |
456 (setting[3] << lane);
457 MCHBAR32(0x400*ch + 0x5b0) = (MCHBAR32(0x400*ch + 0x5b0) & ~(0x201 << lane)) |
458 (setting[2] << (9+lane)) |
459 (setting[3] << lane);
460
461 MCHBAR32(0x400*ch + 0x5c8) = (MCHBAR32(0x400*ch + 0x5c8) & ~(0x3 << (lane*2))) |
462 (setting[4] << (2*lane));
463 MCHBAR32(0x400*ch + 0x5cc) = (MCHBAR32(0x400*ch + 0x5cc) & ~(0x3 << (lane*2))) |
464 (setting[4] << (2*lane));
465 MCHBAR32(0x400*ch + 0x5d0) = (MCHBAR32(0x400*ch + 0x5d0) & ~(0x3 << (lane*2))) |
466 (setting[4] << (2*lane));
467 MCHBAR32(0x400*ch + 0x5d4) = (MCHBAR32(0x400*ch + 0x5d4) & ~(0x3 << (lane*2))) |
468 (setting[4] << (2*lane));
469
470 MCHBAR8(0x400*ch + 0x500 + lane*4) = (MCHBAR8(0x400*ch + 0x500 + lane*4) & ~0x70) |
471 (setting[1] << 4);
472 MCHBAR8(0x400*ch + 0x500 + lane*4) = (MCHBAR8(0x400*ch + 0x500 + lane*4) & ~0xf) |
473 setting[0];
474 MCHBAR8(0x400*ch + 0x501 + lane*4) = (MCHBAR8(0x400*ch + 0x501 + lane*4) & ~0x70) |
475 (setting[1] << 4);
476 MCHBAR8(0x400*ch + 0x501 + lane*4) = (MCHBAR8(0x400*ch + 0x501 + lane*4) & ~0xf) |
477 setting[0];
478 MCHBAR8(0x400*ch + 0x502 + lane*4) = (MCHBAR8(0x400*ch + 0x502 + lane*4) & ~0x70) |
479 (setting[1] << 4);
480 MCHBAR8(0x400*ch + 0x502 + lane*4) = (MCHBAR8(0x400*ch + 0x502 + lane*4) & ~0xf) |
481 setting[0];
482 MCHBAR8(0x400*ch + 0x503 + lane*4) = (MCHBAR8(0x400*ch + 0x503 + lane*4) & ~0x70) |
483 (setting[1] << 4);
484 MCHBAR8(0x400*ch + 0x503 + lane*4) = (MCHBAR8(0x400*ch + 0x503 + lane*4) & ~0xf) |
485 setting[0];
486}
487
488static void timings_ddr2(struct sysinfo *s)
489{
490 u8 i;
491 u8 twl, ta1, ta2, ta3, ta4;
492 u8 reg8;
493 u8 flag1 = 0;
494 u8 flag2 = 0;
495 u16 reg16;
496 u32 reg32;
497 u16 ddr, fsb;
498 u8 trpmod = 0;
499 u8 bankmod = 1;
500 u8 pagemod = 0;
501
502 u16 fsb2ps[3] = {
503 5000, // 800
504 3750, // 1067
505 3000 // 1333
506 };
507
508 u16 ddr2ps[6] = {
509 5000, // 400
510 3750, // 533
511 3000, // 667
512 2500, // 800
513 1875, // 1067
514 1500 // 1333
515 };
516
517 u16 lut1[6] = {
518 0,
519 0,
520 2600,
521 3120,
522 4171,
523 5200
524 };
525
526 ta1 = 6;
527 ta2 = 6;
528 ta3 = 5;
529 ta4 = 8;
530
531 twl = s->selected_timings.CAS - 1;
532
533 FOR_EACH_POPULATED_DIMM(s->dimms, i) {
534 if (s->dimms[i].banks == 1) { // 8 banks
535 trpmod = 1;
536 bankmod = 0;
537 }
538 if (s->dimms[i].page_size == 2048) {
539 pagemod = 1;
540 }
541 }
542
543 FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
544 MCHBAR8(0x400*i + 0x2f6) = MCHBAR8(0x400*i + 0x2f6) | 0x3;
545 MCHBAR8(0x400*i + 0x228) = (MCHBAR8(0x400*i + 0x228) & ~0x7) | 0x2;
546 MCHBAR8(0x400*i + 0x240) = (MCHBAR8(0x400*i + 0x240) & ~0xf0) | (twl << 4);
547 MCHBAR8(0x400*i + 0x240) = (MCHBAR8(0x400*i + 0x240) & ~0xf) |
548 s->selected_timings.CAS;
549 MCHBAR16(0x400*i + 0x265) = (MCHBAR16(0x400*i + 0x265) & ~0x3f00) |
550 ((s->selected_timings.CAS + 9) << 8);
551
552 reg16 = (s->selected_timings.tRAS << 11) |
553 ((twl + 4 + s->selected_timings.tWR) << 6) |
554 ((2 + MAX(s->selected_timings.tRTP, 2)) << 2) | 1;
555 MCHBAR16(0x400*i + 0x250) = reg16;
556
557 reg32 = (bankmod << 21) |
558 (s->selected_timings.tRRD << 17) |
559 (s->selected_timings.tRP << 13) |
560 ((s->selected_timings.tRP + trpmod) << 9) |
561 s->selected_timings.tRFC;
562 reg8 = (MCHBAR8(0x400*i + 0x26f) >> 1) & 1;
563 if (bankmod) {
564 switch (s->selected_timings.mem_clk) {
565 default:
566 case MEM_CLOCK_667MHz:
567 if (reg8) {
568 if (pagemod) {
569 reg32 |= 16 << 22;
570 } else {
571 reg32 |= 12 << 22;
572 }
573 } else {
574 if (pagemod) {
575 reg32 |= 18 << 22;
576 } else {
577 reg32 |= 14 << 22;
578 }
579 }
580 break;
581 case MEM_CLOCK_800MHz:
582 if (reg8) {
583 if (pagemod) {
584 reg32 |= 18 << 22;
585 } else {
586 reg32 |= 14 << 22;
587 }
588 } else {
589 if (pagemod) {
590 reg32 |= 20 << 22;
591 } else {
592 reg32 |= 16 << 22;
593 }
594 }
595 break;
596 }
597 }
598 MCHBAR32(0x400*i + 0x252) = reg32;
599
600 MCHBAR16(0x400*i + 0x256) = (s->selected_timings.tRCD << 12) |
601 (0x4 << 8) | (ta2 << 4) | ta4;
602
603 MCHBAR32(0x400*i + 0x258) = (s->selected_timings.tRCD << 17) |
604 ((twl + 4 + s->selected_timings.tWTR) << 12) |
605 (ta3 << 8) | (4 << 4) | ta1;
606
607 MCHBAR16(0x400*i + 0x25b) = ((s->selected_timings.tRP + trpmod) << 9) |
608 s->selected_timings.tRFC;
609
610 MCHBAR16(0x400*i + 0x260) = (MCHBAR16(0x400*i + 0x260) & ~0x3fe) | (100 << 1);
611 MCHBAR8(0x400*i + 0x264) = 0xff;
612 MCHBAR8(0x400*i + 0x25d) = (MCHBAR8(0x400*i + 0x25d) & ~0x3f) |
613 s->selected_timings.tRAS;
614 MCHBAR16(0x400*i + 0x244) = 0x2310;
615
616 switch (s->selected_timings.mem_clk) {
617 case MEM_CLOCK_667MHz:
618 reg8 = 0;
619 break;
620 default:
621 reg8 = 1;
622 break;
623 }
624
625 MCHBAR8(0x400*i + 0x246) = (MCHBAR8(0x400*i + 0x246) & ~0x1f) |
626 (reg8 << 2) | 1;
627
628 fsb = fsb2ps[s->selected_timings.fsb_clk];
629 ddr = ddr2ps[s->selected_timings.mem_clk];
630 reg32 = (u32)((s->selected_timings.CAS + 7 + reg8) * ddr);
631 reg32 = (u32)((reg32 / fsb) << 8);
632 reg32 |= 0x0e000000;
633 if ((fsb2mhz(s->selected_timings.fsb_clk) /
634 ddr2mhz(s->selected_timings.mem_clk)) > 2) {
635 reg32 |= 1 << 24;
636 }
637 MCHBAR32(0x400*i + 0x248) = (MCHBAR32(0x400*i + 0x248) & ~0x0f001f00) |
638 reg32;
639
640 if (twl > 2) {
641 flag1 = 1;
642 }
643 if (s->selected_timings.mem_clk >= MEM_CLOCK_800MHz) {
644 flag2 = 1;
645 }
646 reg16 = (u8)(twl - 1 - flag1 - flag2);
647 reg16 |= reg16 << 4;
648 if (s->selected_timings.mem_clk == MEM_CLOCK_1333MHz) {
649 if (reg16) {
650 reg16--;
651 }
652 }
653 reg16 |= flag1 << 8;
654 reg16 |= flag2 << 9;
655 MCHBAR16(0x400*i + 0x24d) = (MCHBAR16(0x400*i + 0x24d) & ~0x1ff) | reg16;
656 MCHBAR16(0x400*i + 0x25e) = 0x15a5;
657 MCHBAR32(0x400*i + 0x265) = MCHBAR32(0x400*i + 0x265) & ~0x1f;
658 MCHBAR32(0x400*i + 0x269) = (MCHBAR32(0x400*i + 0x269) & ~0x000fffff) |
659 (0x3f << 14) | lut1[s->selected_timings.mem_clk];
660 MCHBAR8(0x400*i + 0x274) = MCHBAR8(0x400*i + 0x274) | 1;
661 MCHBAR8(0x400*i + 0x24c) = MCHBAR8(0x400*i + 0x24c) & ~0x3;
662
663 reg16 = 0;
664 switch (s->selected_timings.mem_clk) {
665 default:
666 case MEM_CLOCK_667MHz:
667 reg16 = 0x99;
668 break;
669 case MEM_CLOCK_800MHz:
670 if (s->selected_timings.CAS == 5) {
671 reg16 = 0x19a;
672 } else if (s->selected_timings.CAS == 6) {
673 reg16 = 0x9a;
674 }
675 break;
676 }
677 reg16 &= 0x7;
678 reg16 += twl + 9;
679 reg16 <<= 10;
680 MCHBAR16(0x400*i + 0x24d) = (MCHBAR16(0x400*i + 0x24d) & ~0x7c00) | reg16;
681 MCHBAR8(0x400*i + 0x267) = (MCHBAR8(0x400*i + 0x267) & ~0x3f) | 0x13;
682 MCHBAR8(0x400*i + 0x268) = (MCHBAR8(0x400*i + 0x268) & ~0xff) | 0x4a;
683
684 reg16 = (MCHBAR16(0x400*i + 0x269) & 0xc000) >> 2;
685 reg16 += 2 << 12;
686 reg16 |= (0x15 << 6) | 0x1f;
687 MCHBAR16(0x400*i + 0x26d) = (MCHBAR16(0x400*i + 0x26d) & ~0x7fff) | reg16;
688
689 reg32 = (1 << 25) | (6 << 27);
690 MCHBAR32(0x400*i + 0x269) = (MCHBAR32(0x400*i + 0x269) & ~0xfa300000) | reg32;
691 MCHBAR8(0x400*i + 0x271) = MCHBAR8(0x400*i + 0x271) & ~0x80;
692 MCHBAR8(0x400*i + 0x274) = MCHBAR8(0x400*i + 0x274) & ~0x6;
693 } // END EACH POPULATED CHANNEL
694
695 reg16 = 0x1f << 5;
696 reg16 |= 0xe << 10;
697 MCHBAR16(0x125) = (MCHBAR16(0x125) & ~0x3fe0) | reg16;
698 MCHBAR16(0x127) = (MCHBAR16(0x127) & ~0x7ff) | 0x540;
699 MCHBAR8(0x129) = MCHBAR8(0x129) | 0x1f;
700 MCHBAR8(0x12c) = MCHBAR8(0x12c) | 0xa0;
701 MCHBAR32(0x241) = (MCHBAR32(0x241) & ~0x1ffff) | 0x11;
702 MCHBAR32(0x641) = (MCHBAR32(0x641) & ~0x1ffff) | 0x11;
703 MCHBAR8(0x246) = MCHBAR8(0x246) & ~0x10;
704 MCHBAR8(0x646) = MCHBAR8(0x646) & ~0x10;
705 MCHBAR32(0x120) = (2 << 29) | (1 << 28) | (1 << 23) | 0xd7f5f;
706 reg8 = (u8)((MCHBAR32(0x252) & 0x1e000) >> 13);
707 MCHBAR8(0x12d) = (MCHBAR8(0x12d) & ~0xf0) | (reg8 << 4);
708 reg8 = (u8)((MCHBAR32(0x258) & ~0x1e0000) >> 17);
709 MCHBAR8(0x12d) = (MCHBAR8(0x12d) & ~0xf) | reg8;
710 MCHBAR8(0x12f) = 0x4c;
711 reg32 = (1 << 31) | (0x80 << 14) | (1 << 13) | (0xa << 9);
712 MCHBAR32(0x6c0) = (MCHBAR32(0x6c0) & ~0xffffff00) | reg32;
713 MCHBAR8(0x6c4) = (MCHBAR8(0x6c4) & ~0x7) | 0x2;
714}
715
716static void dll_ddr2(struct sysinfo *s)
717{
718 u8 i, j, r, reg8, clk, async;
719 u16 reg16 = 0;
720 u32 reg32 = 0;
721 u8 lane;
722
723 MCHBAR16(0x180) = (MCHBAR16(0x180) & ~0x7e06) | 0xc04;
724 MCHBAR16(0x182) = (MCHBAR16(0x182) & ~0x3ff) | 0xc8;
725 MCHBAR16(0x18a) = (MCHBAR16(0x18a) & ~0x1f1f) | 0x0f0f;
726 MCHBAR16(0x1b4) = (MCHBAR16(0x1b4) & ~0x8020) | 0x100;
727 MCHBAR8(0x194) = (MCHBAR8(0x194) & ~0x77) | 0x33;
728 switch (s->selected_timings.mem_clk) {
729 default:
730 case MEM_CLOCK_667MHz:
731 reg16 = (0xa << 9) | 0xa;
732 break;
733 case MEM_CLOCK_800MHz:
734 reg16 = (0x9 << 9) | 0x9;
735 break;
736 }
737 MCHBAR16(0x19c) = (MCHBAR16(0x19c) & ~0x1e0f) | reg16;
738 MCHBAR16(0x19c) = (MCHBAR16(0x19c) & ~0x2030) | 0x2010;
739 udelay(1);
740 MCHBAR16(0x198) = MCHBAR16(0x198) & ~0x100;
741
742 MCHBAR16(0x1c8) = (MCHBAR16(0x1c8) & ~0x1f) | 0xd;
743
744 udelay(1);
745 MCHBAR8(0x190) = MCHBAR8(0x190) & ~1;
746 udelay(1); // 533ns
747 MCHBAR32(0x198) = MCHBAR32(0x198) & ~0x11554000;
748 udelay(1);
749 MCHBAR32(0x198) = MCHBAR32(0x198) & ~0x1455;
750 udelay(1);
751 MCHBAR8(0x583) = MCHBAR8(0x583) & ~0x1c;
752 MCHBAR8(0x983) = MCHBAR8(0x983) & ~0x1c;
753 udelay(1); // 533ns
754 MCHBAR8(0x583) = MCHBAR8(0x583) & ~0x3;
755 MCHBAR8(0x983) = MCHBAR8(0x983) & ~0x3;
756 udelay(1); // 533ns
757
758 // ME related
759 MCHBAR32(0x1a0) = (MCHBAR32(0x1a0) & ~0x7ffffff) | 0x551803;
760
761 MCHBAR16(0x1b4) = MCHBAR16(0x1b4) & ~0x800;
762 MCHBAR8(0x1a8) = MCHBAR8(0x1a8) | 0xf0;
763
764 FOR_EACH_CHANNEL(i) {
765 reg16 = 0;
766 MCHBAR16(0x400*i + 0x59c) = MCHBAR16(0x400*i + 0x59c) & ~0x3000;
767
768 reg32 = 0;
769 FOR_EACH_RANK_IN_CHANNEL(r) if (!RANK_IS_POPULATED(s->dimms, i, r)) {
770 reg32 |= 0x111 << r;
771 }
772 MCHBAR32(0x400*i + 0x59c) = (MCHBAR32(0x400*i + 0x59c) & ~0xfff) | reg32;
773 MCHBAR8(0x400*i + 0x594) = MCHBAR8(0x400*i + 0x594) & ~1;
774
775 if (!CHANNEL_IS_POPULATED(s->dimms, i)) {
776 printk(BIOS_DEBUG, "No dimms in channel %d\n", i);
777 reg8 = 0x3f;
778 } else if(ONLY_DIMMA_IS_POPULATED(s->dimms, i)) {
779 printk(BIOS_DEBUG, "DimmA populated only in channel %d\n", i);
780 reg8 = 0x38;
781 } else if(ONLY_DIMMB_IS_POPULATED(s->dimms, i)) {
782 printk(BIOS_DEBUG, "DimmB populated only in channel %d\n", i);
783 reg8 = 0x7;
784 } else if(BOTH_DIMMS_ARE_POPULATED(s->dimms, i)) {
785 printk(BIOS_DEBUG, "Both dimms populated in channel %d\n", i);
786 reg8 = 0;
787 } else {
788 die("Unhandled case\n");
789 }
790
791 //reg8 = 0x00; // FIXME dont switch on all clocks anyway
792
793 MCHBAR32(0x400*i + 0x5a0) = (MCHBAR32(0x400*i + 0x5a0) & ~0x3f000000) |
794 ((u32)(reg8 << 24));
795 } // END EACH CHANNEL
796
797 MCHBAR8(0x1a8) = MCHBAR8(0x1a8) | 1;
798 MCHBAR8(0x1a8) = MCHBAR8(0x1a8) & ~0x4;
799
800 // Update DLL timing
801 MCHBAR8(0x1a4) = MCHBAR8(0x1a4) & ~0x80;
802 MCHBAR8(0x1a4) = MCHBAR8(0x1a4) | 0x40;
803 MCHBAR16(0x5f0) = (MCHBAR16(0x5f0) & ~0x400) | 0x400;
804
805 u8 dll_setting_667[23][5] = {
806 // tap pi db delay
807 {13, 0, 1,0, 0},
808 {4, 1, 0,0, 0},
809 {13, 0, 1,0, 0},
810 {4, 5, 0,0, 0},
811 {4, 1, 0,0, 0},
812 {4, 1, 0,0, 0},
813 {4, 1, 0,0, 0},
814 {1, 5, 1,1, 1},
815 {1, 6, 1,1, 1},
816 {2, 0, 1,1, 1},
817 {2, 1, 1,1, 1},
818 {2, 1, 1,1, 1},
819 {14, 6, 1,0, 0},
820 {14, 3, 1,0, 0},
821 {14, 0, 1,0, 0},
822 {9, 0, 0,0, 1},
823 {9, 1, 0,0, 1},
824 {9, 2, 0,0, 1},
825 {9, 2, 0,0, 1},
826 {9, 1, 0,0, 1},
827 {6, 4, 0,0, 1},
828 {6, 2, 0,0, 1},
829 {5, 4, 0,0, 1}
830 };
831
832 u8 dll_setting_800[23][5] = {
833 // tap pi db delay
834 {11, 5, 1,0, 0},
835 {0, 5, 1,1, 0},
836 {11, 5, 1,0, 0},
837 {1, 4, 1,1, 0},
838 {0, 5, 1,1, 0},
839 {0, 5, 1,1, 0},
840 {0, 5, 1,1, 0},
841 {2, 5, 1,1, 1},
842 {2, 6, 1,1, 1},
843 {3, 0, 1,1, 1},
844 {3, 0, 1,1, 1},
845 {3, 3, 1,1, 1},
846 {2, 0, 1,1, 1},
847 {1, 3, 1,1, 1},
848 {0, 3, 1,1, 1},
849 {9, 3, 0,0, 1},
850 {9, 4, 0,0, 1},
851 {9, 5, 0,0, 1},
852 {9, 6, 0,0, 1},
853 {10, 0, 0,0, 1},
854 {8, 1, 0,0, 1},
855 {7, 5, 0,0, 1},
856 {6, 2, 0,0, 1}
857 };
858
859 FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
860 MCHBAR16(0x400*i + 0x5f0) = (MCHBAR16(0x400*i + 0x5f0) & ~0x3fc) | 0x3fc;
861 MCHBAR32(0x400*i + 0x5fc) = MCHBAR32(0x400*i + 0x5fc) & ~0xcccccccc;
862 MCHBAR8(0x400*i + 0x5d9) = (MCHBAR8(0x400*i + 0x5d9) & ~0xf0) | 0x70;
863 MCHBAR16(0x400*i + 0x590) = (MCHBAR16(0x400*i + 0x590) & ~0xffff) | 0x5555;
864 }
865
866 FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
867 if (s->selected_timings.mem_clk == MEM_CLOCK_667MHz) {
868 clkset0(i, &dll_setting_667[CLKSET0][0]);
869 clkset1(i, &dll_setting_667[CLKSET1][0]);
870 ctrlset0(i, &dll_setting_667[CTRL0][0]);
871 ctrlset1(i, &dll_setting_667[CTRL1][0]);
872 ctrlset2(i, &dll_setting_667[CTRL2][0]);
873 ctrlset3(i, &dll_setting_667[CTRL3][0]);
874 cmdset(i, &dll_setting_667[CMD][0]);
875 } else {
876 clkset0(i, &dll_setting_800[CLKSET0][0]);
877 clkset1(i, &dll_setting_800[CLKSET1][0]);
878 ctrlset0(i, &dll_setting_800[CTRL0][0]);
879 ctrlset1(i, &dll_setting_800[CTRL1][0]);
880 ctrlset2(i, &dll_setting_800[CTRL2][0]);
881 ctrlset3(i, &dll_setting_800[CTRL3][0]);
882 cmdset(i, &dll_setting_800[CMD][0]);
883 }
884 }
885
886 // XXX if not async mode
887 MCHBAR16(0x180) = MCHBAR16(0x180) & ~0x8200;
888 MCHBAR8(0x180) = MCHBAR8(0x180) | 0x4;
889 j = 0;
890 for (i = 0; i < 16; i++) {
891 MCHBAR8(0x1c8) = (MCHBAR8(0x1c8) & ~0x1f) | i;
892 MCHBAR8(0x180) = MCHBAR8(0x180) | 0x10;
893 while (MCHBAR8(0x180) & 0x10);
894 if (MCHBAR32(0x184) == 0xffffffff) {
895 j++;
896 if (j >= 2)
897 break;
898
899 if (s->selected_timings.mem_clk == MEM_CLOCK_667MHz) {
900 j = 2;
901 break;
902 }
903 } else {
904 j = 0;
905 }
906 }
907 if (i == 1 || ((i == 0) && s->selected_timings.mem_clk == MEM_CLOCK_667MHz)) {
908 j = 0;
909 i++;
910 for (; i < 16; i++) {
911 MCHBAR8(0x1c8) = (MCHBAR8(0x1c8) & ~0x1f) | i;
912 MCHBAR8(0x180) = MCHBAR8(0x180) | 0x4;
913 while (MCHBAR8(0x180) & 0x10);
914 if (MCHBAR32(0x184) == 0) {
915 i++;
916 break;
917 }
918 }
919 for (; i < 16; i++) {
920 MCHBAR8(0x1c8) = (MCHBAR8(0x1c8) & ~0x1f) | i;
921 MCHBAR8(0x180) = MCHBAR8(0x180) | 0x10;
922 while (MCHBAR8(0x180) & 0x10);
923 if (MCHBAR32(0x184) == 0xffffffff) {
924 j++;
925 if (j >= 2)
926 break;
927 } else {
928 j = 0;
929 }
930 }
931 if (j < 2) {
932 MCHBAR8(0x1c8) = MCHBAR8(0x1c8) & ~0x1f;
933 MCHBAR8(0x180) = MCHBAR8(0x180) | 0x10;
934 while (MCHBAR8(0x180) & 0x10);
935 j = 2;
936 }
937 }
938
939 if (j < 2) {
940 MCHBAR8(0x1c8) = MCHBAR8(0x1c8) & ~0x1f;
941 async = 1;
942 }
943
944 clk = 0x1a;
945 if (async != 1) {
946 reg8 = MCHBAR8(0x188) & 0x1e;
947 if (s->selected_timings.mem_clk == MEM_CLOCK_667MHz &&
948 s->selected_timings.fsb_clk == FSB_CLOCK_800MHz) {
949 clk = 0x10;
950 } else if (s->selected_timings.mem_clk == MEM_CLOCK_800MHz) {
951 clk = 0x10;
952 } else {
953 clk = 0x1a;
954 }
955 }
956 MCHBAR8(0x180) = MCHBAR8(0x180) & ~0x80;
957
958 if ((s->selected_timings.fsb_clk == FSB_CLOCK_800MHz) &&
959 (s->selected_timings.mem_clk == MEM_CLOCK_667MHz)) {
960 i = MCHBAR8(0x180) & 0xf;
961 i = (i + 10) % 14;
962 MCHBAR8(0x1c8) = (MCHBAR8(0x1c8) & ~0x1f) | i;
963 MCHBAR8(0x180) = MCHBAR8(0x180) | 0x10;
964 while(MCHBAR8(0x180) & 0x10);
965 }
966
967 reg8 = MCHBAR8(0x188) & ~1;
968 MCHBAR8(0x188) = reg8;
969 reg8 &= ~0x3e;
970 reg8 |= clk;
971 MCHBAR8(0x188) = reg8;
972 reg8 |= 1;
973 MCHBAR8(0x188) = reg8;
974
975 if (s->selected_timings.mem_clk == MEM_CLOCK_1333MHz) {
976 MCHBAR8(0x18c) = MCHBAR8(0x18c) | 1;
977 }
978
979 // Program DQ/DQS dll settings
980 reg32 = 0;
981 FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
982 for (lane = 0; lane < 8; lane++) {
983 if (s->selected_timings.mem_clk == MEM_CLOCK_667MHz) {
984 reg32 = 0x06db7777;
985 } else if (s->selected_timings.mem_clk == MEM_CLOCK_800MHz) {
986 reg32 = 0x00007777;
987 }
988 MCHBAR32(0x400*i + 0x540 + lane*4) =
989 (MCHBAR32(0x400*i + 0x540 + lane*4) & 0x0fffffff) |
990 reg32;
991 }
992 }
993
994 FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
995 if (s->selected_timings.mem_clk == MEM_CLOCK_667MHz) {
996 for (lane = 0; lane < 8; lane++) {
997 dqsset(i, lane, &dll_setting_667[DQS1+lane][0]);
998 }
999 for (lane = 0; lane < 8; lane++) {
1000 dqset(i, lane, &dll_setting_667[DQ1+lane][0]);
1001 }
1002 } else {
1003 for (lane = 0; lane < 8; lane++) {
1004 dqsset(i, lane, &dll_setting_800[DQS1+lane][0]);
1005 }
1006 for (lane = 0; lane < 8; lane++) {
1007 dqset(i, lane, &dll_setting_800[DQ1+lane][0]);
1008 }
1009 }
1010 }
1011}
1012
1013static void rcomp_ddr2(struct sysinfo *s)
1014{
1015 u8 i, j, k;
1016 u32 x32a[8] = { 0x04040404, 0x06050505, 0x09090807, 0x0D0C0B0A, 0x04040404, 0x08070605, 0x0C0B0A09, 0x100F0E0D };
1017 u16 x378[6] = { 0, 0xAAAA, 0x7777, 0x7777, 0x7777, 0x7777 };
1018 u32 x382[6] = { 0, 0x02020202, 0x02020202, 0x02020202, 0x04030303, 0x04030303 };
1019 u32 x386[6] = { 0, 0x03020202, 0x03020202, 0x03020202, 0x05040404, 0x05040404 };
1020 u32 x38a[6] = { 0, 0x04040303, 0x04040303, 0x04040303, 0x07070605, 0x07070605 };
1021 u32 x38e[6] = { 0, 0x06060505, 0x06060505, 0x06060505, 0x09090808, 0x09090808 };
1022 u32 x392[6] = { 0, 0x02020202, 0x02020202, 0x02020202, 0x03030202, 0x03030202 };
1023 u32 x396[6] = { 0, 0x03030202, 0x03030202, 0x03030202, 0x05040303, 0x05040303 };
1024 u32 x39a[6] = { 0, 0x04040403, 0x04040403, 0x04040403, 0x07070605, 0x07070605 };
1025 u32 x39e[6] = { 0, 0x06060505, 0x06060505, 0x06060505, 0x08080808, 0x08080808 };
1026 u16 addr[6] = { 0x31c, 0x374, 0x3a2, 0x3d0, 0x3fe, 0x42c };
1027 u8 bit[6] = { 0, 0, 1, 1, 0, 0 };
1028
1029 FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
1030 for (j = 0; j < 6; j++) {
1031 if (j == 0) {
1032 MCHBAR32(0x400*i + addr[j]) =
1033 (MCHBAR32(0x400*i + addr[j]) & ~0xff000) | 0xaa000;
1034 MCHBAR16(0x400*i + 0x320) = (MCHBAR16(0x400*i + 0x320) & ~0xffff) | 0x6666;
1035 for (k = 0; k < 8; k++) {
1036 MCHBAR32(0x400*i + addr[j] + 0xe + (k << 2)) =
1037 (MCHBAR32(0x400*i + addr[j] + 0xe + (k << 2)) & ~0x3f3f3f3f) | x32a[k];
1038 MCHBAR32(0x400*i + addr[j] + 0x2e + (k << 2)) =
1039 (MCHBAR32(0x400*i + addr[j] + 0x2e + (k << 2)) & ~0x3f3f3f3f) | x32a[k];
1040 }
1041 } else {
1042 MCHBAR16(0x400*i + addr[j]) = (MCHBAR16(0x400*i + addr[j]) & ~0xf000) | 0xa000;
1043 MCHBAR16(0x400*i + addr[j] + 4) = (MCHBAR16(0x400*i + addr[j] + 4) & ~0xffff) |
1044 x378[j];
1045 MCHBAR32(0x400*i + addr[j] + 0xe) =
1046 (MCHBAR32(0x400*i + addr[j] + 0xe) & ~0x3f3f3f3f) | x382[j];
1047 MCHBAR32(0x400*i + addr[j] + 0x12) =
1048 (MCHBAR32(0x400*i + addr[j] + 0x12) & ~0x3f3f3f3f) | x386[j];
1049 MCHBAR32(0x400*i + addr[j] + 0x16) =
1050 (MCHBAR32(0x400*i + addr[j] + 0x16) & ~0x3f3f3f3f) | x38a[j];
1051 MCHBAR32(0x400*i + addr[j] + 0x1a) =
1052 (MCHBAR32(0x400*i + addr[j] + 0x1a) & ~0x3f3f3f3f) | x38e[j];
1053 MCHBAR32(0x400*i + addr[j] + 0x1e) =
1054 (MCHBAR32(0x400*i + addr[j] + 0x1e) & ~0x3f3f3f3f) | x392[j];
1055 MCHBAR32(0x400*i + addr[j] + 0x22) =
1056 (MCHBAR32(0x400*i + addr[j] + 0x22) & ~0x3f3f3f3f) | x396[j];
1057 MCHBAR32(0x400*i + addr[j] + 0x26) =
1058 (MCHBAR32(0x400*i + addr[j] + 0x26) & ~0x3f3f3f3f) | x39a[j];
1059 MCHBAR32(0x400*i + addr[j] + 0x2a) =
1060 (MCHBAR32(0x400*i + addr[j] + 0x2a) & ~0x3f3f3f3f) | x39e[j];
1061 }
1062 MCHBAR8(0x400*i + addr[j]) = (MCHBAR8(0x400*i + addr[j]) & ~1) | bit[j];
1063 }
1064 MCHBAR8(0x400*i + 0x45a) = (MCHBAR8(0x400*i + 0x45a) & ~0x3f) | 0x12;
1065 MCHBAR8(0x400*i + 0x45e) = (MCHBAR8(0x400*i + 0x45e) & ~0x3f) | 0x12;
1066 MCHBAR8(0x400*i + 0x462) = (MCHBAR8(0x400*i + 0x462) & ~0x3f) | 0x12;
1067 MCHBAR8(0x400*i + 0x466) = (MCHBAR8(0x400*i + 0x466) & ~0x3f) | 0x12;
1068 } // END EACH POPULATED CHANNEL
1069
1070 MCHBAR32(0x134) = (MCHBAR32(0x134) & ~0x63c00) | 0x63c00;
1071 MCHBAR16(0x174) = (MCHBAR16(0x174) & ~0x63ff) | 0x63ff;
1072 MCHBAR16(0x178) = 0x0135;
1073 MCHBAR32(0x130) = (MCHBAR32(0x130) & ~0x7bdffe0) | 0x7a9ffa0;
1074
1075 if (!CHANNEL_IS_POPULATED(s->dimms, 0)) {
1076 MCHBAR32(0x130) = MCHBAR32(0x130) & ~(1 << 27);
1077 }
1078 if (!CHANNEL_IS_POPULATED(s->dimms, 1)) {
1079 MCHBAR32(0x130) = MCHBAR32(0x130) & ~(1 << 28);
1080 }
1081
1082 MCHBAR8(0x130) = MCHBAR8(0x130) | 1;
1083}
1084
1085static void odt_ddr2(struct sysinfo *s)
1086{
1087 u8 i;
1088 u16 odt[16][2] = {
1089 { 0x0000,0x0000 }, // NC_NC
1090 { 0x0000,0x0001 }, // x8SS_NC
1091 { 0x0000,0x0011 }, // x8DS_NC
1092 { 0x0000,0x0001 }, // x16SS_NC
1093 { 0x0004,0x0000 }, // NC_x8SS
1094 { 0x0101,0x0404 }, // x8SS_x8SS
1095 { 0x0101,0x4444 }, // x8DS_x8SS
1096 { 0x0101,0x0404 }, // x16SS_x8SS
1097 { 0x0044,0x0000 }, // NC_x8DS
1098 { 0x1111,0x0404 }, // x8SS_x8DS
1099 { 0x1111,0x4444 }, // x8DS_x8DS
1100 { 0x1111,0x0404 }, // x16SS_x8DS
1101 { 0x0004,0x0000 }, // NC_x16SS
1102 { 0x0101,0x0404 }, // x8SS_x16SS
1103 { 0x0101,0x4444 }, // x8DS_x16SS
1104 { 0x0101,0x0404 }, // x16SS_x16SS
1105 };
1106
1107 FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
1108 MCHBAR16(0x400*i + 0x298) = odt[s->dimm_config[i]][1];
1109 MCHBAR16(0x400*i + 0x294) = odt[s->dimm_config[i]][0];
1110 MCHBAR16(0x400*i + 0x29c) = (MCHBAR16(0x400*i + 0x29c) & ~0xfff) | 0x66b;
1111 MCHBAR32(0x400*i + 0x260) = (MCHBAR32(0x400*i + 0x260) & ~0x70e3c00) | 0x3063c00;
1112 }
1113}
1114
1115static void dojedec_ddr2(u8 r, u8 ch, u8 cmd, u16 val)
1116{
1117 u32 addr = (ch << 29) | (r*0x08000000);
1118 volatile u32 rubbish;
1119
1120 MCHBAR8(0x271) = (MCHBAR8(0x271) & ~0x3e) | cmd;
1121 MCHBAR8(0x671) = (MCHBAR8(0x671) & ~0x3e) | cmd;
1122 rubbish = read32((void*)((val<<3) | addr));
1123 udelay(10);
1124 MCHBAR8(0x271) = (MCHBAR8(0x271) & ~0x3e) | NORMALOP_CMD;
1125 MCHBAR8(0x671) = (MCHBAR8(0x671) & ~0x3e) | NORMALOP_CMD;
1126}
1127
1128static void jedec_ddr2(struct sysinfo *s)
1129{
1130 u8 i;
1131 u16 mrsval, ch, r, v;
1132
1133 u8 odt[16][4] = {
1134 {0x00, 0x00, 0x00, 0x00},
1135 {0x01, 0x00, 0x00, 0x00},
1136 {0x01, 0x01, 0x00, 0x00},
1137 {0x01, 0x00, 0x00, 0x00},
1138 {0x00, 0x00, 0x01, 0x00},
1139 {0x11, 0x00, 0x11, 0x00},
1140 {0x11, 0x11, 0x11, 0x00},
1141 {0x11, 0x00, 0x11, 0x00},
1142 {0x00, 0x00, 0x01, 0x01},
1143 {0x11, 0x00, 0x11, 0x11},
1144 {0x11, 0x11, 0x11, 0x11},
1145 {0x11, 0x00, 0x11, 0x11},
1146 {0x00, 0x00, 0x01, 0x00},
1147 {0x11, 0x00, 0x11, 0x00},
1148 {0x11, 0x11, 0x11, 0x00},
1149 {0x11, 0x00, 0x11, 0x00}
1150 };
1151
1152 u16 jedec[12][2] = {
1153 {NOP_CMD, 0x0},
1154 {PRECHARGE_CMD, 0x0},
1155 {EMRS2_CMD, 0x0},
1156 {EMRS3_CMD, 0x0},
1157 {EMRS1_CMD, 0x0},
1158 {MRS_CMD, 0x100}, // DLL Reset
1159 {PRECHARGE_CMD, 0x0},
1160 {CBR_CMD, 0x0},
1161 {CBR_CMD, 0x0},
1162 {MRS_CMD, 0x0}, // DLL out of reset
1163 {EMRS1_CMD, 0x380}, // OCD calib default
1164 {EMRS1_CMD, 0x0}
1165 };
1166
1167 mrsval = (s->selected_timings.CAS << 4) | ((s->selected_timings.tWR - 1) << 9) | 0xb;
1168
1169 printk(BIOS_DEBUG, "MRS...\n");
1170
1171 udelay(200);
1172
1173 FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
1174 printk(BIOS_DEBUG, "CH%d: Found Rank %d\n", ch, r);
1175 for (i = 0; i < 12; i++) {
1176 v = jedec[i][1];
1177 switch (jedec[i][0]) {
1178 case EMRS1_CMD:
1179 v |= (odt[s->dimm_config[ch]][r] << 2);
1180 break;
1181 case MRS_CMD:
1182 v |= mrsval;
1183 break;
1184 default:
1185 break;
1186 }
1187 dojedec_ddr2(r + ch*4, ch, jedec[i][0], v);
1188 udelay(1);
1189 //printk(BIOS_DEBUG, "Jedec step %d\n", i);
1190 }
1191 }
1192 printk(BIOS_DEBUG, "MRS done\n");
1193}
1194
1195static u8 sampledqs(u16 mchloc, u32 addr, u8 hilow, u8 repeat)
1196{
1197 u8 dqsmatch = 1;
1198 volatile u32 strobe;
1199
1200 while (repeat-- > 0) {
1201 MCHBAR8(0x5d8) = MCHBAR8(0x5d8) & ~0x2;
1202 udelay(2);
1203 MCHBAR8(0x5d8) = MCHBAR8(0x5d8) | 0x2;
1204 udelay(2);
1205 MCHBAR8(0x9d8) = MCHBAR8(0x9d8) & ~0x2;
1206 udelay(2);
1207 MCHBAR8(0x9d8) = MCHBAR8(0x9d8) | 0x2;
1208 udelay(2);
1209 barrier();
1210 strobe = read32((u32 *)addr);
1211 barrier();
1212 if (((MCHBAR32(mchloc) & 0x40) >> 6) != hilow) {
1213 dqsmatch = 0;
1214 }
1215 }
1216 return dqsmatch;
1217}
1218
1219static void rcven_ddr2(struct sysinfo *s)
1220{
1221 u8 i, reg8, ch, lane;
1222 u32 addr;
1223 u8 tap = 0;
1224 u8 savecc, savemedium, savetap, coarsecommon, medium;
1225 u8 lanecoarse[8] = {0};
1226 u8 mincoarse = 0xff;
1227 u8 pitap[2][8];
1228 u16 coarsectrl[2];
1229 u16 coarsedelay[2];
1230 u16 mediumphase[2];
1231 u16 readdelay[2];
1232 u16 mchbar;
1233 MCHBAR8(0x5d8) = MCHBAR8(0x5d8) & ~0xc;
1234 MCHBAR8(0x9d8) = MCHBAR8(0x9d8) & ~0xc;
1235 MCHBAR8(0x5dc) = MCHBAR8(0x5dc) & ~0x80;
1236
1237 FOR_EACH_POPULATED_CHANNEL(s->dimms, ch) {
1238 addr = (ch << 29);
1239 for (i = 0; !RANK_IS_POPULATED(s->dimms, ch, i); i++) {
1240 addr += 128*1024*1024;
1241 }
1242 for (lane = 0; lane < 8; lane++) {
1243 printk(BIOS_DEBUG, "Channel %d, Lane %d addr=0x%08x\n", ch, lane, addr);
1244 coarsecommon = (s->selected_timings.CAS - 1);
1245 switch (lane) {
1246 case 0: case 1: medium = 0; break;
1247 case 2: case 3: medium = 1; break;
1248 case 4: case 5: medium = 2; break;
1249 case 6: case 7: medium = 3; break;
1250 default: medium = 0; break;
1251 }
1252 mchbar = 0x400*ch + 0x561 + (lane << 2);
1253 tap = 0;
1254 MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) & ~0xf0000) |
1255 (coarsecommon << 16);
1256 MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) & ~(3 << (lane*2))) |
1257 (medium << (lane*2));
1258 MCHBAR8(0x400*ch + 0x560 + lane*4) = MCHBAR8(0x400*ch + 0x560 + lane*4) & ~0xf;
1259 MCHBAR8(0x400*ch + 0x560 + lane*4) = MCHBAR8(0x400*ch + 0x560 + lane*4) & ~0x70;
1260 savecc = coarsecommon;
1261 savemedium = medium;
1262 savetap = 0;
1263
1264 MCHBAR16(0x400*ch + 0x588) = (MCHBAR16(0x400*ch + 0x588) & ~(3 << (lane*2))) |
1265 (1 << (lane*2));
1266
1267 printk(BIOS_DEBUG, "rcven 0.1 coarse=%d\n", coarsecommon);
1268 while (sampledqs(mchbar, addr, 1, 1) == 1) {
1269 if (medium < 3) {
1270 medium++;
1271 MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
1272 ~(3 << (lane*2))) | (medium << (lane*2));
1273 } else {
1274 medium = 0;
1275 coarsecommon++;
1276 MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) &
1277 ~0xf0000) | (coarsecommon << 16);
1278 MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
1279 ~(3 << (lane*2))) | (medium << (lane*2));
1280 }
1281 if (coarsecommon > 16) {
1282 die("Coarse > 16: DQS tuning failed, halt\n");
1283 break;
1284 }
1285 }
1286 printk(BIOS_DEBUG, " GOT IT (high -> low transition) coarse=%d medium=%d\n", coarsecommon, medium);
1287
1288 savemedium = medium;
1289 savecc = coarsecommon;
1290 if (medium < 3) {
1291 medium++;
1292 MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
1293 ~(3 << (lane*2))) | (medium << (lane*2));
1294 } else {
1295 medium = 0;
1296 coarsecommon++;
1297
1298 MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) & ~0xf0000) |
1299 (coarsecommon << 16);
1300 MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) & ~(3 << (lane*2))) |
1301 (medium << (lane*2));
1302 }
1303
1304 printk(BIOS_DEBUG, "rcven 0.2\n");
1305 while (sampledqs(mchbar, addr, 0, 1) == 1) {
1306 savemedium = medium;
1307 savecc = coarsecommon;
1308 if (medium < 3) {
1309 medium++;
1310 MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
1311 ~(3 << (lane*2))) | (medium << (lane*2));
1312 } else {
1313 medium = 0;
1314 coarsecommon++;
1315 MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) &
1316 ~0xf0000) | (coarsecommon << 16);
1317 MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
1318 ~(3 << (lane*2))) | (medium << (lane*2));
1319 }
1320 if (coarsecommon > 16) {
1321 die("Coarse DQS tuning 2 failed, halt\n");
1322 break;
1323 }
1324 }
1325 printk(BIOS_DEBUG, " GOT IT (low -> high transition) coarse=%d medium=%d\n", coarsecommon, medium);
1326
1327
1328 coarsecommon = savecc;
1329 medium = savemedium;
1330 MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) &
1331 ~0xf0000) | (coarsecommon << 16);
1332 MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
1333 ~(3 << (lane*2))) | (medium << (lane*2));
1334
1335 printk(BIOS_DEBUG, "rcven 0.3\n");
1336 tap = 0;
1337 while (sampledqs(mchbar, addr, 1, 1) == 0) {
1338 savetap = tap;
1339 tap++;
1340 if (tap > 14) {
1341 break;
1342 }
1343 MCHBAR8(0x400*ch + 0x560 + (lane*4)) =
1344 (MCHBAR8(0x400*ch + 0x560 + (lane*4)) & ~0xf) | tap;
1345 }
1346
1347 tap = savetap;
1348 MCHBAR8(0x400*ch + 0x560 + (lane*4)) =
1349 (MCHBAR8(0x400*ch + 0x560 + (lane*4)) & ~0xf) | tap;
1350 MCHBAR8(0x400*ch + 0x560 + (lane*4)) =
1351 (MCHBAR8(0x400*ch + 0x560 + (lane*4)) & ~0x70) | 0x30;
1352 if (medium < 3) {
1353 medium++;
1354 MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
1355 ~(3 << (lane*2))) | (medium << (lane*2));
1356 } else {
1357 medium = 0;
1358 coarsecommon++;
1359 MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) &
1360 ~0xf0000) | (coarsecommon << 16);
1361 MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
1362 ~(3 << (lane*2))) | (medium << (lane*2));
1363 }
1364 if (sampledqs(mchbar, addr, 1, 1) == 0) {
1365 die("Not at DQS high, doh\n");
1366 }
1367
1368 printk(BIOS_DEBUG, "rcven 0.4\n");
1369 while (sampledqs(mchbar, addr, 1, 1) == 1) {
1370 coarsecommon--;
1371 MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) &
1372 ~0xf0000) | (coarsecommon << 16);
1373 if (coarsecommon == 0) {
1374 die("Couldn't find DQS-high 0 indicator, halt\n");
1375 break;
1376 }
1377 }
1378 printk(BIOS_DEBUG, " GOT IT (high -> low transition) coarse=%d medium=%d\n", coarsecommon, medium);
1379
1380 printk(BIOS_DEBUG, "rcven 0.5\n");
1381 while (sampledqs(mchbar, addr, 0, 1) == 1) {
1382 savemedium = medium;
1383 savecc = coarsecommon;
1384 if (medium < 3) {
1385 medium++;
1386 MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
1387 ~(3 << (lane*2))) | (medium << (lane*2));
1388 } else {
1389 medium = 0;
1390 coarsecommon++;
1391 MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) &
1392 ~0xf0000) | (coarsecommon << 16);
1393 MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
1394 ~(3 << (lane*2))) | (medium << (lane*2));
1395 }
1396 if (coarsecommon > 16) {
1397 die("Coarse DQS tuning 5 failed, halt\n");
1398 break;
1399 }
1400 }
1401 printk(BIOS_DEBUG, " GOT IT (low -> high transition) coarse=%d medium=%d\n", coarsecommon, medium);
1402
1403 printk(BIOS_DEBUG, "rcven 0.6\n");
1404 coarsecommon = savecc;
1405 medium = savemedium;
1406 MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) &
1407 ~0xf0000) | (coarsecommon << 16);
1408 MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
1409 ~(3 << (lane*2))) | (medium << (lane*2));
1410 while (sampledqs(mchbar, addr, 1, 1) == 0) {
1411 savetap = tap;
1412 tap++;
1413 if (tap > 14) {
1414 break;
1415 }
1416 MCHBAR8(0x400*ch + 0x560 + lane*4) =
1417 (MCHBAR8(0x400*ch + 0x560 + lane*4) & ~0xf) | tap;
1418 }
1419 tap = savetap;
1420 MCHBAR8(0x400*ch + 0x560 + lane*4) =
1421 (MCHBAR8(0x400*ch + 0x560 + lane*4) & ~0xf) | tap;
1422 MCHBAR8(0x400*ch + 0x560 + lane*4) =
1423 (MCHBAR8(0x400*ch + 0x560 + lane*4) & ~0x70) | 0x70;
1424
1425 pitap[ch][lane] = 0x70 | tap;
1426
1427 MCHBAR16(0x400*ch + 0x588) = MCHBAR16(0x400*ch + 0x588) & ~(3 << (lane*2));
1428 lanecoarse[lane] = coarsecommon;
1429 printk(BIOS_DEBUG, "rcven 0.7\n");
1430 } // END EACH LANE
1431
1432 // Find minimum coarse value
1433 for (lane = 0; lane < 8; lane++) {
1434 if (mincoarse > lanecoarse[lane]) {
1435 mincoarse = lanecoarse[lane];
1436 }
1437 }
1438
1439 printk(BIOS_DEBUG, "Found min coarse value = %d\n", mincoarse);
1440
1441 for (lane = 0; lane < 8; lane++) {
1442 reg8 = (lanecoarse[lane] == 0) ? 0 : lanecoarse[lane] - mincoarse;
1443 MCHBAR16(0x400*ch + 0x5fa) = (MCHBAR16(0x400*ch + 0x5fa) & ~(3 << (lane*2))) |
1444 (reg8 << (lane*2));
1445 }
1446 MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) & ~0xf0000) | (mincoarse << 16);
1447 coarsectrl[ch] = mincoarse;
1448 coarsedelay[ch] = MCHBAR16(0x400*ch + 0x5fa);
1449 mediumphase[ch] = MCHBAR16(0x400*ch + 0x58c);
1450 readdelay[ch] = MCHBAR16(0x400*ch + 0x588);
1451 } // END EACH POPULATED CHANNEL
1452
1453 /* TODO: Resume support using this */
1454 FOR_EACH_CHANNEL(ch) {
1455 for (lane = 0; lane < 8; lane++) {
1456 MCHBAR8(0x400*ch + 0x560 + (lane*4)) =
1457 (MCHBAR8(0x400*ch + 0x560 + (lane*4)) & ~0xf) | pitap[ch][lane];
1458 }
1459 MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) & ~0xf0000) |
1460 (coarsectrl[ch] << 16);
1461 MCHBAR16(0x400*ch + 0x5fa) = coarsedelay[ch];
1462 MCHBAR16(0x400*ch + 0x58c) = mediumphase[ch];
1463 }
1464 printk(BIOS_DEBUG, "End rcven\n");
1465}
1466
1467static void dradrb_ddr2(struct sysinfo *s)
1468{
1469 u8 map, i, ch, r, rankpop0, rankpop1;
1470 u32 c0dra = 0;
1471 u32 c1dra = 0;
1472 u32 c0drb = 0;
1473 u32 c1drb = 0;
1474 u32 dra;
1475 u32 dra0;
1476 u32 dra1;
1477 u16 totalmemorymb;
Damien Zammit9fb08f52016-01-22 18:56:23 +11001478 u32 size, offset;
1479 u32 size0, size1;
Damien Zammit4b513a62015-08-20 00:37:05 +10001480 u8 dratab[2][2][2][4] = {
1481 {
1482 {
1483 {0xff, 0xff, 0xff, 0xff},
1484 {0xff, 0x00, 0x02, 0xff}
1485 },
1486 {
1487 {0xff, 0x01, 0xff, 0xff},
1488 {0xff, 0x03, 0xff, 0xff}
1489 }
1490 },
1491 {
1492 {
1493 {0xff, 0xff, 0xff, 0xff},
1494 {0xff, 0x04, 0x06, 0x08}
1495 },
1496 {
1497 {0xff, 0xff, 0xff, 0xff},
1498 {0x05, 0x07, 0x09, 0xff}
1499 }
1500 }
1501 };
1502
1503 u8 drbtab[10] = {0x04, 0x02, 0x08, 0x04, 0x08, 0x04, 0x10, 0x08, 0x20, 0x10};
1504
1505 // DRA
1506 rankpop0 = 0;
1507 rankpop1 = 0;
1508 FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
1509 if ((s->dimms[ch<<1].card_type && ((r) < s->dimms[ch<<1].ranks))) {
1510 i = ch << 1;
1511 } else {
1512 i = (ch << 1) + 1;
1513 }
1514 dra = dratab[s->dimms[i].banks]
1515 [s->dimms[i].width]
1516 [s->dimms[i].cols-9]
1517 [s->dimms[i].rows-12];
1518 if (s->dimms[i].banks == 1) {
1519 dra |= 0x80;
1520 }
1521 if (ch == 0) {
1522 c0dra |= dra << (r*8);
1523 rankpop0 |= 1 << r;
1524 } else {
1525 c1dra |= dra << (r*8);
1526 rankpop1 |= 1 << r;
1527 }
1528 }
1529 MCHBAR32(0x208) = c0dra;
1530 MCHBAR32(0x608) = c1dra;
1531
1532 MCHBAR8(0x262) = (MCHBAR8(0x262) & ~0xf0) | ((rankpop0 << 4) & 0xf0);
1533 MCHBAR8(0x662) = (MCHBAR8(0x662) & ~0xf0) | ((rankpop1 << 4) & 0xf0);
1534
1535 if (ONLY_DIMMA_IS_POPULATED(s->dimms, 0) || ONLY_DIMMB_IS_POPULATED(s->dimms, 0)) {
1536 MCHBAR8(0x260) = MCHBAR8(0x260) | 1;
1537 }
1538 if (ONLY_DIMMA_IS_POPULATED(s->dimms, 1) || ONLY_DIMMB_IS_POPULATED(s->dimms, 1)) {
1539 MCHBAR8(0x660) = MCHBAR8(0x660) | 1;
1540 }
1541
1542 // DRB
1543 FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
1544 if ((s->dimms[ch<<1].card_type && ((r) < s->dimms[ch<<1].ranks))) {
1545 i = ch << 1;
1546 } else {
1547 i = (ch << 1) + 1;
1548 }
1549 if (ch == 0) {
1550 dra0 = (c0dra >> (8*r)) & 0x7f;
1551 c0drb = (u16)(c0drb + drbtab[dra0]);
1552 s->dimms[i].rank_capacity_mb = drbtab[dra0] << 6;
1553 MCHBAR16(0x200 + 2*r) = c0drb;
1554 } else {
1555 dra1 = (c1dra >> (8*r)) & 0x7f;
1556 c1drb = (u16)(c1drb + drbtab[dra1]);
1557 s->dimms[i].rank_capacity_mb = drbtab[dra1] << 6;
1558 MCHBAR16(0x600 + 2*r) = c1drb;
1559 }
1560 }
1561
1562 s->channel_capacity[0] = c0drb << 6;
1563 s->channel_capacity[1] = c1drb << 6;
1564 totalmemorymb = s->channel_capacity[0] + s->channel_capacity[1];
1565 printk(BIOS_DEBUG, "Total memory: %d + %d = %dMiB\n",
1566 s->channel_capacity[0], s->channel_capacity[1], totalmemorymb);
1567
1568 rankpop1 >>= 4;
1569 if (rankpop1) {
1570 MCHBAR16(0x600 + 2*msbpos(rankpop1)) = c0drb + c1drb;
1571 MCHBAR16(0x602 + 2*msbpos(rankpop1)) = c0drb + c1drb;
1572 MCHBAR16(0x604 + 2*msbpos(rankpop1)) = c0drb + c1drb;
1573 MCHBAR16(0x606 + 2*msbpos(rankpop1)) = c0drb + c1drb;
1574 }
1575
Damien Zammit9fb08f52016-01-22 18:56:23 +11001576 /* Populated channel sizes in MiB */
1577 size0 = s->channel_capacity[0];
1578 size1 = s->channel_capacity[1];
1579
1580 MCHBAR8(0x111) = MCHBAR8(0x111) & ~0x2;
1581 MCHBAR8(0x111) = MCHBAR8(0x111) | (1 << 4);
1582
1583 /* Set ME UMA size in MiB */
1584 MCHBAR16(0x100) = ME_UMA_SIZEMB;
1585
1586 /* Set ME UMA Present bit */
1587 MCHBAR32(0x111) = MCHBAR32(0x111) | 1;
1588
1589 size = MIN(size0 - ME_UMA_SIZEMB, size1) * 2;
1590
1591 MCHBAR16(0x104) = size;
1592 MCHBAR16(0x102) = size0 + size1 - size;
1593
Damien Zammit4b513a62015-08-20 00:37:05 +10001594 map = 0;
Damien Zammit9fb08f52016-01-22 18:56:23 +11001595 if (size0 == 0) {
Damien Zammit4b513a62015-08-20 00:37:05 +10001596 map = 0;
Damien Zammit9fb08f52016-01-22 18:56:23 +11001597 } else if (size1 == 0) {
Damien Zammit4b513a62015-08-20 00:37:05 +10001598 map |= 0x20;
1599 } else {
1600 map |= 0x40;
1601 }
Damien Zammit9fb08f52016-01-22 18:56:23 +11001602 if (size == 0) {
1603 map |= 0x18;
1604 }
1605
1606 if (size0 - ME_UMA_SIZEMB >= size1) {
Damien Zammit4b513a62015-08-20 00:37:05 +10001607 map |= 0x4;
1608 }
1609 MCHBAR8(0x110) = map;
1610 MCHBAR16(0x10e) = 0;
Damien Zammit9fb08f52016-01-22 18:56:23 +11001611
1612 if (size1 != 0) {
Damien Zammit4b513a62015-08-20 00:37:05 +10001613 offset = 0;
Damien Zammit9fb08f52016-01-22 18:56:23 +11001614 } else if ((size0 > size1) && ((map & 0x7) == 0x4)) {
1615 offset = size/2 + (size0 + size1 - size);
Damien Zammit4b513a62015-08-20 00:37:05 +10001616 } else {
Damien Zammit9fb08f52016-01-22 18:56:23 +11001617 offset = size/2 + ME_UMA_SIZEMB;
Damien Zammit4b513a62015-08-20 00:37:05 +10001618 }
1619 MCHBAR16(0x108) = offset;
Damien Zammit9fb08f52016-01-22 18:56:23 +11001620 MCHBAR16(0x10a) = size/2;
Damien Zammit4b513a62015-08-20 00:37:05 +10001621}
1622
1623static void mmap_ddr2(struct sysinfo *s)
1624{
Damien Zammitd63115d2016-01-22 19:11:44 +11001625 bool reclaim;
1626 u32 gfxsize, gttsize, tsegsize, mmiosize, tom, tolud, touud;
1627 u32 gfxbase, gttbase, tsegbase, reclaimbase, reclaimlimit;
Damien Zammit4b513a62015-08-20 00:37:05 +10001628 u16 ggc;
1629 u16 ggc2uma[] = { 0, 0, 0, 0, 0, 32, 48, 64, 128, 256, 96, 160, 224, 352 };
1630 u8 ggc2gtt[] = { 0, 1, 0, 2, 0, 0, 0, 0, 0, 2, 3, 4};
1631
1632 ggc = pci_read_config16(PCI_DEV(0,0,0), 0x52);
1633 gfxsize = ggc2uma[(ggc & 0xf0) >> 4];
1634 gttsize = ggc2gtt[(ggc & 0xf00) >> 8];
1635 tsegsize = 1; // 1MB TSEG
1636 mmiosize = 0x400; // 1GB MMIO
Damien Zammit9fb08f52016-01-22 18:56:23 +11001637 tom = s->channel_capacity[0] + s->channel_capacity[1] - ME_UMA_SIZEMB;
Damien Zammit4b513a62015-08-20 00:37:05 +10001638 tolud = MIN(0x1000 - mmiosize, tom);
Damien Zammitd63115d2016-01-22 19:11:44 +11001639
1640 reclaim = false;
1641 if ((tom - tolud) > 0x40)
1642 reclaim = true;
1643
1644 if (reclaim) {
1645 tolud = tolud & ~0x3f;
1646 tom = tom & ~0x3f;
1647 reclaimbase = MAX(0x1000, tom);
1648 reclaimlimit = reclaimbase + (MIN(0x1000, tom) - tolud) - 0x40;
1649 }
1650
Damien Zammit4b513a62015-08-20 00:37:05 +10001651 touud = tom;
Damien Zammitd63115d2016-01-22 19:11:44 +11001652 if (reclaim)
1653 touud = reclaimlimit + 0x40;
1654
Damien Zammit4b513a62015-08-20 00:37:05 +10001655 gfxbase = tolud - gfxsize;
1656 gttbase = gfxbase - gttsize;
1657 tsegbase = gttbase - tsegsize;
1658
1659 pci_write_config16(PCI_DEV(0,0,0), 0xb0, tolud << 4);
1660 pci_write_config16(PCI_DEV(0,0,0), 0xa0, tom >> 6);
Damien Zammitd63115d2016-01-22 19:11:44 +11001661 if (reclaim) {
1662 pci_write_config16(PCI_DEV(0,0,0), 0x98,
1663 (u16)(reclaimbase >> 6));
1664 pci_write_config16(PCI_DEV(0,0,0), 0x9a,
1665 (u16)(reclaimlimit >> 6));
1666 }
Damien Zammit4b513a62015-08-20 00:37:05 +10001667 pci_write_config16(PCI_DEV(0,0,0), 0xa2, touud);
1668 pci_write_config32(PCI_DEV(0,0,0), 0xa4, gfxbase << 20);
1669 pci_write_config32(PCI_DEV(0,0,0), 0xa8, gttbase << 20);
1670 pci_write_config32(PCI_DEV(0,0,0), 0xac, tsegbase << 20);
1671}
1672
1673static void enhanced_ddr2(struct sysinfo *s)
1674{
1675 u8 ch, reg8;
1676
1677 MCHBAR32(0xfb0) = 0x1000d024;
1678 MCHBAR32(0xfb4) = 0xc842;
1679 MCHBAR32(0xfbc) = 0xf;
1680 MCHBAR32(0xfc4) = 0xfe22244;
1681 MCHBAR8(0x12f) = 0x5c;
1682 MCHBAR8(0xfb0) = (MCHBAR8(0xfb0) & ~1) | 1;
1683 MCHBAR8(0x12f) = MCHBAR8(0x12f) | 0x2;
1684 MCHBAR8(0x6c0) = (MCHBAR8(0x6c0) & ~0xf0) | 0xa0;
1685 MCHBAR32(0xfa8) = 0x30d400;
1686
1687 FOR_EACH_POPULATED_CHANNEL(s->dimms, ch) {
1688 MCHBAR8(0x400*ch + 0x26c) = MCHBAR8(0x400*ch + 0x26c) | 1;
1689 MCHBAR32(0x400*ch + 0x278) = 0x88141881;
1690 MCHBAR16(0x400*ch + 0x27c) = 0x0041;
1691 MCHBAR8(0x400*ch + 0x292) = 0xf2;
1692 MCHBAR16(0x400*ch + 0x272) = MCHBAR16(0x400*ch + 0x272) | 0x100;
1693 MCHBAR8(0x400*ch + 0x243) = (MCHBAR8(0x400*ch + 0x243) & ~0x2) | 1;
1694 MCHBAR32(0x400*ch + 0x288) = 0x8040200;
1695 MCHBAR32(0x400*ch + 0x28c) = 0xff402010;
1696 MCHBAR32(0x400*ch + 0x290) = 0x4f2091c;
1697 }
1698
1699 reg8 = pci_read_config8(PCI_DEV(0,0,0), 0xf0);
1700 pci_write_config8(PCI_DEV(0,0,0), 0xf0, reg8 | 1);
1701 MCHBAR32(0xfa0) = (MCHBAR32(0xfa0) & ~0x20002) | 0x2;
1702 MCHBAR32(0xfa4) = (MCHBAR32(0xfa4) & ~0x219100c3) | 0x219100c2;
1703 MCHBAR32(0x2c) = 0x44a53;
1704 MCHBAR32(0x30) = 0x1f5a86;
1705 MCHBAR32(0x34) = 0x1902810;
1706 MCHBAR32(0x38) = 0xf7000000;
1707 MCHBAR32(0x3c) = 0x23014410;
1708 MCHBAR32(0x40) = (MCHBAR32(0x40) & ~0x8f038000) | 0x8f038000;
1709 MCHBAR32(0x20) = 0x33001;
1710 pci_write_config8(PCI_DEV(0,0,0), 0xf0, reg8 & ~1);
1711}
1712
1713static void power_ddr2(struct sysinfo *s)
1714{
1715 u32 reg1, reg2, reg3, reg4, clkgate, x592;
1716 u8 lane, ch;
1717 u8 twl = 0;
1718 u16 x264, x23c;
1719
1720 twl = s->selected_timings.CAS - 1;
1721 x264 = 0x78;
1722 switch (s->selected_timings.mem_clk) {
1723 default:
1724 case MEM_CLOCK_667MHz:
1725 reg1 = 0x99;
1726 reg2 = 0x1048a9;
1727 clkgate = 0x230000;
1728 x23c = 0x7a89;
1729 break;
1730 case MEM_CLOCK_800MHz:
1731 if (s->selected_timings.CAS == 5) {
1732 reg1 = 0x19a;
1733 reg2 = 0x1048aa;
1734 } else {
1735 reg1 = 0x9a;
1736 reg2 = 0x2158aa;
1737 x264 = 0x89;
1738 }
1739 clkgate = 0x280000;
1740 x23c = 0x7b89;
1741 break;
1742 }
1743 reg3 = 0x232;
1744 reg4 = 0x2864;
1745
1746 if (CHANNEL_IS_POPULATED(s->dimms, 0) && CHANNEL_IS_POPULATED(s->dimms, 1)) {
1747 MCHBAR32(0x14) = 0x0010461f;
1748 } else {
1749 MCHBAR32(0x14) = 0x0010691f;
1750 }
1751 MCHBAR32(0x18) = 0xdf6437f7;
1752 MCHBAR32(0x1c) = 0x0;
1753 MCHBAR32(0x24) = (MCHBAR32(0x24) & ~0xe0000000) | 0x30000000;
1754 MCHBAR32(0x44) = (MCHBAR32(0x44) & ~0x1fef0000) | 0x6b0000;
1755 MCHBAR16(0x115) = (u16) reg1;
1756 MCHBAR32(0x117) = (MCHBAR32(0x117) & ~0xffffff) | reg2;
1757 MCHBAR8(0x124) = 0x7;
1758 MCHBAR16(0x12a) = (MCHBAR16(0x12a) & 0) | 0x80;
1759 MCHBAR8(0x12c) = (MCHBAR8(0x12c) & 0) | 0xa0;
1760 MCHBAR16(0x174) = MCHBAR16(0x174) & ~(1 << 15);
1761 MCHBAR16(0x188) = (MCHBAR16(0x188) & ~0x1f00) | 0x1f00;
1762 MCHBAR8(0x18c) = MCHBAR8(0x18c) & ~0x8;
1763 MCHBAR8(0x192) = (MCHBAR8(0x192) & ~1) | 1;
1764 MCHBAR8(0x193) = (MCHBAR8(0x193) & ~0xf) | 0xf;
1765 MCHBAR16(0x1b4) = (MCHBAR16(0x1b4) & ~0x480) | 0x80;
1766 MCHBAR16(0x210) = (MCHBAR16(0x210) & ~0x1fff) | 0x3f; // | clockgatingiii
1767 MCHBAR32(0x6d1) = (MCHBAR32(0x6d1) & ~0xff03ff) | 0x100 | clkgate;
1768 MCHBAR8(0x212) = (MCHBAR8(0x212) & ~0x7f) | 0x7f;
1769 MCHBAR32(0x2c0) = (MCHBAR32(0x2c0) & ~0xffff0) | 0xcc5f0;
1770 MCHBAR8(0x2c4) = (MCHBAR8(0x2c4) & ~0x70) | 0x70;
1771 MCHBAR32(0x2d1) = (MCHBAR32(0x2d1) & ~0xffffff) | 0xff2831; // | clockgatingi
1772 MCHBAR32(0x2d4) = 0x40453600;
1773 MCHBAR32(0x300) = 0xc0b0a08;
1774 MCHBAR32(0x304) = 0x6040201;
1775 MCHBAR32(0x30c) = (MCHBAR32(0x30c) & ~0x43c0f) | 0x41405;
1776 MCHBAR16(0x610) = 0x232;
1777 MCHBAR16(0x612) = 0x2864;
1778 MCHBAR32(0x62c) = (MCHBAR32(0x62c) & ~0xc000000) | 0x4000000;
1779 MCHBAR32(0xae4) = 0;
1780 MCHBAR32(0xc00) = (MCHBAR32(0xc00) & ~0xf0000) | 0x10000;
1781 MCHBAR32(0xf00) = 0x393a3b3c;
1782 MCHBAR32(0xf04) = 0x3d3e3f40;
1783 MCHBAR32(0xf08) = 0x393a3b3c;
1784 MCHBAR32(0xf0c) = 0x3d3e3f40;
1785 MCHBAR32(0xf18) = MCHBAR32(0xf18) & ~0xfff00001;
1786 MCHBAR32(0xf48) = 0xfff0ffe0;
1787 MCHBAR32(0xf4c) = 0xffc0ff00;
1788 MCHBAR32(0xf50) = 0xfc00f000;
1789 MCHBAR32(0xf54) = 0xc0008000;
1790 MCHBAR32(0xf6c) = (MCHBAR32(0xf6c) & ~0xffff0000) | 0xffff0000;
1791 MCHBAR32(0xfac) = MCHBAR32(0xfac) & ~0x80000000;
1792 MCHBAR32(0xfb8) = MCHBAR32(0xfb8) & ~0xff000000;
1793 MCHBAR32(0xfbc) = (MCHBAR32(0xfbc) & ~0x7f800) | 0xf000;
1794 MCHBAR32(0x1104) = 0x3003232;
1795 MCHBAR32(0x1108) = 0x74;
1796 if (s->selected_timings.fsb_clk == FSB_CLOCK_800MHz) {
1797 MCHBAR32(0x110c) = 0xaa;
1798 } else {
1799 MCHBAR32(0x110c) = 0x100;
1800 }
1801 MCHBAR32(0x1110) = 0x10810350 & ~0x78;
1802 MCHBAR32(0x1114) = 0;
1803 if (s->selected_timings.mem_clk == MEM_CLOCK_667MHz) {
1804 twl = 5;
1805 } else {
1806 twl = 6;
1807 }
1808 x592 = 0xff;
1809 if (pci_read_config8(PCI_DEV(0,0,0), 0x8) < 3) {
1810 x592 = ~0x4;
1811 }
1812 FOR_EACH_POPULATED_CHANNEL(s->dimms, ch) {
1813 MCHBAR8(0x400*ch + 0x239) = twl + 15;
1814 MCHBAR16(0x400*ch + 0x23c) = x23c;
1815 MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) & ~0x706033) | 0x406033;
1816 MCHBAR32(0x400*ch + 0x260) = (MCHBAR32(0x400*ch + 0x260) & ~(1 << 16)) | (1 << 16);
1817 MCHBAR8(0x400*ch + 0x264) = x264;
1818 MCHBAR8(0x400*ch + 0x592) = (MCHBAR8(0x400*ch + 0x592) & ~0x3f) | (0x3c & x592);
1819 MCHBAR8(0x400*ch + 0x593) = (MCHBAR8(0x400*ch + 0x593) & ~0x1f) | 0x1e;
1820 }
1821
1822 for (lane = 0; lane < 8; lane++) {
1823 MCHBAR8(0x561 + (lane << 2)) = MCHBAR8(0x561 + (lane << 2)) & ~(1 << 3);
1824 }
1825}
1826
1827void raminit_ddr2(struct sysinfo *s)
1828{
1829 u8 ch;
1830 u8 r, bank;
1831 u32 reg32;
1832
1833 // Select timings based on SPD info
1834 sdram_detect_smallest_params2(s);
1835
1836 // Reset if required
1837 checkreset_ddr2(s);
1838
1839 // Clear self refresh
1840 MCHBAR32(0xf14) = MCHBAR32(0xf14) | 0x3;
1841
1842 // Clear host clk gate reg
1843 MCHBAR32(0x1c) = MCHBAR32(0x1c) | 0xffffffff;
1844
1845 // Select DDR2
1846 MCHBAR8(0x1a8) = MCHBAR8(0x1a8) & ~0x4;
1847
1848 // Set freq
1849 MCHBAR32(0xc00) = (MCHBAR32(0xc00) & ~0x70) |
1850 (s->selected_timings.mem_clk << 4) | (1 << 10);
1851
1852 // Overwrite freq if chipset rejects it
1853 s->selected_timings.mem_clk = (MCHBAR8(0xc00) & 0x70) >> 4;
1854 if (s->selected_timings.mem_clk > (s->max_fsb + 3)) {
1855 die("Error: DDR is faster than FSB, halt\n");
1856 }
1857
1858 udelay(250000);
1859
1860 // Program clock crossing
1861 clkcross_ddr2(s);
1862 printk(BIOS_DEBUG, "Done clk crossing\n");
1863
1864 // DDR2 IO
1865 setioclk_ddr2(s);
1866 printk(BIOS_DEBUG, "Done I/O clk\n");
1867
1868 // Grant to launch
1869 launch_ddr2(s);
1870 printk(BIOS_DEBUG, "Done launch\n");
1871
1872 // Program DDR2 timings
1873 timings_ddr2(s);
1874 printk(BIOS_DEBUG, "Done timings\n");
1875
1876 // Program DLL
1877 dll_ddr2(s);
1878
1879 // RCOMP
1880 rcomp_ddr2(s);
1881 printk(BIOS_DEBUG, "RCOMP\n");
1882
1883 // ODT
1884 odt_ddr2(s);
1885 printk(BIOS_DEBUG, "Done ODT\n");
1886
1887 // RCOMP update
1888 while ((MCHBAR8(0x130) & 1) != 0 );
1889 printk(BIOS_DEBUG, "Done RCOMP update\n");
1890
1891 // Set defaults
1892 MCHBAR32(0x260) = (MCHBAR32(0x260) & ~1) | 0xf00000;
1893 MCHBAR32(0x660) = (MCHBAR32(0x660) & ~1) | 0xf00000;
1894 MCHBAR32(0x208) = 0x01010101;
1895 MCHBAR32(0x608) = 0x01010101;
1896 MCHBAR32(0x200) = 0x00040002;
1897 MCHBAR32(0x204) = 0x00080006;
1898 MCHBAR32(0x600) = 0x00040002;
1899 MCHBAR32(0x604) = 0x00100006;
1900 MCHBAR8(0x111) = MCHBAR8(0x111) | 0x2;
1901 MCHBAR32(0x104) = 0;
1902 MCHBAR16(0x102) = 0x400;
1903 MCHBAR8(0x100) = (2 << 5) | (3 << 3);
1904 MCHBAR16(0x10e) = 0;
1905 MCHBAR32(0x108) = 0;
1906 pci_write_config16(PCI_DEV(0,0,0), 0xb0, 0x4000);
1907 pci_write_config16(PCI_DEV(0,0,0), 0xa0, 0x0010);
1908 pci_write_config16(PCI_DEV(0,0,0), 0xa2, 0x0400);
1909 pci_write_config32(PCI_DEV(0,0,0), 0xa4, 0x40000000);
1910 pci_write_config32(PCI_DEV(0,0,0), 0xa8, 0x40000000);
1911 pci_write_config32(PCI_DEV(0,0,0), 0xac, 0x40000000);
1912
1913 // IOBUFACT
1914 if (CHANNEL_IS_POPULATED(s->dimms, 0)) {
1915 MCHBAR8(0x5dd) = (MCHBAR8(0x5dd) & ~0x3f) | 0x3f;
1916 MCHBAR8(0x5d8) = MCHBAR8(0x5d8) | 0x7;
1917 }
1918 if (CHANNEL_IS_POPULATED(s->dimms, 1)) {
1919 if (pci_read_config8(PCI_DEV(0,0,0), 0x8) < 2) {
1920 MCHBAR8(0x5dd) = (MCHBAR8(0x5dd) & ~0x3f) | 0x3f;
1921 MCHBAR8(0x5d8) = MCHBAR8(0x5d8) | 1;
1922 }
1923 MCHBAR8(0x9dd) = (MCHBAR8(0x9dd) & ~0x3f) | 0x3f;
1924 MCHBAR8(0x9d8) = MCHBAR8(0x9d8) | 0x7;
1925 }
1926
1927 // Pre jedec
1928 MCHBAR8(0x40) = MCHBAR8(0x40) | 0x2;
1929 FOR_EACH_POPULATED_CHANNEL(s->dimms, ch) {
1930 MCHBAR32(0x400*ch + 0x260) = MCHBAR32(0x400*ch + 0x260) | (1 << 27);
1931 }
1932 MCHBAR16(0x212) = (MCHBAR16(0x212) & ~0xf000) | 0xf000;
1933 MCHBAR16(0x212) = (MCHBAR16(0x212) & ~0xf00) | 0xf00;
1934 printk(BIOS_DEBUG, "Done pre-jedec\n");
1935
1936 // JEDEC reset
1937 jedec_ddr2(s);
1938
1939 printk(BIOS_DEBUG, "Done jedec steps\n");
1940
1941 // After JEDEC reset
1942 MCHBAR8(0x40) = MCHBAR8(0x40) & ~0x2;
1943 FOR_EACH_POPULATED_CHANNEL(s->dimms, ch) {
1944 if (s->selected_timings.mem_clk == MEM_CLOCK_667MHz) {
1945 reg32 = (2 << 18) | (3 << 13) | (5 << 8);
1946 } else {
1947 reg32 = (2 << 18) | (3 << 13) | (4 << 8);
1948 }
1949 MCHBAR32(0x400*ch + 0x274) = (MCHBAR32(0x400*ch + 0x274) & ~0xfff00) | reg32;
1950 MCHBAR8(0x400*ch + 0x274) = MCHBAR8(0x400*ch + 0x274) & ~0x80;
1951 MCHBAR8(0x400*ch + 0x26c) = MCHBAR8(0x400*ch + 0x26c) | 1;
1952 MCHBAR32(0x400*ch + 0x278) = 0x88141881;
1953 MCHBAR16(0x400*ch + 0x27c) = 0x41;
1954 MCHBAR8(0x400*ch + 0x292) = 0xf2;
1955 MCHBAR8(0x400*ch + 0x271) = (MCHBAR8(0x400*ch + 0x271) & ~0xe) | 0xe;
1956 }
1957 MCHBAR8(0x2c4) = MCHBAR8(0x2c4) | 0x8;
1958 MCHBAR8(0x2c3) = MCHBAR8(0x2c3) | 0x40;
1959 MCHBAR8(0x2c4) = MCHBAR8(0x2c4) | 0x4;
1960
1961 printk(BIOS_DEBUG, "Done post-jedec\n");
1962
1963 // Set DDR2 init complete
1964 FOR_EACH_POPULATED_CHANNEL(s->dimms, ch) {
1965 MCHBAR32(0x400*ch + 0x268) = (MCHBAR32(0x400*ch + 0x268) & ~0xc0000000) | 0xc0000000;
1966 }
1967
1968 // Receive enable
1969 rcven_ddr2(s);
1970 printk(BIOS_DEBUG, "Done rcven\n");
1971
1972 // Finish rcven
1973 FOR_EACH_CHANNEL(ch) {
1974 MCHBAR8(0x400*ch + 0x5d8) = MCHBAR8(0x400*ch + 0x5d8) & ~0xe;
1975 MCHBAR8(0x400*ch + 0x5d8) = MCHBAR8(0x400*ch + 0x5d8) | 0x2;
1976 MCHBAR8(0x400*ch + 0x5d8) = MCHBAR8(0x400*ch + 0x5d8) | 0x4;
1977 MCHBAR8(0x400*ch + 0x5d8) = MCHBAR8(0x400*ch + 0x5d8) | 0x8;
1978 }
1979 MCHBAR8(0x5dc) = MCHBAR8(0x5dc) | 0x80;
1980 MCHBAR8(0x5dc) = MCHBAR8(0x5dc) & ~0x80;
1981 MCHBAR8(0x5dc) = MCHBAR8(0x5dc) | 0x80;
1982
1983 // Dummy writes / reads
1984 volatile u32 data;
1985 FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
1986 for (bank = 0; bank < 4; bank++) {
1987 reg32 = (ch << 29) | (r*0x8000000) | (bank << 12);
1988 write32((u32 *)reg32, 0xffffffff);
1989 data = read32((u32 *)reg32);
1990 printk(BIOS_DEBUG, "Wrote ones, Read: [0x%08x]=0x%08x\n", reg32, data);
1991 write32((u32 *)reg32, 0x00000000);
1992 data = read32((u32 *)reg32);
1993 printk(BIOS_DEBUG, "Wrote zeros, Read: [0x%08x]=0x%08x\n", reg32, data);
1994 }
1995 }
1996 printk(BIOS_DEBUG, "Done dummy reads\n");
1997
1998 // XXX tRD
1999
2000 // XXX Write training
2001
2002 // XXX Read training
2003
2004 // DRADRB
2005 dradrb_ddr2(s);
2006 printk(BIOS_DEBUG, "Done DRADRB\n");
2007
2008 // Memory map
2009 mmap_ddr2(s);
2010 printk(BIOS_DEBUG, "Done memory map\n");
2011
2012 // Enhanced mode
2013 enhanced_ddr2(s);
2014 printk(BIOS_DEBUG, "Done enhanced mode\n");
2015
2016 // Periodic RCOMP
2017 MCHBAR16(0x160) = (MCHBAR16(0x160) & ~0xfff) | 0x999;
2018 MCHBAR16(0x1b4) = MCHBAR16(0x1b4) | 0x3000;
2019 MCHBAR8(0x130) = MCHBAR8(0x130) | 0x82;
2020 printk(BIOS_DEBUG, "Done PRCOMP\n");
2021
2022 // Power settings
2023 power_ddr2(s);
2024 printk(BIOS_DEBUG, "Done power settings\n");
2025
2026 // ME related
Damien Zammitd63115d2016-01-22 19:11:44 +11002027 if (RANK_IS_POPULATED(s->dimms, 0, 0)
2028 || RANK_IS_POPULATED(s->dimms, 1, 0)) {
2029 MCHBAR8(0xa2f) = MCHBAR8(0xa2f) | (1 << 0);
2030 }
2031 if (RANK_IS_POPULATED(s->dimms, 0, 1)
2032 || RANK_IS_POPULATED(s->dimms, 1, 1)) {
2033 MCHBAR8(0xa2f) = MCHBAR8(0xa2f) | (1 << 1);
2034 }
2035 MCHBAR32(0xa30) = MCHBAR32(0xa30) | (1 << 26);
Damien Zammit4b513a62015-08-20 00:37:05 +10002036
2037 printk(BIOS_DEBUG, "Done ddr2\n");
2038}