blob: 2248d03c89959cbd6c761d5281da909410827abc [file] [log] [blame]
/* SPDX-License-Identifier: GPL-2.0-or-later */
#include <cf9_reset.h>
#include <device/mmio.h>
#include <device/pci_ops.h>
#include <device/smbus_host.h>
#include <commonlib/helpers.h>
#include <console/console.h>
#include <delay.h>
#include <lib.h>
#include "pineview.h"
#include "raminit.h"
#include <spd.h>
#include <string.h>
/*
 * Debugging macros
 *
 * PRINTK_DEBUG() forwards its arguments to printk() at BIOS_DEBUG level when
 * CONFIG(DEBUG_RAM_SETUP) is set. Otherwise it expands to nothing, so its
 * arguments are neither evaluated nor compiled in non-debug builds.
 */
#if CONFIG(DEBUG_RAM_SETUP)
#define PRINTK_DEBUG(x...) printk(BIOS_DEBUG, x)
#else
#define PRINTK_DEBUG(x...)
#endif
#define MAX_TCLK_667 0x30
#define MAX_TCLK_800 0x25
#define MAX_TAC_667 0x45
#define MAX_TAC_800 0x40
#define NOP_CMD (1 << 1)
#define PRE_CHARGE_CMD (1 << 2)
#define MRS_CMD ((1 << 2) | (1 << 1))
#define EMRS_CMD (1 << 3)
#define EMRS1_CMD (EMRS_CMD | (1 << 4))
#define EMRS2_CMD (EMRS_CMD | (1 << 5))
#define EMRS3_CMD (EMRS_CMD | (1 << 5) | (1 << 4))
#define ZQCAL_CMD ((1 << 3) | (1 << 1))
#define CBR_CMD ((1 << 3) | (1 << 2))
#define NORMAL_OP_CMD ((1 << 3) | (1 << 2) | (1 << 1))
#define UBDIMM 1
#define SODIMM 2
#define TOTAL_CHANNELS 1
#define TOTAL_DIMMS 2
#define DIMM_IS_POPULATED(dimms, idx) (dimms[idx].card_type != 0)
#define IF_DIMM_POPULATED(dimms, idx) if (dimms[idx].card_type != 0)
#define ONLY_DIMMA_IS_POPULATED(dimms, ch) (\
(DIMM_IS_POPULATED(dimms, (ch == 0) ? 0 : 2) && \
!DIMM_IS_POPULATED(dimms, (ch == 0) ? 1 : 3)))
#define ONLY_DIMMB_IS_POPULATED(dimms, ch) (\
(DIMM_IS_POPULATED(dimms, (ch == 0) ? 1 : 3) && \
!DIMM_IS_POPULATED(dimms, (ch == 0) ? 0 : 2)))
#define BOTH_DIMMS_ARE_POPULATED(dimms, ch) (\
(DIMM_IS_POPULATED(dimms, (ch == 0) ? 0 : 2) && \
(DIMM_IS_POPULATED(dimms, (ch == 0) ? 1 : 3))))
#define FOR_EACH_DIMM(idx) \
for (idx = 0; idx < TOTAL_DIMMS; ++idx)
#define FOR_EACH_POPULATED_DIMM(dimms, idx) \
FOR_EACH_DIMM(idx) IF_DIMM_POPULATED(dimms, idx)
#define CHANNEL_IS_POPULATED(dimms, idx) ((dimms[idx<<1].card_type != 0) || (dimms[(idx<<1) + 1].card_type != 0))
#define CHANNEL_IS_CARDF(dimms, idx) ((dimms[idx<<1].card_type == 0xf) || (dimms[(idx<<1) + 1].card_type == 0xf))
#define IF_CHANNEL_POPULATED(dimms, idx) if ((dimms[idx<<1].card_type != 0) || (dimms[(idx<<1) + 1].card_type != 0))
#define FOR_EACH_CHANNEL(idx) \
for (idx = 0; idx < TOTAL_CHANNELS; ++idx)
#define FOR_EACH_POPULATED_CHANNEL(dimms, idx) \
FOR_EACH_CHANNEL(idx) IF_CHANNEL_POPULATED(dimms, idx)
#define RANKS_PER_CHANNEL 4
#define FOR_EACH_RANK_IN_CHANNEL(r) \
for (r = 0; r < RANKS_PER_CHANNEL; ++r)
#define FOR_EACH_POPULATED_RANK_IN_CHANNEL(dimms, ch, r) \
FOR_EACH_RANK_IN_CHANNEL(r) if (rank_is_populated(dimms, ch, r))
#define FOR_EACH_RANK(ch, r) \
FOR_EACH_CHANNEL(ch) FOR_EACH_RANK_IN_CHANNEL(r)
#define FOR_EACH_POPULATED_RANK(dimms, ch, r) \
FOR_EACH_RANK(ch, r) if (rank_is_populated(dimms, ch, r))
/*
 * Tell whether rank r of channel ch is backed by a populated DIMM.
 *
 * The first DIMM of the channel (index ch << 1) owns rank numbers starting
 * at 0, the second DIMM (index (ch << 1) + 1) owns rank numbers starting at 2.
 * A DIMM only counts when its card_type is non-zero.
 */
static bool rank_is_populated(struct dimminfo dimms[], u8 ch, u8 r)
{
	const struct dimminfo *first = &dimms[ch << 1];
	const struct dimminfo *second = &dimms[(ch << 1) + 1];

	if (first->card_type && r < first->ranks)
		return true;

	return second->card_type && r >= 2 && r < (second->ranks + 2);
}
/*
 * Compiler barrier: an empty asm statement with a "memory" clobber, which
 * stops the compiler from moving memory accesses across this point. It emits
 * no instructions.
 */
static inline void barrier(void)
{
	__asm__ __volatile__("" : : : "memory");
}
static int decode_spd(struct dimminfo *d, int i)
{
d->type = 0;
if (d->spd_data[20] == 0x2) {
d->type = UBDIMM;
} else if (d->spd_data[20] == 0x4) {
d->type = SODIMM;
}
d->sides = (d->spd_data[5] & 0x7) + 1;
d->banks = (d->spd_data[17] >> 2) - 1;
d->chip_capacity = d->banks;
d->rows = d->spd_data[3];// - 12;
d->cols = d->spd_data[4];// - 9;
d->cas_latencies = 0x78;
d->cas_latencies &= d->spd_data[18];
if (d->cas_latencies == 0)
d->cas_latencies = 7;
d->tAAmin = d->spd_data[26];
d->tCKmin = d->spd_data[25];
d->width = (d->spd_data[13] >> 3) - 1;
d->page_size = (d->width+1) * (1 << d->cols); // Bytes
d->tRAS = d->spd_data[30];
d->tRP = d->spd_data[27];
d->tRCD = d->spd_data[29];
d->tWR = d->spd_data[36];
d->ranks = d->sides; // XXX
#if CONFIG(DEBUG_RAM_SETUP)
const char *ubso[2] = { "UB", "SO" };
#endif
PRINTK_DEBUG("%s-DIMM %d\n", &ubso[d->type][0], i);
PRINTK_DEBUG(" Sides : %d\n", d->sides);
PRINTK_DEBUG(" Banks : %d\n", d->banks);
PRINTK_DEBUG(" Ranks : %d\n", d->ranks);
PRINTK_DEBUG(" Rows : %d\n", d->rows);
PRINTK_DEBUG(" Cols : %d\n", d->cols);
PRINTK_DEBUG(" Page size : %d\n", d->page_size);
PRINTK_DEBUG(" Width : %d\n", (d->width + 1) * 8);
return 0;
}
/*
 * RAM Config: DIMMB-DIMMA
 * 0 EMPTY-EMPTY
 * 1 EMPTY-x16SS
 * 2 EMPTY-x16DS
 * 3 x16SS-x16SS
 * 4 x16DS-x16DS
 * 5 EMPTY- x8DS
 * 6 x8DS - x8DS
 */
/*
 * Classify the DIMM population of channel "chan" and store the resulting
 * RAM config number in s->dimm_config[chan].
 *
 * The two DIMMs of a channel are s->dimms[chan << 1] and
 * s->dimms[(chan << 1) + 1], the same mapping used by rank_is_populated()
 * and the CHANNEL_* macros. "sides" is 0 for an empty slot, 1 for a
 * single-sided and anything else for a double-sided module; "width" is 0
 * for x8 devices and non-zero for x16.
 *
 * Unsupported mixes end in die().
 */
static void find_ramconfig(struct sysinfo *s, u32 chan)
{
	const struct dimminfo *const first = &s->dimms[chan << 1];
	const struct dimminfo *const second = &s->dimms[(chan << 1) + 1];
	const bool first_x8 = (first->width == 0);
	const bool second_x8 = (second->width == 0);

	if (first->sides == 0) {
		/* First slot empty */
		if (second->sides == 0) {
			// NC/NC
			s->dimm_config[chan] = 0;
		} else if (second->sides == 1) {
			// NC/SS, x8 and x16 alike
			s->dimm_config[chan] = 1;
		} else {
			// NC/8DS or NC/16DS
			s->dimm_config[chan] = second_x8 ? 5 : 2;
		}
	} else if (first->sides == 1) {
		/* First slot single-sided */
		if (second->sides == 0) {
			// SS/NC, x8 and x16 alike
			s->dimm_config[chan] = 1;
		} else if (second->sides == 1 && first_x8 == second_x8) {
			// 8SS/8SS or 16SS/16SS
			s->dimm_config[chan] = 3;
		} else {
			// SS/SS with different widths, or SS/DS
			die("Mixed Not supported\n");
		}
	} else {
		/* First slot double-sided */
		if (second->sides == 0) {
			// 8DS/NC or 16DS/NC
			s->dimm_config[chan] = first_x8 ? 5 : 4;
		} else if (second->sides == 1) {
			// DS/SS: only the all-x16 combination is accepted
			if (first_x8 || second_x8) {
				die("Mixed Not supported\n");
			} else {
				s->dimm_config[chan] = 4;
			}
		} else if (first_x8 && second_x8) {
			// 8DS/8DS
			s->dimm_config[chan] = 6;
		}
		/*
		 * NOTE(review): any other DS/DS combination (e.g. 16DS/16DS)
		 * leaves s->dimm_config[chan] untouched, although the table
		 * above lists config 4 for x16DS-x16DS - confirm whether
		 * that is intended.
		 */
	}
}
/*
 * Read the first 64 SPD bytes of every DIMM slot, decode the populated ones
 * and work out the RAM configuration of each populated channel.
 *
 * A slot whose SPD cannot be read completely is marked empty (card_type 0).
 * Only SPD memory type 0x8 (recorded as DDR2) is accepted; anything else,
 * or no populated DIMM at all, ends in die().
 */
static void sdram_read_spds(struct sysinfo *s)
{
	u8 i, chan;
	s->dt0mode = 0;
	FOR_EACH_DIMM(i) {
		if (i2c_eeprom_read(s->spd_map[i], 0, 64, s->dimms[i].spd_data) != 64) {
			/*
			 * The buffer contents cannot be trusted after a failed
			 * read, so do not derive card_type from them.
			 */
			s->dimms[i].card_type = 0;
			continue;
		}
		s->dimms[i].card_type = s->dimms[i].spd_data[62] & 0x1f;
		hexdump(s->dimms[i].spd_data, 64);
	}
	s->spd_type = 0;
	FOR_EACH_POPULATED_DIMM(s->dimms, i) {
		switch (s->dimms[i].spd_data[2]) {
		case 0x8:
			s->spd_type = DDR2;
			break;
		case 0xb:
		default:
			die("DIMM type mismatch\n");
			break;
		}
	}
	/* Stays 1 when the loop body never runs, i.e. when no DIMM is populated */
	int err = 1;
	FOR_EACH_POPULATED_DIMM(s->dimms, i) {
		err = decode_spd(&s->dimms[i], i);
		s->dt0mode |= (s->dimms[i].spd_data[49] & 0x2) >> 1;
	}
	if (err) {
		die("No memory dimms, halt\n");
	}
	FOR_EACH_POPULATED_CHANNEL(s->dimms, chan) {
		find_ramconfig(s, chan);
		PRINTK_DEBUG(" Config[CH%d] : %d\n", chan, s->dimm_config[chan]);
	}
}
#if CONFIG(DEBUG_RAM_SETUP)
/* Convert an FSB clock index to MHz for debug output: 0 -> 667, 1 -> 800, ... */
static u32 fsb_reg_to_mhz(u32 speed)
{
	const u32 base_mhz = 667;
	const u32 step_mhz = 133;

	return base_mhz + (step_mhz * speed);
}
/* Convert a memory clock index to MHz for debug output; unknown indices give 0 */
static u32 ddr_reg_to_mhz(u32 speed)
{
	switch (speed) {
	case 0:
		return 667;
	case 1:
		return 800;
	default:
		return 0;
	}
}
#endif
// Return the 0-indexed position of the least significant set bit of val.
// A value of 0 has no set bit; -1 is returned in that case.
static int lsbpos(u8 val)
{
	int pos = 0;

	if (val == 0)
		return -1;

	/* Shift the value right until its lowest set bit reaches bit 0 */
	while ((val & 1) == 0) {
		val >>= 1;
		pos++;
	}
	return pos;
}
// Return the 0-indexed position of the most significant set bit of val.
// A value of 0 has no set bit; -1 is returned in that case.
static int msbpos(u8 val)
{
	int pos = -1;

	/* Each shift that still leaves bits behind moves the answer up by one */
	while (val != 0) {
		val >>= 1;
		pos++;
	}
	return pos;
}
static void sdram_detect_smallest_params(struct sysinfo *s)
{
static const u16 mult[6] = {
3000, // 667
2500, // 800
};
u8 i;
u32 maxtras = 0;
u32 maxtrp = 0;
u32 maxtrcd = 0;
u32 maxtwr = 0;
u32 maxtrfc = 0;
u32 maxtwtr = 0;
u32 maxtrrd = 0;
u32 maxtrtp = 0;
FOR_EACH_POPULATED_DIMM(s->dimms, i) {
maxtras = MAX(maxtras, (s->dimms[i].spd_data[30] * 1000));
maxtrp = MAX(maxtrp, (s->dimms[i].spd_data[27] * 1000) >> 2);
maxtrcd = MAX(maxtrcd, (s->dimms[i].spd_data[29] * 1000) >> 2);
maxtwr = MAX(maxtwr, (s->dimms[i].spd_data[36] * 1000) >> 2);
maxtrfc = MAX(maxtrfc, (s->dimms[i].spd_data[42] * 1000) +
(s->dimms[i].spd_data[40] & 0xf));
maxtwtr = MAX(maxtwtr, (s->dimms[i].spd_data[37] * 1000) >> 2);
maxtrrd = MAX(maxtrrd, (s->dimms[i].spd_data[28] * 1000) >> 2);
maxtrtp = MAX(maxtrtp, (s->dimms[i].spd_data[38] * 1000) >> 2);
}
/*
* TODO: on DDR3 there might be some minimal required values for some
* Timings: MIN_TRAS = 9, MIN_TRP = 3, MIN_TRCD = 3, MIN_TWR = 3,
* MIN_TWTR = 4, MIN_TRRD = 2, MIN_TRTP = 4
*/
s->selected_timings.tRAS = MIN(24, DIV_ROUND_UP(maxtras,
mult[s->selected_timings.mem_clock]));
s->selected_timings.tRP = MIN(10, DIV_ROUND_UP(maxtrp,
mult[s->selected_timings.mem_clock]));
s->selected_timings.tRCD = MIN(10, DIV_ROUND_UP(maxtrcd,
mult[s->selected_timings.mem_clock]));
s->selected_timings.tWR = MIN(15, DIV_ROUND_UP(maxtwr,
mult[s->selected_timings.mem_clock]));
/* Needs to be even */
s->selected_timings.tRFC = 0xfe & (MIN(78, DIV_ROUND_UP(maxtrfc,
mult[s->selected_timings.mem_clock])) + 1);
s->selected_timings.tWTR = MIN(15, DIV_ROUND_UP(maxtwtr,
mult[s->selected_timings.mem_clock]));
s->selected_timings.tRRD = MIN(15, DIV_ROUND_UP(maxtrrd,
mult[s->selected_timings.mem_clock]));
s->selected_timings.tRTP = MIN(15, DIV_ROUND_UP(maxtrtp,
mult[s->selected_timings.mem_clock]));
PRINTK_DEBUG("Selected timings:\n");
PRINTK_DEBUG("\tFSB: %dMHz\n", fsb_reg_to_mhz(s->selected_timings.fsb_clock));
PRINTK_DEBUG("\tDDR: %dMHz\n", ddr_reg_to_mhz(s->selected_timings.mem_clock));
PRINTK_DEBUG("\tCAS: %d\n", s->selected_timings.CAS);
PRINTK_DEBUG("\ttRAS: %d\n", s->selected_timings.tRAS);
PRINTK_DEBUG("\ttRP: %d\n", s->selected_timings.tRP);
PRINTK_DEBUG("\ttRCD: %d\n", s->selected_timings.tRCD);
PRINTK_DEBUG("\ttWR: %d\n", s->selected_timings.tWR);
PRINTK_DEBUG("\ttRFC: %d\n", s->selected_timings.tRFC);
PRINTK_DEBUG("\ttWTR: %d\n", s->selected_timings.tWTR);
PRINTK_DEBUG("\ttRRD: %d\n", s->selected_timings.tRRD);
PRINTK_DEBUG("\ttRTP: %d\n", s->selected_timings.tRTP);
}
/*
 * Determine the FSB clock, the memory clock and the CAS latency to use, store
 * them in s->selected_timings and, unless this is a reset boot path, program
 * the memory clock into CLKCFG.
 *
 * Also sets s->nodll, s->maxpi and s->pioffset according to the memory clock
 * that CLKCFG reports after the write.
 *
 * Calls die() when the DIMMs share no CAS latency or when no usable setting
 * is found.
 */
static void sdram_detect_ram_speed(struct sysinfo *s)
{
u8 cas, reg8;
u32 reg32;
u32 freq = 0;
u32 fsb = 0;
u8 i;
u8 commoncas = 0;
u8 highcas = 0;
u8 lowcas = 0;
// Core frequency
/* Taken from bits 6:4 of host bridge config register 0xe3; 0 selects the 800MHz default */
fsb = (pci_read_config8(HOST_BRIDGE, 0xe3) & 0x70) >> 4;
if (fsb) {
fsb = 5 - fsb;
} else {
fsb = FSB_CLOCK_800MHz;
}
// DDR frequency
/* Bit 7 of register 0xe3 becomes bit 0, bits 1:0 of register 0xe4 become bits 2:1 */
freq = (pci_read_config8(HOST_BRIDGE, 0xe3) & 0x80) >> 7;
freq |= (pci_read_config8(HOST_BRIDGE, 0xe4) & 0x03) << 1;
if (freq) {
freq = 6 - freq;
} else {
freq = MEM_CLOCK_800MHz;
}
// Detect a common CAS latency
/* AND together SPD byte 18 of all populated DIMMs */
commoncas = 0xff;
FOR_EACH_POPULATED_DIMM(s->dimms, i) {
commoncas &= s->dimms[i].spd_data[18];
}
if (commoncas == 0) {
die("No common CAS among dimms\n");
}
// commoncas is nonzero, so these calls will not error
u8 msbp = (u8)msbpos(commoncas);
u8 lsbp = (u8)lsbpos(commoncas);
// Start with fastest common CAS
/* The first pass does not go below CAS 5 */
cas = 0;
highcas = msbp;
lowcas = MAX(lsbp, 5);
/*
 * NOTE(review): the per-DIMM check below only looks at SPD bytes 9 and 10,
 * so its outcome does not depend on highcas. highcas is decremented once per
 * failing DIMM, and a DIMM that passes sets cas even if another DIMM failed
 * in the same pass - confirm this is the intended selection.
 */
while (cas == 0 && highcas >= lowcas) {
FOR_EACH_POPULATED_DIMM(s->dimms, i) {
switch (freq) {
case MEM_CLOCK_800MHz:
/* Same limits as MAX_TCLK_800 / MAX_TAC_800 */
if ((s->dimms[i].spd_data[9] > 0x25) ||
(s->dimms[i].spd_data[10] > 0x40)) {
// CAS too fast, lower it
highcas--;
/* This break only leaves the switch, not the DIMM loop */
break;
} else {
cas = highcas;
}
break;
case MEM_CLOCK_667MHz:
default:
/* Same limits as MAX_TCLK_667 / MAX_TAC_667 */
if ((s->dimms[i].spd_data[9] > 0x30) ||
(s->dimms[i].spd_data[10] > 0x45)) {
// CAS too fast, lower it
highcas--;
/* This break only leaves the switch, not the DIMM loop */
break;
} else {
cas = highcas;
}
break;
}
}
}
if (highcas < lowcas) {
// Timings not supported by MCH, lower the frequency
if (freq == MEM_CLOCK_800MHz) {
freq--;
PRINTK_DEBUG("Run DDR clock speed reduced due to timings\n");
} else {
die("Timings not supported by MCH\n");
}
/* Retry with the 667MHz limits, this time down to the lowest common CAS */
cas = 0;
highcas = msbp;
lowcas = lsbp;
/*
 * NOTE(review): highcas is a u8; if lowcas is 0 a decrement below 0 wraps to
 * 255 and keeps the loop condition true - confirm lsbp can never be 0 here.
 */
while (cas == 0 && highcas >= lowcas) {
FOR_EACH_POPULATED_DIMM(s->dimms, i) {
if ((s->dimms[i].spd_data[9] > 0x30) ||
(s->dimms[i].spd_data[10] > 0x45)) {
// CAS too fast, lower it
highcas--;
} else {
cas = highcas;
}
}
}
if (cas == 0) {
die("Unsupported dimms\n");
}
}
s->selected_timings.CAS = cas;
s->selected_timings.mem_clock = freq;
s->selected_timings.fsb_clock = fsb;
PRINTK_DEBUG("Drive Memory at %dMHz with CAS = %d clocks\n",
ddr_reg_to_mhz(s->selected_timings.mem_clock), s->selected_timings.CAS);
// Set memory frequency
/* On the reset boot path the clock registers are left untouched */
if (s->boot_path == BOOT_PATH_RESET)
return;
MCHBAR32_OR(PMSTS, 1);
/* Clear CLKCFG bits 6:4, set bit 10, then put 3 (800MHz) or 2 (667MHz) into bits 6:4 */
reg32 = (MCHBAR32(CLKCFG) & ~0x70) | (1 << 10);
if (s->selected_timings.mem_clock == MEM_CLOCK_800MHz) {
reg8 = 3;
} else {
reg8 = 2;
}
reg32 |= reg8 << 4;
MCHBAR32(CLKCFG) = reg32;
/* Read the field back and use what the register reports (field value minus 2) */
s->selected_timings.mem_clock = ((MCHBAR32(CLKCFG) >> 4) & 0x7) - 2;
if (s->selected_timings.mem_clock == MEM_CLOCK_800MHz) {
PRINTK_DEBUG("MCH validated at 800MHz\n");
s->nodll = 0;
s->maxpi = 63;
s->pioffset = 0;
} else if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
PRINTK_DEBUG("MCH validated at 667MHz\n");
s->nodll = 1;
s->maxpi = 15;
s->pioffset = 1;
} else {
/* nodll, maxpi and pioffset are not assigned on this path */
PRINTK_DEBUG("MCH set to unknown (%02x)\n",
(uint8_t) s->selected_timings.mem_clock & 0xff);
}
}
#define HPET_BASE 0xfed00000
#define HPET32(x) *((volatile u32 *)(HPET_BASE + x))
/*
 * Enable the HPET: clear bits 1:0 and set bit 7 of the HPTC register in RCBA
 * space, read the register back, then set bit 0 of the HPET register at
 * offset 0x10.
 */
static void enable_hpet(void)
{
	u32 hptc = RCBA32(HPTC);

	hptc = (hptc & ~0x03) | (1 << 7);
	RCBA32(HPTC) = hptc;
	/* On NM10 this only works if read back */
	RCBA32(HPTC);

	HPET32(0x10) |= 1;
}
/*
 * Program the clock crossing registers from two lookup tables that are
 * indexed by the selected FSB clock and memory clock
 * (s->selected_timings.fsb_clock / .mem_clock).
 */
static void sdram_clk_crossing(struct sysinfo *s)
{
	static const u32 clkcross[2][2][4] = {
	{
		{0xFFFFFFFF, 0x05030305, 0x0000FFFF, 0x00000000}, /* FSB = 667, DDR = 667 */
		{0x1F1F1F1F, 0x2A1F1FA5, 0x00000000, 0x05000002}, /* FSB = 667, DDR = 800 */
	},
	{
		{0x1F1F1F1F, 0x0D07070B, 0x00000000, 0x00000000}, /* FSB = 800, DDR = 667 */
		{0xFFFFFFFF, 0x05030305, 0x0000FFFF, 0x00000000}, /* FSB = 800, DDR = 800 */
	},
	};
	static const u32 clkcross2[2][2][8] = {
	{
		{ // FSB = 667, DDR = 667
			0x00000000, 0x08010204, 0x00000000, 0x08010204,
			0x00000000, 0x00000000, 0x00000000, 0x04080102,
		},
		{ // FSB = 667, DDR = 800
			0x04080000, 0x10010002, 0x10000000, 0x20010208,
			0x00000000, 0x00000004, 0x02040000, 0x08100102,
		},
	},
	{
		{ // FSB = 800, DDR = 667
			0x10000000, 0x20010208, 0x04080000, 0x10010002,
			0x00000000, 0x00000000, 0x08000000, 0x10200204,
		},
		{ // FSB = 800, DDR = 800
			0x00000000, 0x08010204, 0x00000000, 0x08010204,
			0x00000000, 0x00000000, 0x00000000, 0x04080102,
		},
	},
	};
	const u8 ddr = s->selected_timings.mem_clock;
	const u8 fsb = s->selected_timings.fsb_clock;
	/* Rows of the two tables that apply to this clock combination */
	const u32 *const row = clkcross[fsb][ddr];
	const u32 *const row2 = clkcross2[fsb][ddr];

	MCHBAR32(HMCCMP) = row[0];
	MCHBAR32(HMDCMP) = row[1];
	MCHBAR32(HMBYPCP) = row[2];
	MCHBAR32(HMCCPEXT) = 0;
	MCHBAR32(HMDCPEXT) = row[3];

	MCHBAR32_OR(HMCCMC, 1 << 7);

	/* Extra clearing for table index FSB = 0 (667), DDR = 1 (800) */
	if (fsb == 0 && ddr == 1) {
		MCHBAR8(CLKXSSH2MCBYPPHAS) = 0;
		MCHBAR32(CLKXSSH2MD) = 0;
		MCHBAR32(CLKXSSH2MD + 4) = 0;
	}

	/* The first three register pairs all receive table entries 0 and 1 */
	MCHBAR32(CLKXSSH2MCBYP) = row2[0];
	MCHBAR32(CLKXSSH2MCRDQ) = row2[0];
	MCHBAR32(CLKXSSH2MCRDCST) = row2[0];
	MCHBAR32(CLKXSSH2MCBYP + 4) = row2[1];
	MCHBAR32(CLKXSSH2MCRDQ + 4) = row2[1];
	MCHBAR32(CLKXSSH2MCRDCST + 4) = row2[1];
	MCHBAR32(CLKXSSMC2H) = row2[2];
	MCHBAR32(CLKXSSMC2H + 4) = row2[3];
	MCHBAR32(CLKXSSMC2HALT) = row2[4];
	MCHBAR32(CLKXSSMC2HALT + 4) = row2[5];
	MCHBAR32(CLKXSSH2X2MD) = row2[6];
	MCHBAR32(CLKXSSH2X2MD + 4) = row2[7];
}
/*
 * Program the clock mode registers for the selected memory clock and CAS
 * latency. MPLLCTL is left alone on the reset boot path.
 */
static void sdram_clkmode(struct sysinfo *s)
{
	/* Indexed by [memory clock][CAS - 3] */
	static const u32 cas_to_reg[2][4] = {
		{0x00000000, 0x00030100, 0x0C240201, 0x00000000}, /* DDR = 667 */
		{0x00000000, 0x00030100, 0x0C240201, 0x10450302} /* DDR = 800 */
	};
	u8 ddr_idx;
	u16 mpll_bits;

	MCHBAR16_AND(CSHRMISCCTL1, ~(1 << 8));
	MCHBAR8_AND(CSHRMISCCTL1, ~0x3f);

	if (s->selected_timings.mem_clock != MEM_CLOCK_667MHz) {
		ddr_idx = 1;
		mpll_bits = (1 << 8) | (1 << 5);
	} else {
		ddr_idx = 0;
		mpll_bits = 1;
	}

	if (s->boot_path != BOOT_PATH_RESET) {
		MCHBAR16_AND_OR(MPLLCTL, ~(0x033f), mpll_bits);
	}

	MCHBAR32(C0GNT2LNCH1) = 0x58001117;
	MCHBAR32_OR(C0STATRDCTRL, 1 << 23);

	MCHBAR32(C0GNT2LNCH2) = cas_to_reg[ddr_idx][s->selected_timings.CAS - 3];
}
/*
 * Program the channel 0 timing, refresh and read/write control registers from
 * s->selected_timings, s->dimms and s->dt0mode.
 *
 * The register writes below are performed in a fixed order; existing FIXME
 * notes mark accesses whose width or necessity is unclear.
 */
static void sdram_timings(struct sysinfo *s)
{
u8 i, j, ch, r, ta1, ta2, ta3, ta4, trp, bank, page, flag;
u8 reg8, wl;
u16 reg16;
u32 reg32, reg2;
/* Indexed by [flag][page]; only used when bank == 0 */
static const u8 pagetab[2][2] = {
{0x0e, 0x12},
{0x10, 0x14},
};
/* Only consider DDR2 */
/* Write latency is taken as CAS - 1 */
wl = s->selected_timings.CAS - 1;
ta1 = ta2 = 6;
ta3 = s->selected_timings.CAS;
ta4 = 8;
/* Round tRFC up to an even value */
s->selected_timings.tRFC = (s->selected_timings.tRFC + 1) & 0xfe;
trp = 0;
bank = 1;
page = 0;
MCHBAR8(C0LATCTRL) = ((wl - 3) << 4) | (s->selected_timings.CAS - 3);
/*
 * NOTE(review): for every populated rank only the first DIMM of the channel
 * (index ch << 1) is inspected, even for ranks that belong to the second
 * DIMM - confirm this is intended.
 */
FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
i = ch << 1;
if (s->dimms[i].banks == 1) {
trp = 1;
bank = 0;
}
if (s->dimms[i].page_size == 2048) {
page = 1;
}
}
PRINTK_DEBUG("trp=%d bank=%d page=%d\n",trp, bank, page);
/* flag selects the pagetab row: 0 for 667MHz, 1 otherwise */
if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
flag = 0;
} else {
flag = 1;
}
MCHBAR8_OR(C0PVCFG, 0x03);
MCHBAR16(C0CYCTRKPCHG) = ((wl + 4 + s->selected_timings.tWR) << 6) |
((2 + MAX(s->selected_timings.tRTP, 2)) << 2) | 1;
reg32 = (bank << 21) | (s->selected_timings.tRRD << 17) |
(s->selected_timings.tRP << 13) | ((s->selected_timings.tRP + trp) << 9) |
s->selected_timings.tRFC;
if (bank == 0) {
reg32 |= (pagetab[flag][page] << 22);
}
/* FIXME: Why not do a single dword write? */
MCHBAR16(C0CYCTRKACT) = (u16) (reg32);
MCHBAR16(C0CYCTRKACT + 2) = (u16) (reg32 >> 16);
/* FIXME: Only applies to DDR2 */
/* Copy bits 11:6 of the upper C0CYCTRKACT word into bits 12:7 of SHCYCTRKCKEL */
reg16 = (MCHBAR16(C0CYCTRKACT + 2) & 0x0fc0) >> 6;
MCHBAR16_AND_OR(SHCYCTRKCKEL, ~0x1f80, (reg16 << 7));
reg16 = (s->selected_timings.tRCD << 12) | (4 << 8) | (ta2 << 4) | ta4;
MCHBAR16(C0CYCTRKWR) = reg16;
reg32 = (s->selected_timings.tRCD << 17) | ((wl + 4 + s->selected_timings.tWTR) << 12) |
(ta3 << 8) | (4 << 4) | ta1;
MCHBAR32(C0CYCTRKRD) = reg32;
reg16 = ((s->selected_timings.tRP + trp) << 9) | s->selected_timings.tRFC;
/* FIXME: Why not do a single word write? */
MCHBAR8(C0CYCTRKREFR) = (u8) (reg16);
MCHBAR8(C0CYCTRKREFR + 1) = (u8) (reg16 >> 8);
MCHBAR16_AND_OR(C0CKECTRL, ~0x03fe, 100 << 1);
MCHBAR8_AND_OR(C0CYCTRKPCHG2, ~0x3f, s->selected_timings.tRAS);
MCHBAR16(C0ARBCTRL) = 0x2310;
MCHBAR8_AND_OR(C0ADDCSCTRL, ~0x1f, 1);
/* reg32 / reg2 hold per-clock constants for the memory and FSB clock respectively */
if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
reg32 = 3000;
} else {
reg32 = 2500;
}
if (s->selected_timings.fsb_clock == FSB_CLOCK_667MHz) {
reg2 = 6000;
} else {
reg2 = 5000;
}
/* (CAS + 7) scaled by the ratio of the two constants goes into bits 12:8 */
reg16 = (u16)((((s->selected_timings.CAS + 7) * (reg32)) / reg2) << 8);
MCHBAR16_AND_OR(C0STATRDCTRL, ~0x1f00, reg16);
/* flag is reused here: 1 when the write latency is above 2 */
flag = 0;
if (wl > 2) {
flag = 1;
}
reg16 = (u8) (wl - 1 - flag);
reg16 |= reg16 << 4;
reg16 |= flag << 8;
MCHBAR16_AND_OR(C0WRDATACTRL, ~0x01ff, reg16);
MCHBAR16(C0RDQCTRL) = 0x1585;
MCHBAR8_AND(C0PWLRCTRL, ~0x1f);
/* rdmodwr_window[5..0] = CL+4+5 265[13..8] (264[21..16]) */
MCHBAR16_AND_OR(C0PWLRCTRL, ~0x3f00, (s->selected_timings.CAS + 9) << 8);
/* Refresh-related constants per memory clock */
if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
reg16 = 0x0514;
reg32 = 0x0a28;
} else {
reg16 = 0x0618;
reg32 = 0x0c30;
}
MCHBAR32_AND_OR(C0REFRCTRL2, ~0x0fffff00, (0x3f << 22) | (reg32 << 8));
/* FIXME: Is this weird access necessary? Reference code does it */
MCHBAR8(C0REFRCTRL + 3) = 0;
MCHBAR16_AND_OR(C0REFCTRL, 0xc000, reg16);
/* NPUT Static Mode */
MCHBAR8_OR(C0DYNRDCTRL, 1);
MCHBAR32_AND_OR(C0STATRDCTRL, ~0x7f000000, 0xb << 25);
/* i and j are reused as the memory and FSB clock indices */
i = s->selected_timings.mem_clock;
j = s->selected_timings.fsb_clock;
if (i > j) {
MCHBAR32_OR(C0STATRDCTRL, 1 << 24);
}
MCHBAR8_AND(C0RDFIFOCTRL, ~0x3);
MCHBAR16_AND_OR(C0WRDATACTRL, ~0x7c00, (wl + 10) << 10);
MCHBAR32_AND_OR(C0CKECTRL, ~0x070e0000, (3 << 24) | (3 << 17));
reg16 = 0x15 << 6;
reg16 |= 0x1f;
reg16 |= (0x6 << 12);
MCHBAR16_AND_OR(C0REFRCTRL + 4, ~0x7fff, reg16);
reg32 = (0x6 << 27) | (1 << 25); /* FIXME: For DDR3, set BIT26 as well */
MCHBAR32_AND_OR(C0REFRCTRL2, ~0x30000000, reg32 << 8);
MCHBAR8_AND_OR(C0REFRCTRL + 3, ~0xfa, reg32 >> 24);
MCHBAR8_AND(C0JEDEC, ~(1 << 7));
MCHBAR8_AND(C0DYNRDCTRL, ~0x6);
/* Note: This is a 64-bit register, [34..30] = 0b00110 is split across two writes */
reg32 = ((6 & 3) << 30) | (4 << 25) | (1 << 20) | (8 << 15) | (6 << 10) | (4 << 5) | 1;
MCHBAR32(C0WRWMFLSH) = reg32;
MCHBAR16_AND_OR(C0WRWMFLSH + 4, ~0x1ff, (8 << 3) | (6 >> 2));
MCHBAR16_OR(SHPENDREG, 0x1c00 | (0x1f << 5));
/* FIXME: Why not do a single word write? */
MCHBAR8_AND_OR(SHPAGECTRL, ~0xff, 0x40);
MCHBAR8_AND_OR(SHPAGECTRL + 1, ~0x07, 0x05);
MCHBAR8_OR(SHCMPLWRCMD, 0x1f);
/* s->dt0mode (collected in sdram_read_spds()) lands in bit 4 */
reg8 = (3 << 6);
reg8 |= (s->dt0mode << 4);
reg8 |= 0x0c;
MCHBAR8_AND_OR(SHBONUSREG, ~0xdf, reg8);
MCHBAR8_AND(CSHRWRIOMLNS, ~0x02);
MCHBAR8_AND_OR(C0MISCTM, ~0x07, 0x02);
MCHBAR16_AND_OR(C0BYPCTRL, ~0x3fc, 4 << 2);
/* [31..29] = 0b010 for kN = 2 (2N) */
reg32 = (2 << 29) | (1 << 28) | (1 << 23);
MCHBAR32_AND_OR(WRWMCONFIG, ~0xffb00000, reg32);
/* Bits 16:13 of C0CYCTRKACT are copied into the high nibble of BYPACTSF */
reg8 = (u8) ((MCHBAR16(C0CYCTRKACT) & 0xe000) >> 13);
reg8 |= (u8) ((MCHBAR16(C0CYCTRKACT + 2) & 1) << 3);
MCHBAR8_AND_OR(BYPACTSF, ~0xf0, reg8 << 4);
/* Bits 19:17 of C0CYCTRKRD go into the low nibble of BYPACTSF */
reg8 = (u8) ((MCHBAR32(C0CYCTRKRD) & 0x000f0000) >> 17);
MCHBAR8_AND_OR(BYPACTSF, ~0x0f, reg8);
/* FIXME: Why not clear everything at once? */
MCHBAR8_AND(BYPKNRULE, ~0xfc);
MCHBAR8_AND(BYPKNRULE, ~0x03);
MCHBAR8_AND(SHBONUSREG, ~0x03);
MCHBAR8_OR(C0BYPCTRL, 1);
MCHBAR16_OR(CSHRMISCCTL1, 1 << 9);
for (i = 0; i < 8; i++) {
/* FIXME: Hardcoded for DDR2 SO-DIMMs */
MCHBAR32_AND_OR(C0DLLRCVCTLy(i), ~0x3f3f3f3f, 0x0c0c0c0c);
}
/* RDCS to RCVEN delay: Program coarse common to all bytelanes to default tCL + 1 */
MCHBAR32_AND_OR(C0STATRDCTRL, ~0x000f0000, (s->selected_timings.CAS + 1) << 16);
/* Program RCVEN delay with DLL-safe settings */
for (i = 0; i < 8; i++) {
MCHBAR8_AND(C0RXRCVyDLL(i), ~0x3f);
MCHBAR16_AND(C0RCVMISCCTL2, (u16) ~(3 << (i * 2)));
MCHBAR16_AND(C0RCVMISCCTL1, (u16) ~(3 << (i * 2)));
MCHBAR16_AND(C0COARSEDLY0, (u16) ~(3 << (i * 2)));
}
MCHBAR8_AND(C0DLLPIEN, ~1); /* Power up receiver */
MCHBAR8_OR(C0DLLPIEN, 2); /* Enable RCVEN DLL */
MCHBAR8_OR(C0DLLPIEN, 4); /* Enable receiver DQS DLL */
MCHBAR32_OR(C0COREBONUS, 0x000c0400);
MCHBAR32_OR(C0CMDTX1, 1 << 31);
}
/*
 * Program clkset0's register for Kcoarse, Tap, PI, DBEn and DBSel.
 *
 * Entry [f][i] of the pll tables supplies the values: clkdelay goes to
 * C0CKTX bits 15:14, dben to bit 10, dbsel to bit 6 and pi to the low six
 * bits of C0TXCK0DLL.
 */
static void sdram_p_clkset0(const struct pllparam *pll, u8 f, u8 i)
{
	const u16 cktx_bits = (pll->clkdelay[f][i] << 14) |
			      (pll->dben[f][i] << 10) |
			      (pll->dbsel[f][i] << 6);

	MCHBAR16_AND_OR(C0CKTX, ~0xc440, cktx_bits);
	MCHBAR8_AND_OR(C0TXCK0DLL, ~0x3f, pll->pi[f][i]);
}
/*
 * Program clkset1's register for Kcoarse, Tap, PI, DBEn and DBSel.
 *
 * Entry [f][i] of the pll tables supplies the values: dben goes to C0CKTX
 * bit 11, dbsel to bit 7 and pi to the low six bits of C0TXCK1DLL. The
 * clkdelay value is shifted to bit 16, which lies outside the 16-bit access
 * used here (see the FIXME).
 */
static void sdram_p_clkset1(const struct pllparam *pll, u8 f, u8 i)
{
	/* FIXME: This is actually a dword write! */
	MCHBAR16_AND_OR(C0CKTX, ~0x00030880,
			(pll->clkdelay[f][i] << 16) |
			(pll->dben[f][i] << 11) |
			(pll->dbsel[f][i] << 7));

	MCHBAR8_AND_OR(C0TXCK1DLL, ~0x3f, pll->pi[f][i]);
}
/*
 * Program CMD0 and CMD1 registers for Kcoarse, Tap, PI, DBEn and DBSel,
 * using entry [f][i] of the pll tables. Both command DLL registers receive
 * the same PI value.
 */
static void sdram_p_cmd(const struct pllparam *pll, u8 f, u8 i)
{
	u8 val;

	/* Clock Group Index 3 */
	val = (pll->dben[f][i] << 6) | (pll->dbsel[f][i] << 5);
	MCHBAR8_AND_OR(C0CMDTX1, ~0x60, val);

	val = pll->clkdelay[f][i] << 4;
	MCHBAR8_AND_OR(C0CMDTX2, ~0x30, val);

	val = pll->pi[f][i];
	MCHBAR8_AND_OR(C0TXCMD0DLL, ~0x3f, val);
	MCHBAR8_AND_OR(C0TXCMD1DLL, ~0x3f, val);
}
/*
 * Program CTRL registers for Kcoarse, Tap, PI, DBEn and DBSel, using entry
 * [f][i] of the pll tables. CTRL0/CTRL1 live in C0CTLTX2, CTRL2/CTRL3 in
 * C0CMDTX2; all four control DLL registers receive the same PI value.
 */
static void sdram_p_ctrl(const struct pllparam *pll, u8 f, u8 i)
{
	const u32 dbsel = (u32) pll->dbsel[f][i];
	const u32 dben = (u32) pll->dben[f][i];
	const u32 kcoarse = (u32) pll->clkdelay[f][i];
	const u8 pi = pll->pi[f][i];
	u32 bits;

	/* CTRL0 and CTRL1 */
	bits = (dbsel << 20) | (dben << 21) | (dbsel << 22) | (dben << 23) |
	       (kcoarse << 24) | (kcoarse << 27);
	MCHBAR32_AND_OR(C0CTLTX2, ~0x01bf0000, bits);
	MCHBAR8_AND_OR(C0TXCTL0DLL, ~0x3f, pi);
	MCHBAR8_AND_OR(C0TXCTL1DLL, ~0x3f, pi);

	/* CTRL2 and CTRL3 */
	bits = (dbsel << 12) | (dben << 13) | (dbsel << 8) | (dben << 9) |
	       (kcoarse << 14) | (kcoarse << 10);
	MCHBAR32_AND_OR(C0CMDTX2, ~0xff00, bits);
	MCHBAR8_AND_OR(C0TXCTL2DLL, ~0x3f, pi);
	MCHBAR8_AND_OR(C0TXCTL3DLL, ~0x3f, pi);
}
/*
 * Program the DQS settings for pll table entry "clk" (callers pass 40..71).
 *
 * The entry index relative to 40 is split into a rank (index % 4) and a DQS
 * group (index / 4), which select the register and the bit position.
 */
static void sdram_p_dqs(struct pllparam *pll, u8 f, u8 clk)
{
	const u8 j = clk - 40;
	const u8 rank = j % 4;
	const u8 dqs = j / 4;
	const u8 pi = pll->pi[f][clk];
	u32 reg32;

	reg32 = (((u32) pll->dben[f][clk]) << (dqs + 9)) |
		(((u32) pll->dbsel[f][clk]) << dqs);

	/* FIXME: Somehow, touching this changes the binary... */
	MCHBAR32(C0DQSRyTX1(rank)) = (MCHBAR32(0x5b4 + (rank * 4))
		& ~((1 << (dqs + 9)) | (1 << dqs))) | reg32;

	/* Two-bit coarse delay field per DQS group, starting at bit 16 */
	reg32 = ((u32) pll->clkdelay[f][clk]) << ((dqs * 2) + 16);
	MCHBAR32_AND_OR(C0DQSDQRyTX3(rank), ~((1 << (dqs * 2 + 17)) | (1 << (dqs * 2 + 16))),
			reg32);

	MCHBAR8_AND_OR(C0TXDQS0R0DLL + j, ~0x3f, pi);
}
/*
 * Program the DQ settings for pll table entry "clk" (callers pass 8..39).
 *
 * The entry index relative to 8 is split into a rank (index % 4) and a DQ
 * group (index / 4), which select the register and the bit position.
 */
static void sdram_p_dq(struct pllparam *pll, u8 f, u8 clk)
{
	const u8 j = clk - 8;
	const u8 rank = j % 4;
	const u8 dq = j / 4;
	const u8 pi = pll->pi[f][clk];
	u32 reg32;

	reg32 = (((u32) pll->dben[f][clk]) << (dq + 9)) |
		(((u32) pll->dbsel[f][clk]) << dq);

	/* FIXME: Somehow, touching this changes the binary... */
	MCHBAR32(C0DQRyTX1(rank)) = (MCHBAR32(0x5a4 + rank * 4)
		& ~((1 << (dq + 9)) | (1 << dq))) | reg32;

	/* Two-bit coarse delay field per DQ group, starting at bit 0 */
	reg32 = ((u32) pll->clkdelay[f][clk]) << (dq*2);
	MCHBAR32_AND_OR(C0DQSDQRyTX3(rank), ~((1 << (dq * 2 + 1)) | (1 << (dq * 2))), reg32);

	MCHBAR8_AND_OR(C0TXDQ0R0DLL + j, ~0x3f, pi);
}
/*
 * WDLL programming: Perform HPLL/MPLL calibration after write levelization.
 *
 * Builds the per-clock PLL parameter tables (72 entries per memory clock),
 * adds "pidelay" to every PI value of the selected clock and programs the
 * clock, command, control, DQS and DQ settings from them.
 *
 * Table layout as used below: entry 0 = clkset0, 1 = clkset1, 2 = cmd,
 * 4 = ctrl, 8..39 = DQ, 40..71 = DQS.
 */
static void sdram_calibratepll(struct sysinfo *s, u8 pidelay)
{
	struct pllparam pll = {
		.pi = {
		{ /* DDR = 667 */
			3, 3, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7,
			7, 7, 7, 7, 4, 4, 4, 4, 4, 4, 4, 4,
			4, 4, 4, 4, 4, 4, 4, 4, 5, 5, 5, 5,
			7, 7, 7, 7, 3, 3, 3, 3, 3, 3, 3, 3,
			0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			0, 0, 0, 0, 1, 1, 1, 1, 3, 3, 3, 3,
		},
		{ /* DDR = 800 */
			53, 53, 10, 10, 5, 5, 5, 5, 27, 27, 27, 27,
			34, 34, 34, 34, 34, 34, 34, 34, 39, 39, 39, 39,
			47, 47, 47, 47, 44, 44, 44, 44, 47, 47, 47, 47,
			47, 47, 47, 47, 59, 59, 59, 59, 2, 2, 2, 2,
			2, 2, 2, 2, 7, 7, 7, 7, 15, 15, 15, 15,
			12, 12, 12, 12, 15, 15, 15, 15, 15, 15, 15, 15,
		}},
		.dben = {
		{ /* DDR = 667 */
			0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
			1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0,
			0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0,
			0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
		},
		{ /* DDR = 800 */
			1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0,
			0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1,
			1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0,
			1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0,
		}},
		.dbsel = {
		{ /* DDR = 667 */
			0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
			1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0,
			0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0,
			0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
		},
		{ /* DDR = 800 */
			0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0,
			0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1,
			1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0,
			1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0,
		}},
		.clkdelay = {
		{ /* DDR = 667 */
			0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1,
			1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
			1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
			1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0,
			0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
		},
		{ /* DDR = 800 */
			0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1,
			1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
			1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
			1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1,
			1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
			1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
		}}
	};
	/* Table row: 0 for 667MHz, 1 for anything else */
	const u8 f = (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) ? 0 : 1;
	u8 clk;

	/* Apply the caller's PI offset to every entry of the selected row */
	for (clk = 0; clk < 72; clk++) {
		pll.pi[f][clk] += pidelay;
	}

	/* Disable Dynamic DQS Slave Setting Per Rank */
	MCHBAR8_AND(CSHRDQSCMN, ~(1 << 7));
	MCHBAR16_AND_OR(CSHRPDCTL4, ~0x3fff, 0x1fff);

	sdram_p_clkset0(&pll, f, 0);
	sdram_p_clkset1(&pll, f, 1);
	sdram_p_cmd(&pll, f, 2);
	sdram_p_ctrl(&pll, f, 4);

	for (clk = 40; clk < 72; clk++) {
		sdram_p_dqs(&pll, f, clk);
	}

	for (clk = 8; clk < 40; clk++) {
		sdram_p_dq(&pll, f, clk);
	}
}
/*
 * Perform HMC hardware calibration.
 *
 * Starts the calibration through CSHRPDCTL, waits for bit 2 of that register
 * to read back as set, and records the outcome in s->async: 0 on success,
 * 1 when bit 3 is still set afterwards.
 */
static void sdram_calibratehwpll(struct sysinfo *s)
{
	s->async = 0;

	MCHBAR16_OR(CSHRPDCTL, 1 << 15);
	MCHBAR8_AND(CSHRPDCTL, ~(1 << 7));
	MCHBAR8_OR(CSHRPDCTL, 1 << 3);
	MCHBAR8_OR(CSHRPDCTL, 1 << 2);

	/* Start hardware HMC calibration */
	MCHBAR8_OR(CSHRPDCTL, 1 << 7);

	/* Busy-wait until calibration is done */
	while (!(MCHBAR8(CSHRPDCTL) & (1 << 2)))
		;

	/* If hardware HMC calibration failed */
	if (MCHBAR8(CSHRPDCTL) & (1 << 3))
		s->async = 1;
}
/*
 * Configure the master and slave DLLs, initialise the transmit FIFO and mark
 * the unpopulated ranks of channel 0 in C0CTLTX2.
 *
 * Uses s->selected_timings.mem_clock and s->nodll. Hardware HMC calibration
 * (sdram_calibratehwpll()) is only run when s->nodll is zero.
 */
static void sdram_dlltiming(struct sysinfo *s)
{
	/* CSHRMSTRCTL0 bits of the Master DLLs, in the order they must be toggled */
	static const u8 mdll_bits[] = { 0, 2, 4, 8, 10, 12, 14 };
	const u8 clock_groups = 0; /* Switch all clocks on anyway */
	u8 n, bit, rank;
	u16 unpopulated = 0;
	u32 mstrctl1;

	/* Configure the Master DLL */
	mstrctl1 = (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) ? 0x08014227
								       : 0x00014221;
	MCHBAR32_AND_OR(CSHRMSTRCTL1, ~0x0fffffff, mstrctl1);
	MCHBAR32_OR(CSHRMSTRCTL1, 1 << 23);
	MCHBAR32_OR(CSHRMSTRCTL1, 1 << 15);
	MCHBAR32_AND(CSHRMSTRCTL1, ~(1 << 15));

	/*
	 * Disable the Master DLLs by setting their bits, or enable them by
	 * clearing their bits, IN ORDER!
	 */
	for (n = 0; n < sizeof(mdll_bits) / sizeof(mdll_bits[0]); n++) {
		if (s->nodll) {
			MCHBAR16_OR(CSHRMSTRCTL0, 1 << mdll_bits[n]);
		} else {
			MCHBAR16_AND(CSHRMSTRCTL0, ~(1 << mdll_bits[n]));
		}
	}

	/* Initialize the Transmit DLL PI values in the following sequence. */
	if (s->nodll) {
		MCHBAR8_AND_OR(CREFPI, ~0x3f, 0x07);
	} else {
		MCHBAR8_AND(CREFPI, ~0x3f);
	}

	sdram_calibratepll(s, 0); // XXX check

	/* Enable all modular Slave DLL */
	MCHBAR16_OR(C0DLLPIEN, 1 << 11);
	MCHBAR16_OR(C0DLLPIEN, 1 << 12);
	/* Then bits 10 down to 3, one write per bit */
	for (bit = 10; bit >= 3; bit--) {
		MCHBAR16_OR(C0DLLPIEN, 1 << bit);
	}

	/* Enable DQ/DQS output */
	MCHBAR8_OR(C0SLVDLLOUTEN, 1);
	MCHBAR16(CSPDSLVWT) = 0x5005;
	MCHBAR16_AND_OR(CSHRPDCTL2, ~0x1f1f, 0x051a);
	MCHBAR16_AND_OR(CSHRPDCTL5, ~0xbf3f, 0x9010);

	if (s->nodll) {
		MCHBAR8_AND_OR(CSHRPDCTL3, ~0x7f, 0x6b);
	} else {
		MCHBAR8_AND_OR(CSHRPDCTL3, ~0x7f, 0x55);
		sdram_calibratehwpll(s);
	}

	/* Disable Dynamic Diff Amp */
	MCHBAR32_AND(C0STATRDCTRL, ~(1 << 22));

	/* Now, start initializing the transmit FIFO */
	MCHBAR8_AND(C0MISCCTL, ~0x02);

	/* Disable (gate) mdclk and mdclkb */
	MCHBAR8_OR(CSHWRIOBONUS, 0xc0);

	/* Select mdmclk */
	MCHBAR8_AND(CSHWRIOBONUS, ~(1 << 5));

	/* Ungate mdclk */
	MCHBAR8_AND_OR(CSHWRIOBONUS, ~0xc0, 1 << 6);
	MCHBAR8_AND_OR(CSHRFIFOCTL, ~0x3f, 0x1a);

	/* Enable the write pointer count */
	MCHBAR8_OR(CSHRFIFOCTL, 1);

	/* Set the DDR3 Reset Enable bit */
	MCHBAR8_OR(CSHRDDR3CTL, 1);

	/* Configure DQS-DQ Transmit */
	MCHBAR32(CSHRDQSTXPGM) = 0x00551803;

	/* Enable clock groups depending on rank population */
	MCHBAR32_AND_OR(C0CKTX, ~0x3f000000, clock_groups << 24);

	/* Enable DDR command output buffers from core */
	MCHBAR8_AND(0x594, ~1);

	/* Each unpopulated rank r of channel 0 sets bits r, r + 4 and r + 8 */
	for (rank = 0; rank < 4; rank++) {
		if (!rank_is_populated(s->dimms, 0, rank)) {
			unpopulated |= (1 << (8 + rank)) | (1 << (4 + rank)) | (1 << rank);
		}
	}
	MCHBAR16_OR(C0CTLTX2, unpopulated);
}
/* Define a shorter name for these to make the lines fit in 96 characters */
#define TABLE static const
/*
 * Loop over each RCOMP group, but skip group 1 because it does not exist.
 * Expands to a "for" followed by a bare "if", so the statement or block that
 * follows becomes the loop body; do not attach an "else" to it.
 */
#define FOR_EACH_RCOMP_GROUP(idx) for (idx = 0; idx < 7; idx++) if (idx != 1)
/*
 * Define accessors for the RCOMP register banks.
 * Each one adds a fixed offset to rcompctl[x], so an array named rcompctl
 * holding the per-group base registers must be in scope where they are used.
 */
#define C0RCOMPCTRLx(x) (rcompctl[(x)] + 0x00)
#define C0RCOMPMULTx(x) (rcompctl[(x)] + 0x04)
#define C0RCOMPOVRx(x) (rcompctl[(x)] + 0x06)
#define C0RCOMPOSVx(x) (rcompctl[(x)] + 0x0A)
#define C0SCOMPVREFx(x) (rcompctl[(x)] + 0x0E)
#define C0SCOMPOVRx(x) (rcompctl[(x)] + 0x10)
#define C0SCOMPOFFx(x) (rcompctl[(x)] + 0x12)
#define C0DCOMPx(x) (rcompctl[(x)] + 0x14)
#define C0SLEWBASEx(x) (rcompctl[(x)] + 0x16)
#define C0SLEWPULUTx(x) (rcompctl[(x)] + 0x18)
#define C0SLEWPDLUTx(x) (rcompctl[(x)] + 0x1C)
#define C0DCOMPOVRx(x) (rcompctl[(x)] + 0x20)
#define C0DCOMPOFFx(x) (rcompctl[(x)] + 0x24)
/* FIXME: This only applies to DDR2 */
/*
 * Program the RCOMP (compensation) registers of channel 0.
 *
 * The function first loads every existing RCOMP group with values from the
 * static tables below, clears the slew/offset fields, programs the global
 * compensation control registers and then, unless bit 30 of COMPCTRL1 is set,
 * starts a compensation cycle, waits for it to complete and derives the slew
 * base and slew look-up table entries from the result read from XCOMP.
 *
 * s: system information; only selected_timings.mem_clock,
 *    selected_timings.fsb_clock and dimm_config[0] are read here.
 */
static void sdram_rcomp(struct sysinfo *s)
{
u8 i, j, reg8, rcompp, rcompn, srup, srun;
u16 reg16;
u32 reg32, rcomp1, rcomp2;
static const u8 rcompslew = 0x0a;
/* Base address of each RCOMP group, used by the C0...x(x) accessor macros */
static const u16 rcompctl[7] = {
C0RCOMPCTRL0,
0, /* This register does not exist */
C0RCOMPCTRL2,
C0RCOMPCTRL3,
C0RCOMPCTRL4,
C0RCOMPCTRL5,
C0RCOMPCTRL6,
};
/* RCOMP settings tables = { NC-NC, x16SS, x16DS, x16SS2, x16DS2, x8DS, x8DS2}; */
/*
 * NOTE(review): rcompupdate, rcompstr, rcompscomp, rcompdelay and rcompf are
 * indexed by the RCOMP group number below, whereas rcompstr2, rcompscomp2 and
 * rcompdelay2 are indexed by s->dimm_config[0]. The header comment above
 * presumably describes only the latter; confirm.
 */
TABLE u8 rcompupdate[7] = { 0, 0, 0, 1, 1, 0, 0};
TABLE u8 rcompstr[7] = { 0x66, 0x00, 0xaa, 0x55, 0x55, 0x77, 0x77};
TABLE u16 rcompscomp[7] = {0xa22a, 0x0000, 0xe22e, 0xe22e, 0xe22e, 0xa22a, 0xa22a};
TABLE u8 rcompdelay[7] = { 1, 0, 0, 0, 0, 1, 1};
TABLE u16 rcompf[7] = {0x1114, 0x0000, 0x0505, 0x0909, 0x0909, 0x0a0a, 0x0a0a};
TABLE u8 rcompstr2[7] = { 0x00, 0x55, 0x55, 0xaa, 0xaa, 0x55, 0xaa};
TABLE u16 rcompscomp2[7] = {0x0000, 0xe22e, 0xe22e, 0xe22e, 0x8228, 0xe22e, 0x8228};
TABLE u8 rcompdelay2[7] = { 0, 0, 0, 0, 2, 0, 2};
/*
 * Slew look-up table: 64 rows selected by a value derived from the measured
 * compensation code, 12 columns. Even columns are used for the pull-up LUT
 * registers and odd columns for the pull-down LUT registers further below.
 */
TABLE u8 rcomplut[64][12] = {
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{10, 9, 12, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{10, 9, 12, 11, 2, 2, 6, 5, 7, 6, 6, 5},
{10, 10, 12, 12, 2, 2, 6, 5, 7, 6, 6, 5},
{10, 10, 12, 12, 2, 2, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 2, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 2, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 2, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 3, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 3, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 3, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 3, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 3, 6, 6, 7, 7, 6, 6},
{11, 10, 12, 12, 3, 3, 6, 6, 7, 7, 6, 6},
{11, 10, 14, 13, 3, 3, 6, 6, 7, 7, 6, 6},
{12, 10, 14, 13, 3, 3, 6, 6, 7, 7, 6, 6},
{12, 12, 14, 13, 3, 3, 7, 6, 7, 7, 7, 6},
{13, 12, 16, 15, 3, 3, 7, 6, 8, 7, 7, 6},
{13, 14, 16, 15, 4, 3, 7, 7, 8, 8, 7, 7},
{14, 14, 16, 17, 4, 3, 7, 7, 8, 8, 7, 7},
{14, 16, 18, 17, 4, 4, 8, 7, 8, 8, 8, 7},
{15, 16, 18, 19, 4, 4, 8, 7, 9, 8, 8, 7},
{15, 18, 18, 19, 4, 4, 8, 8, 9, 9, 8, 8},
{16, 18, 20, 21, 4, 4, 8, 8, 9, 9, 8, 8},
{16, 19, 20, 21, 5, 4, 9, 8, 10, 9, 9, 8},
{16, 19, 20, 23, 5, 5, 9, 9, 10, 10, 9, 9},
{17, 19, 22, 23, 5, 5, 9, 9, 10, 10, 9, 9},
{17, 20, 22, 25, 5, 5, 9, 9, 10, 10, 9, 9},
{17, 20, 22, 25, 5, 5, 9, 9, 10, 10, 9, 9},
{18, 20, 22, 25, 5, 5, 9, 9, 10, 10, 9, 9},
{18, 21, 24, 25, 5, 5, 9, 9, 11, 10, 9, 9},
{19, 21, 24, 27, 5, 5, 9, 9, 11, 11, 9, 9},
{19, 22, 24, 27, 5, 5, 10, 9, 11, 11, 10, 9},
{20, 22, 24, 27, 6, 5, 10, 10, 11, 11, 10, 10},
{20, 23, 26, 27, 6, 6, 10, 10, 12, 12, 10, 10},
{20, 23, 26, 29, 6, 6, 10, 10, 12, 12, 10, 10},
{21, 24, 26, 29, 6, 6, 10, 10, 12, 12, 10, 10},
{21, 24, 26, 29, 6, 6, 11, 10, 12, 13, 11, 10},
{22, 25, 28, 29, 6, 6, 11, 11, 13, 13, 11, 11},
{22, 25, 28, 31, 6, 6, 11, 11, 13, 13, 11, 11},
{22, 26, 28, 31, 6, 6, 11, 11, 13, 14, 11, 11},
{23, 26, 30, 31, 7, 6, 12, 11, 14, 14, 12, 11},
{23, 27, 30, 33, 7, 7, 12, 12, 14, 14, 12, 12},
{23, 27, 30, 33, 7, 7, 12, 12, 14, 15, 12, 12},
{24, 28, 32, 33, 7, 7, 12, 12, 15, 15, 12, 12},
{24, 28, 32, 33, 7, 7, 12, 12, 15, 16, 12, 12},
{24, 29, 32, 35, 7, 7, 12, 12, 15, 16, 12, 12},
{25, 29, 32, 35, 7, 7, 12, 12, 15, 17, 12, 12},
{25, 30, 32, 35, 7, 7, 12, 12, 15, 17, 12, 12},
{25, 30, 32, 35, 7, 7, 12, 12, 15, 17, 12, 12},
};
srup = 0;
srun = 0;
/* Values written later to OFREQDELSEL (rcomp1) and COMPCTRL2 (rcomp2) */
if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
rcomp1 = 0x00050431;
} else {
rcomp1 = 0x00050542;
}
if (s->selected_timings.fsb_clock == FSB_CLOCK_667MHz) {
rcomp2 = 0x14C42827;
} else {
rcomp2 = 0x19042827;
}
/* Pass 1: load the per-group table values and clear the slew base/LUT fields */
FOR_EACH_RCOMP_GROUP(i) {
reg8 = rcompupdate[i];
MCHBAR8_AND_OR(C0RCOMPCTRLx(i), ~1, reg8);
MCHBAR8_AND(C0RCOMPCTRLx(i), ~2);
reg16 = rcompslew;
MCHBAR16_AND_OR(C0RCOMPCTRLx(i), ~0xf000, reg16 << 12);
MCHBAR8(C0RCOMPMULTx(i)) = rcompstr[i];
MCHBAR16(C0SCOMPVREFx(i)) = rcompscomp[i];
MCHBAR8_AND_OR(C0DCOMPx(i), ~0x03, rcompdelay[i]);
if (i == 2) {
/* Group 2 is overridden with values that depend on the DIMM configuration */
/* FIXME: Why are we rewriting this? */
MCHBAR16_AND_OR(C0RCOMPCTRLx(i), ~0xf000, reg16 << 12);
MCHBAR8(C0RCOMPMULTx(i)) = rcompstr2[s->dimm_config[0]];
MCHBAR16(C0SCOMPVREFx(i)) = rcompscomp2[s->dimm_config[0]];
MCHBAR8_AND_OR(C0DCOMPx(i), ~0x03, rcompdelay2[s->dimm_config[0]]);
}
MCHBAR16_AND(C0SLEWBASEx(i), ~0x7f7f);
/* FIXME: Why not do a single dword write? */
MCHBAR16_AND(C0SLEWPULUTx(i), ~0x3f3f);
MCHBAR16_AND(C0SLEWPULUTx(i) + 2, ~0x3f3f);
/* FIXME: Why not do a single dword write? */
MCHBAR16_AND(C0SLEWPDLUTx(i), ~0x3f3f);
MCHBAR16_AND(C0SLEWPDLUTx(i) + 2, ~0x3f3f);
}
/* FIXME: Hardcoded */
MCHBAR8_AND_OR(C0ODTRECORDX, ~0x3f, 0x36);
MCHBAR8_AND_OR(C0DQSODTRECORDX, ~0x3f, 0x36);
/* Pass 2: clear control bits and the offset fields of every group */
FOR_EACH_RCOMP_GROUP(i) {
MCHBAR8_AND(C0RCOMPCTRLx(i), ~0x60);
MCHBAR16_AND(C0RCOMPCTRLx(i) + 2, ~0x0706);
MCHBAR16_AND(C0RCOMPOSVx(i), ~0x7f7f);
MCHBAR16_AND(C0SCOMPOFFx(i), ~0x3f3f);
MCHBAR16_AND(C0DCOMPOFFx(i), ~0x1f1f);
MCHBAR8_AND(C0DCOMPOFFx(i) + 2, ~0x1f);
}
MCHBAR16_AND(C0ODTRECORDX, ~0xffc0);
MCHBAR16_AND(C0ODTRECORDX + 2, ~0x000f);
/* FIXME: Why not do a single dword write? */
MCHBAR16_AND(C0DQSODTRECORDX, ~0xffc0);
MCHBAR16_AND(C0DQSODTRECORDX + 2, ~0x000f);
/* Pass 3: program the per-group override values */
FOR_EACH_RCOMP_GROUP(i) {
MCHBAR16(C0SCOMPOVRx(i)) = rcompf[i];
/* FIXME: Why not do a single dword write? */
MCHBAR16(C0DCOMPOVRx(i)) = 0x1219;
MCHBAR16(C0DCOMPOVRx(i) + 2) = 0x000C;
}
MCHBAR32_AND_OR(DCMEASBUFOVR, ~0x001f1f1f, 0x000c1219);
/* FIXME: Why not do a single word write? */
MCHBAR16_AND_OR(XCOMPSDR0BNS, ~0x1f00, 0x1200);
MCHBAR8_AND_OR(XCOMPSDR0BNS, ~0x1f, 0x12);
MCHBAR32(COMPCTRL3) = 0x007C9007;
MCHBAR32(OFREQDELSEL) = rcomp1;
MCHBAR16(XCOMPCMNBNS) = 0x1f7f;
MCHBAR32(COMPCTRL2) = rcomp2;
MCHBAR16_AND_OR(XCOMPDFCTRL, ~0x0f, 1);
MCHBAR16(ZQCALCTRL) = 0x0134;
MCHBAR32(COMPCTRL1) = 0x4C293600;
/* FIXME: wtf did these MRC guys smoke */
MCHBAR8_AND_OR(COMPCTRL1 + 3, ~0x44, (1 << 6) | (1 << 2));
MCHBAR16_AND(XCOMPSDR0BNS, ~(1 << 13));
MCHBAR8_AND(XCOMPSDR0BNS, ~(1 << 5));
FOR_EACH_RCOMP_GROUP(i) {
/* Note: the byte at offset +0 is read, masked and written to offset +2 */
/* FIXME: This should be an _AND_OR */
MCHBAR8(C0RCOMPCTRLx(i) + 2) = MCHBAR8(C0RCOMPCTRLx(i)) & ~0x71;
}
if ((MCHBAR32(COMPCTRL1) & (1 << 30)) == 0) {
/* Start COMP */
MCHBAR8_OR(COMPCTRL1, 1);
/* Wait until COMP is done */
while ((MCHBAR8(COMPCTRL1) & 1) != 0)
;
/* rcompp is XCOMP bits 30:24, rcompn is XCOMP bits 22:16 (7 bits each) */
reg32 = MCHBAR32(XCOMP);
rcompp = (u8) ((reg32 & ~(1 << 31)) >> 24);
rcompn = (u8) ((reg32 & ~(0xff800000)) >> 16);
FOR_EACH_RCOMP_GROUP(i) {
/* Two-bit fields read back from the second byte of the group's control register */
srup = (MCHBAR8(C0RCOMPCTRLx(i) + 1) & 0xc0) >> 6;
srun = (MCHBAR8(C0RCOMPCTRLx(i) + 1) & 0x30) >> 4;
/* FIXME: Why not do a single word write? */
reg16 = (u16)(rcompp - (1 << (srup + 1))) << 8;
MCHBAR16_AND_OR(C0SLEWBASEx(i), ~0x7f00, reg16);
reg16 = (u16)(rcompn - (1 << (srun + 1)));
MCHBAR8_AND_OR(C0SLEWBASEx(i), ~0x7f, (u8)reg16);
}
/*
 * From here on srup and srun hold the values read for group 6, the last
 * group visited by the loop above.
 * NOTE(review): j starts at rcompp - (1 << (srup + 1)) and advances in steps
 * of (1 << srup); it is never range-checked against the 64 rows of rcomplut,
 * and the u8 subtraction can wrap. Confirm the hardware guarantees values
 * that keep j within 0..63.
 */
reg8 = rcompp - (1 << (srup + 1));
for (i = 0, j = reg8; i < 4; i++, j += (1 << srup)) {
MCHBAR8_AND_OR(C0SLEWPULUTx(0) + i, ~0x3f, rcomplut[j][0]);
}
for (i = 0, j = reg8; i < 4; i++, j += (1 << srup)) {
/* Group 2 is only updated for DIMM configurations 0, 1, 2 and 5 */
if (s->dimm_config[0] < 3 || s->dimm_config[0] == 5) {
MCHBAR8_AND_OR(C0SLEWPULUTx(2) + i, ~0x3f, rcomplut[j][10]);
}
}
for (i = 0, j = reg8; i < 4; i++, j += (1 << srup)) {
MCHBAR8_AND_OR(C0SLEWPULUTx(3) + i, ~0x3f, rcomplut[j][6]);
MCHBAR8_AND_OR(C0SLEWPULUTx(4) + i, ~0x3f, rcomplut[j][6]);
}
for (i = 0, j = reg8; i < 4; i++, j += (1 << srup)) {
MCHBAR8_AND_OR(C0SLEWPULUTx(5) + i, ~0x3f, rcomplut[j][8]);
MCHBAR8_AND_OR(C0SLEWPULUTx(6) + i, ~0x3f, rcomplut[j][8]);
}
/* Same procedure for the pull-down LUTs, using rcompn/srun and the odd columns */
reg8 = rcompn - (1 << (srun + 1));
for (i = 0, j = reg8; i < 4; i++, j += (1 << srun)) {
MCHBAR8_AND_OR(C0SLEWPDLUTx(0) + i, ~0x3f, rcomplut[j][1]);
}
for (i = 0, j = reg8; i < 4; i++, j += (1 << srun)) {
if (s->dimm_config[0] < 3 || s->dimm_config[0] == 5) {
MCHBAR8_AND_OR(C0SLEWPDLUTx(2) + i, ~0x3f, rcomplut[j][11]);
}
}
for (i = 0, j = reg8; i < 4; i++, j += (1 << srun)) {
MCHBAR8_AND_OR(C0SLEWPDLUTx(3) + i, ~0x3f, rcomplut[j][7]);
MCHBAR8_AND_OR(C0SLEWPDLUTx(4) + i, ~0x3f, rcomplut[j][7]);
}
for (i = 0, j = reg8; i < 4; i++, j += (1 << srun)) {
MCHBAR8_AND_OR(C0SLEWPDLUTx(5) + i, ~0x3f, rcomplut[j][9]);
MCHBAR8_AND_OR(C0SLEWPDLUTx(6) + i, ~0x3f, rcomplut[j][9]);
}
}
/* Set bit 0 of COMPCTRL1 again; this time the function does not wait for it to clear */
MCHBAR8_OR(COMPCTRL1, 1);
}
/*
 * Program the ODT matrix (C0ODT) and ODT rank control (C0ODTRKCTRL) registers
 * according to the number of ranks found on DIMM 0 and DIMM 1.
 *
 * FIXME: The ODT tables are for DDR2 only!
 */
static void sdram_odt(struct sysinfo *s)
{
	/* Column legend for both value tables (NV = not a valid combination):
	   NC_NC, 1R_NC, NV, 2R_NC, NC_1R, 1R_1R, NV, 2R_1R,
	   NV,    NV,    NV, NV,    NC_2R, 1R_2R, NV, 2R_2R */
	static const u16 odt_rankctrl[16] = {
		0x0000, 0x0000, 0x0000, 0x0000, 0x0044, 0x1111, 0x0000, 0x1111,
		0x0000, 0x0000, 0x0000, 0x0000, 0x0044, 0x1111, 0x0000, 0x1111,
	};
	static const u16 odt_matrix[16] = {
		0x0000, 0x0011, 0x0000, 0x0011, 0x0000, 0x4444, 0x0000, 0x4444,
		0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x4444, 0x0000, 0x4444,
	};
	/* Index into the tables above for [ranks on DIMM 0][ranks on DIMM 1] */
	static const u8 index_by_ranks[3][3] = {
		{ 0, 4, 12 },
		{ 1, 5, 13 },
		{ 3, 7, 15 },
	};
	const unsigned int ranks0 = s->dimms[0].ranks;
	const unsigned int ranks1 = s->dimms[1].ranks;
	u8 rankindex = 0;

	/* Any rank count other than 0, 1 or 2 keeps the NC_NC entry (index 0) */
	if (ranks0 < 3 && ranks1 < 3)
		rankindex = index_by_ranks[ranks0][ranks1];

	/* ODT matrix first, then ODT rank control */
	MCHBAR16(C0ODT) = odt_matrix[rankindex];
	MCHBAR16(C0ODTRKCTRL) = odt_rankctrl[rankindex];
}
static void sdram_mmap(struct sysinfo *s)
{
TABLE u32 w260[7] = {0, 0x400001, 0xc00001, 0x500000, 0xf00000, 0xc00001, 0xf00000};
TABLE u32 w208[7] = {0, 0x10000, 0x1010000, 0x10001, 0x1010101, 0x1010000, 0x1010101};
TABLE u32 w200[7] = {0, 0, 0, 0x20002, 0x40002, 0, 0x40002};
TABLE u32 w204[7] = {0, 0x20002, 0x40002, 0x40004, 0x80006, 0x40002, 0x80006};
TABLE u16 tolud[7] = {2048, 2048, 4096, 4096, 8192, 4096, 8192};
TABLE u16 tom[7] = { 2, 2, 4, 4, 8, 4, 8};
TABLE u16 touud[7] = { 128, 128, 256, 256, 512, 256, 512};
TABLE u32 gbsm[7] = {1 << 27, 1 << 27, 1 << 28, 1 << 27, 1 << 29, 1 << 28, 1 << 29};
TABLE u32 bgsm[7] = {1 << 27, 1 << 27, 1 << 28, 1 << 27, 1 << 29, 1 << 28, 1 << 29};
TABLE u32 tsegmb[7] = {1 << 27, 1 << 27, 1 << 28, 1 << 27, 1 << 29, 1 << 28, 1 << 29};
if ((s->dimm_config[0] < 3) && rank_is_populated(s->dimms, 0, 0)) {
if (s->dimms[0].sides > 1) {
// 2R/NC
MCHBAR32_AND_OR(C0CKECTRL, ~1, 0x300001);
MCHBAR32(C0DRA01) = 0x00000101;
MCHBAR32(C0DRB0) = 0x00040002;
MCHBAR32(C0DRB2) = w204[s->dimm_config[0]];
} else {
// 1R/NC
MCHBAR32_AND_OR(C0CKECTRL, ~1, 0x100001);
MCHBAR32(C0DRA01) = 0x00000001;
MCHBAR32(C0DRB0) = 0x00020002;
MCHBAR32(C0DRB2) = w204[s->dimm_config[0]];
}
} else if ((s->dimm_config[0] == 5) && rank_is_populated(s->dimms, 0, 0)) {
MCHBAR32_AND_OR(C0CKECTRL, ~1, 0x300001);
MCHBAR32(C0DRA01) = 0x00000101;
MCHBAR32(C0DRB0) = 0x00040002;
MCHBAR32(C0DRB2) = 0x00040004;
} else {
MCHBAR32_AND_OR(C0CKECTRL, ~1, w260[s->dimm_config[0]]);
MCHBAR32(C0DRA01) = w208[s->dimm_config[0]];
MCHBAR32(C0DRB0) = w200[s->dimm_config[0]];
MCHBAR32(C0DRB2) = w204[s->dimm_config[0]];
}
pci_write_config16(HOST_BRIDGE, 0xb0, tolud[s->dimm_config[0]]);
pci_write_config16(HOST_BRIDGE, 0xa0, tom[s->dimm_config[0]]);
pci_write_config16(HOST_BRIDGE, 0xa2, touud[s->dimm_config[0]]);
pci_write_config32(HOST_BRIDGE, 0xa4, gbsm[s->dimm_config[0]]);
pci_write_config32(HOST_BRIDGE, 0xa8, bgsm[s->dimm_config[0]]);
pci_write_config32(HOST_BRIDGE, 0xac, tsegmb[s->dimm_config[0]]);
}
/*
 * Busy-wait for approximately `del` microseconds using the 32-bit counter
 * read through HPET32(0xf0).
 *
 * The requested delay is scaled by 15 counter ticks per microsecond
 * (presumably matching the ~14.318 MHz HPET clock; confirm against the
 * platform's HPET period).
 *
 * The wait compares the number of ticks elapsed since entry against the
 * target using unsigned (modulo 2^32) arithmetic. This is correct across a
 * counter wrap-around, returns immediately for del == 0, and cannot miss the
 * end of the delay because the counter was sampled "too late".
 */
static void hpet_udelay(u32 del)
{
	const u32 ticks = del * 15;
	const u32 start = HPET32(0xf0);

	while ((u32)(HPET32(0xf0) - start) < ticks)
		;
}
/*
 * Sanity-check the four fields of the XCOMP register.
 *
 * The two 7-bit fields (bits 30:24 and 22:16) and the two 6-bit fields
 * (bits 13:8 and 5:0) must each lie strictly between their limits, and the
 * fields of each pair must not differ by more than 18 respectively 7.
 *
 * Returns 0 when all checks pass. Otherwise writes the fixed value 0x9718a729
 * to RCMEASBUFXOVR and returns 1.
 */
static u8 sdram_checkrcompoverride(void)
{
	const u32 xcomp = MCHBAR32(XCOMP);
	const u8 hi_a = (xcomp >> 24) & 0x7f;
	const u8 hi_b = (xcomp >> 16) & 0x7f;
	const u8 lo_a = (xcomp >> 8) & 0x3f;
	const u8 lo_b = xcomp & 0x3f;
	const u8 hi_delta = (hi_a > hi_b) ? (hi_a - hi_b) : (hi_b - hi_a);
	const u8 lo_delta = (lo_a > lo_b) ? (lo_a - lo_b) : (lo_b - lo_a);

	if (hi_delta <= 18 && lo_delta <= 7 &&
	    hi_a > 5 && hi_b > 5 && lo_a > 5 && lo_b > 5 &&
	    hi_a < 0x7a && hi_b < 0x7a && lo_a < 0x3a && lo_b < 0x3a)
		return 0;

	MCHBAR32(RCMEASBUFXOVR) = 0x9718a729;
	return 1;
}
/*
 * Run three compensation cycles, checking the XCOMP result after each one.
 * If none of the checks installed the fixed override value, the XCOMP value
 * with its 16-bit halves swapped and bits 31 and 15 set is written to
 * RCMEASBUFXOVR instead. A final compensation cycle is then run.
 *
 * s is not used by this function.
 */
static void sdram_rcompupdate(struct sysinfo *s)
{
	u8 remaining;
	u8 overridden = 0;
	u32 xcomp;

	MCHBAR8_AND(XCOMPDFCTRL, ~(1 << 3));
	MCHBAR8_AND(COMPCTRL1, ~(1 << 7));

	for (remaining = 3; remaining > 0; remaining--) {
		/* Start a cycle, give it time, then wait for bit 0 to clear */
		MCHBAR8_OR(COMPCTRL1, 1);
		hpet_udelay(1000);
		while (MCHBAR8(COMPCTRL1) & 1)
			;
		/* The check runs on every pass because it may write the override */
		if (sdram_checkrcompoverride())
			overridden = 1;
	}

	if (!overridden) {
		xcomp = MCHBAR32(XCOMP);
		MCHBAR32(RCMEASBUFXOVR) = (xcomp << 16) | (xcomp >> 16) | 0x80008000;
	}

	MCHBAR8_OR(COMPCTRL1, 1);
	hpet_udelay(1000);
	while (MCHBAR8(COMPCTRL1) & 1)
		;
}
/*
 * Issue one JEDEC command to a rank.
 *
 * The command mode `jmode` is placed into C0JEDEC (bits covered by mask 0x3e)
 * and the command is then triggered by a 32-bit read from an address built
 * from `jval` (shifted left by 3) and `rank` (multiplied by 1 << 27),
 * followed by a short delay.
 *
 * s is not used by this function.
 */
static void __attribute__((noinline))
sdram_jedec(struct sysinfo *s, u8 rank, u8 jmode, u16 jval)
{
	const u32 cmd_addr = (jval << 3) | (rank * (1 << 27));

	MCHBAR8_AND_OR(C0JEDEC, ~0x3e, jmode);
	read32((void *)cmd_addr);
	barrier();
	hpet_udelay(1); /* 1us */
}
/*
 * On the resume boot path only: set bit 27 of C0CKECTRL, select the normal
 * operation command in C0JEDEC, clear C0JEDEC bits 5:4 and set bits 31:30 of
 * C0REFRCTRL2. Does nothing on any other boot path.
 */
static void sdram_zqcl(struct sysinfo *s)
{
	if (s->boot_path != BOOT_PATH_RESUME)
		return;

	MCHBAR32_OR(C0CKECTRL, 1 << 27);
	MCHBAR8_AND_OR(C0JEDEC, ~0x0e, NORMAL_OP_CMD);
	MCHBAR8_AND(C0JEDEC, ~0x30);
	MCHBAR32_AND_OR(C0REFRCTRL2, ~(3 << 30), 3 << 30);
}
/*
 * Send the fixed 12-step JEDEC initialisation sequence to every populated
 * rank. MRS commands get the mode register value derived from the selected
 * CAS latency and tWR OR-ed in; EMRS1 commands get the Rtt_nom bits OR-ed in.
 */
static void sdram_jedecinit(struct sysinfo *s)
{
	struct jedeclist {
		char debug[15];
		u8 cmd;
		u16 val;
	};
	static const struct jedeclist jedec[12] = {
		{ .debug = " NOP ",         .cmd = NOP_CMD,        .val = 0 },
		{ .debug = " PRE CHARGE ",  .cmd = PRE_CHARGE_CMD, .val = 0 },
		{ .debug = " EMRS2 ",       .cmd = EMRS2_CMD,      .val = 0 },
		{ .debug = " EMRS3 ",       .cmd = EMRS3_CMD,      .val = 0 },
		{ .debug = " EMRS1 ",       .cmd = EMRS1_CMD,      .val = 0 },
		{ .debug = " DLL RESET ",   .cmd = MRS_CMD,        .val = (1 << 8) },
		{ .debug = " PRE CHARGE ",  .cmd = PRE_CHARGE_CMD, .val = 0 },
		{ .debug = " AUTOREFRESH",  .cmd = CBR_CMD,        .val = 0 },
		{ .debug = " AUTOREFRESH",  .cmd = CBR_CMD,        .val = 0 },
		{ .debug = " INITIALISE ",  .cmd = MRS_CMD,        .val = 0 },
		{ .debug = " EMRS1 OCD ",   .cmd = EMRS1_CMD,
		  .val = (1 << 9) | (1 << 8) | (1 << 7) },
		{ .debug = " EMRS1 EXIT ",  .cmd = EMRS1_CMD,      .val = 0 },
	};
	u8 rank, step, ch;
	u16 payload;

	/* Mode register value: CAS in bits 6:4, (tWR - 1) from bit 9 up, low bits 0xb */
	const u16 mrs = (s->selected_timings.CAS << 4) |
			((s->selected_timings.tWR - 1) << 9) | 0xb;

	/* Bit 2 is always set; bit 6 is added when ranks 0 and 2 are both populated */
	const u16 rttnom =
		(rank_is_populated(s->dimms, 0, 0) && rank_is_populated(s->dimms, 0, 2))
		? ((1 << 2) | (1 << 6)) : (1 << 2);

	hpet_udelay(200); /* 200us */

	FOR_EACH_POPULATED_RANK(s->dimms, ch, rank) {
		for (step = 0; step < sizeof(jedec) / sizeof(jedec[0]); step++) {
			PRINTK_DEBUG("Rank:%d Jedec:%14s...", rank, jedec[step].debug);
			payload = jedec[step].val;
			if (jedec[step].cmd == EMRS1_CMD)
				payload |= rttnom;
			else if (jedec[step].cmd == MRS_CMD)
				payload |= mrs;
			sdram_jedec(s, rank, jedec[step].cmd, payload);
			PRINTK_DEBUG("done\n");
		}
	}
}
/*
 * Miscellaneous final settings: program C0DYNRDCTRL bits 17:8 with
 * (4 << 13) | (6 << 8), clear C0DYNRDCTRL bit 7 and set bit 0 of the top byte
 * of C0REFRCTRL. On the resume path the remaining work is delegated to
 * sdram_zqcl(); otherwise C0JEDEC is switched to the normal operation command.
 */
static void sdram_misc(struct sysinfo *s)
{
	const u32 dynrd = (4 << 13) | (6 << 8);

	MCHBAR32_AND_OR(C0DYNRDCTRL, ~0x3ff00, dynrd);
	MCHBAR8_AND(C0DYNRDCTRL, ~(1 << 7));
	MCHBAR8_OR(C0REFRCTRL + 3, 1);

	if (s->boot_path == BOOT_PATH_RESUME) {
		sdram_zqcl(s);
		return;
	}

	MCHBAR8_AND_OR(C0JEDEC, ~0x0e, NORMAL_OP_CMD);
	MCHBAR8_AND(C0JEDEC, ~0x30);
}
/*
 * Inspect config registers 0xa2 and 0xa4 of PCI device 0:1f.0 and trigger a
 * full reset when bit 7 of register 0xa2 was found set.
 *
 * Bit 7 of 0xa2 is written back inverted, bit 1 of 0xa4 is always cleared,
 * and when bit 2 of 0xa2 is set, bits 5:3 of 0xa4 are set as well.
 */
static void sdram_checkreset(void)
{
	u8 pmcon2 = pci_read_config8(PCI_DEV(0, 0x1f, 0), 0xa2);
	u8 pmcon3 = pci_read_config8(PCI_DEV(0, 0x1f, 0), 0xa4);
	const u8 reset = (pmcon2 & 0x80) ? 1 : 0;

	pmcon3 &= ~0x2;

	/* Toggle bit 7: cleared when it was set, set when it was clear */
	pmcon2 ^= 0x80;

	/* Bit 2 of pmcon2 itself is written back exactly as it was read */
	if (pmcon2 & 0x4)
		pmcon3 |= 0x30 | (1 << 3);

	pci_write_config8(PCI_DEV(0, 0x1f, 0), 0xa2, pmcon2);
	pci_write_config8(PCI_DEV(0, 0x1f, 0), 0xa4, pmcon3);

	if (reset)
		full_reset();
}
/*
 * Program the rank attribute register (C0DRA01), the populated-rank bits in
 * C0CKECTRL and the cumulative rank boundary registers starting at C0DRB0,
 * and add up the capacity of channel 0 in s->channel_capacity[0].
 *
 * NOTE(review): a dratab entry of 0xff presumably marks an unsupported DIMM
 * geometry. Neither the dratab indices nor the resulting dradrb index are
 * range-checked here - confirm that callers reject such DIMMs beforehand.
 */
static void sdram_dradrb(struct sysinfo *s)
{
	/* Attribute code indexed by [banks][width][cols - 9][rows - 12] */
	static const u8 dratab[2][2][2][4] = {
		{
			{
				{0xff, 0xff, 0xff, 0xff},
				{0xff, 0x00, 0x02, 0xff}
			},
			{
				{0xff, 0x01, 0xff, 0xff},
				{0xff, 0x03, 0xff, 0x06}
			}
		},
		{
			{
				{0xff, 0xff, 0xff, 0xff},
				{0xff, 0x04, 0x06, 0x08}
			},
			{
				{0xff, 0xff, 0xff, 0xff},
				{0x05, 0x07, 0x09, 0xff}
			}
		}
	};
	/* One row per attribute code; only the last column (DRB) is used here */
	static const u8 dradrb[10][6] = {
		/* Row   Col   Bank  Width    DRB */
		{0x01, 0x01, 0x00, 0x08, 0, 0x04},
		{0x01, 0x00, 0x00, 0x10, 0, 0x02},
		{0x02, 0x01, 0x00, 0x08, 1, 0x08},
		{0x01, 0x01, 0x00, 0x10, 1, 0x04},
		{0x01, 0x01, 0x01, 0x08, 1, 0x08},
		{0x00, 0x01, 0x01, 0x10, 1, 0x04},
		{0x02, 0x01, 0x01, 0x08, 2, 0x10},
		{0x01, 0x01, 0x01, 0x10, 2, 0x08},
		{0x03, 0x01, 0x01, 0x08, 3, 0x20},
		{0x02, 0x01, 0x01, 0x10, 3, 0x10},
	};
	u8 ch, r, dimm;
	u16 drb_reg, boundary;
	u32 attr, all_attrs, rank_mask, sel;

	/* One attribute byte per populated rank; two ranks belong to each DIMM */
	all_attrs = 0;
	FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
		dimm = r / 2;
		PRINTK_DEBUG("RANK %d PRESENT\n", r);
		attr = dratab[s->dimms[dimm].banks]
			     [s->dimms[dimm].width]
			     [s->dimms[dimm].cols - 9]
			     [s->dimms[dimm].rows - 12];
		if (s->dimms[dimm].banks == 1)
			attr |= 0x80;
		all_attrs |= attr << (r * 8);
	}
	MCHBAR32(C0DRA01) = all_attrs;
	PRINTK_DEBUG("C0DRA = 0x%08x\n", all_attrs);

	/* One bit per populated rank goes into the high nibble of C0CKECTRL byte 2 */
	rank_mask = 0;
	FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
		rank_mask |= 1 << r;
	}
	MCHBAR8_AND_OR(C0CKECTRL + 2, ~0xf0, (u8)(rank_mask << 4) & 0xf0);

	if (ONLY_DIMMA_IS_POPULATED(s->dimms, 0) || ONLY_DIMMB_IS_POPULATED(s->dimms, 0)) {
		MCHBAR8_OR(C0CKECTRL, 1);
	}

	/* Every rank gets a boundary register; unpopulated ranks repeat the last value */
	drb_reg = C0DRB0;
	boundary = 0;
	FOR_EACH_RANK(ch, r) {
		if (rank_is_populated(s->dimms, ch, r)) {
			sel = (all_attrs >> (8 * r)) & 0x7f;
			boundary += dradrb[sel][5];
			s->channel_capacity[0] += dradrb[sel][5] << 6;
		}
		MCHBAR16(drb_reg) = boundary;
		drb_reg += 2;
	}
	printk(BIOS_DEBUG, "Total memory = %dMB\n", s->channel_capacity[0]);
}
/*
 * Take `count` samples of bit 6 of the MCHBAR byte register at `dqshighaddr`.
 *
 * Before each sample, bit 1 of C0RSTCTL is pulsed low then high and a 32-bit
 * read is issued from `strobeaddr`. All `count` samples are always taken,
 * even after a mismatch has been seen.
 *
 * Returns 1 if every sample equalled `highlow` (also when count is 0),
 * otherwise 0.
 */
static u8 sampledqs(u32 dqshighaddr, u32 strobeaddr, u8 highlow, u8 count)
{
	u8 all_match = 1;
	u8 sample;

	for (; count > 0; count--) {
		MCHBAR8_AND(C0RSTCTL, ~2);
		hpet_udelay(1);
		MCHBAR8_OR(C0RSTCTL, 2);
		hpet_udelay(1);

		barrier();
		read32((void *)strobeaddr);
		barrier();
		hpet_udelay(1);

		sample = (MCHBAR8(dqshighaddr) >> 6) & 1;
		if (sample != highlow)
			all_match = 0;
	}

	return all_match;
}
/*
 * Advance the receive-enable timing of one lane by a single medium step.
 *
 * *medium counts 0..3 and lives in the two-bit field of C0RCVMISCCTL2 that
 * belongs to `lane` (bits lane*2+1 : lane*2). When it would overflow it wraps
 * to 0 and *coarse is incremented and written to bits 19:16 of C0STATRDCTRL.
 *
 * coarse: in/out, current coarse setting
 * medium: in/out, current medium setting of this lane
 * lane:   lane whose medium field is updated
 *
 * Only this lane's two-bit field is cleared before the new value is OR-ed in.
 * The previous wrap-around path used the mask (~3 << (lane * 2)), which
 * left-shifts a negative value and also clears the medium fields of every
 * lower-numbered lane.
 */
static void rcvenclock(u8 *coarse, u8 *medium, u8 lane)
{
	if (*medium < 3) {
		(*medium)++;
	} else {
		*medium = 0;
		(*coarse)++;
		/* The coarse value is written before the medium field, as before */
		MCHBAR32_AND_OR(C0STATRDCTRL, ~0x000f0000, *coarse << 16);
	}
	MCHBAR16_AND_OR(C0RCVMISCCTL2, (u16)~(3 << (lane * 2)), *medium << (lane * 2));
}
/*
 * Receive-enable training for channel 0.
 *
 * For each of the 8 lanes the function searches for a coarse/medium/PI
 * setting by stepping the settings and sampling bit 6 of C0MISCCTLy(lane)
 * through sampledqs(). The per-lane PI value is stored in s->pi[]. Afterwards
 * the smallest per-lane coarse value is programmed into C0STATRDCTRL, each
 * lane's offset from that minimum into C0COARSEDLY0, and the resulting
 * register values are saved in s->coarsectrl, s->coarsedelay, s->mediumphase
 * and s->readptrdelay.
 */
static void sdram_rcven(struct sysinfo *s)
{
u8 coarse, savecoarse;
u8 medium, savemedium;
u8 pi, savepi;
u8 lane;
u8 lanecoarse[8] = {0};
u8 minlanecoarse = 0xff;
u8 offset;
u8 maxlane = 8;
/* Since dra/drb is already set up we know that at address 0x00000000
we will always find the first available rank */
u32 strobeaddr = 0;
u32 dqshighaddr;
MCHBAR8_AND(C0RSTCTL, ~0x0c);
MCHBAR8_AND(CMNDQFIFORST, ~0x80);
PRINTK_DEBUG("rcven 0\n");
for (lane = 0; lane < maxlane; lane++) {
PRINTK_DEBUG("rcven lane %d\n", lane);
// trylaneagain:
/* Starting point: coarse = CAS + 1, medium = 0, PI = 0 */
dqshighaddr = C0MISCCTLy(lane);
coarse = s->selected_timings.CAS + 1;
pi = 0;
medium = 0;
MCHBAR32_AND_OR(C0STATRDCTRL, ~0x000f0000, coarse << 16);
MCHBAR16_AND_OR(C0RCVMISCCTL2, (u16)~(3 << (lane * 2)), medium << (lane * 2));
MCHBAR8_AND(C0RXRCVyDLL(lane), ~0x3f);
savecoarse = coarse;
savemedium = medium;
savepi = pi;
PRINTK_DEBUG("rcven 0.1\n");
// XXX comment out
// MCHBAR16_AND_OR(C0RCVMISCCTL1, (u16)~3 << (lane * 2), 1 << (lane * 2));
/* Step the clock until three consecutive samples read 0, or coarse exceeds 0xf */
while (sampledqs(dqshighaddr, strobeaddr, 0, 3) == 0) {
// printk(BIOS_DEBUG, "coarse=%d medium=%d\n", coarse, medium);
rcvenclock(&coarse, &medium, lane);
if (coarse > 0xf) {
PRINTK_DEBUG("Error: coarse > 0xf\n");
// goto trylaneagain;
break;
}
}
PRINTK_DEBUG("rcven 0.2\n");
/*
 * Keep stepping until three consecutive samples read 1, remembering the
 * setting in use just before each step.
 */
savecoarse = coarse;
savemedium = medium;
rcvenclock(&coarse, &medium, lane);
while (sampledqs(dqshighaddr, strobeaddr, 1, 3) == 0) {
savecoarse = coarse;
savemedium = medium;
rcvenclock(&coarse, &medium, lane);
if (coarse > 0xf) {
PRINTK_DEBUG("Error: coarse > 0xf\n");
//goto trylaneagain;
break;
}
}
PRINTK_DEBUG("rcven 0.3\n");
/* Go back to the remembered coarse/medium setting and refine with PI steps */
coarse = savecoarse;
medium = savemedium;
MCHBAR32_AND_OR(C0STATRDCTRL, ~0x000f0000, coarse << 16);
MCHBAR16_AND_OR(C0RCVMISCCTL2, (u16)~(0x3 << lane * 2), medium << (lane * 2));
/* Raise PI until three samples read 1; clamp to s->maxpi if that never happens */
while (sampledqs(dqshighaddr, strobeaddr, 1, 3) == 0) {
savepi = pi;
pi++;
if (pi > s->maxpi) {
// if (s->nodll) {
pi = savepi = s->maxpi;
break;
// }
}
MCHBAR8_AND_OR(C0RXRCVyDLL(lane), ~0x3f, pi << s->pioffset);
}
PRINTK_DEBUG("rcven 0.4\n");
/* Apply the last PI value that preceded the successful step */
pi = savepi;
MCHBAR8_AND_OR(C0RXRCVyDLL(lane), ~0x3f, pi << s->pioffset);
rcvenclock(&coarse, &medium, lane);
/* A failure here is only logged; training continues regardless */
if (sampledqs(dqshighaddr, strobeaddr, 1, 1) == 0) {
PRINTK_DEBUG("Error: DQS not high\n");
// goto trylaneagain;
}
PRINTK_DEBUG("rcven 0.5\n");
/* Decrease coarse until three samples read 0, stopping when coarse reaches 0 */
while (sampledqs(dqshighaddr, strobeaddr, 0, 3) == 0) {
coarse--;
MCHBAR32_AND_OR(C0STATRDCTRL, ~0x000f0000, coarse << 16);
if (coarse == 0) {
PRINTK_DEBUG("Error: DQS did not hit 0\n");
break;
}
}
PRINTK_DEBUG("rcven 0.6\n");
/* One final step forward, then record this lane's result */
rcvenclock(&coarse, &medium, lane);
s->pi[lane] = pi;
lanecoarse[lane] = coarse;
}
PRINTK_DEBUG("rcven 1\n");
/* Find the smallest coarse value over all lanes */
lane = maxlane;
do {
lane--;
if (minlanecoarse > lanecoarse[lane]) {
minlanecoarse = lanecoarse[lane];
}
} while (lane != 0);
/*
 * Program each lane's offset from the minimum into its two-bit field.
 * NOTE(review): offset is not masked to two bits before being shifted in;
 * a difference above 3 would spill into the neighbouring lane's field.
 */
lane = maxlane;
do {
lane--;
offset = lanecoarse[lane] - minlanecoarse;
MCHBAR16_AND_OR(C0COARSEDLY0, (u16)(~(3 << (lane * 2))), offset << (lane * 2));
} while (lane != 0);
MCHBAR32_AND_OR(C0STATRDCTRL, ~0x000f0000, minlanecoarse << 16);
/* Save the trained register values in the sysinfo structure */
s->coarsectrl = minlanecoarse;
s->coarsedelay = MCHBAR16(C0COARSEDLY0);
s->mediumphase = MCHBAR16(C0RCVMISCCTL2);
s->readptrdelay = MCHBAR16(C0RCVMISCCTL1);
PRINTK_DEBUG("rcven 2\n");
/* Clear bits 3:1 of C0RSTCTL, then set them again one at a time */
MCHBAR8_AND(C0RSTCTL, ~0x0e);
MCHBAR8_OR(C0RSTCTL, 0x02);
MCHBAR8_OR(C0RSTCTL, 0x04);
MCHBAR8_OR(C0RSTCTL, 0x08);
/* Toggle bit 7 of CMNDQFIFORST: set, clear, set */
MCHBAR8_OR(CMNDQFIFORST, 0x80);
MCHBAR8_AND(CMNDQFIFORST, ~0x80);
MCHBAR8_OR(CMNDQFIFORST, 0x80);
PRINTK_DEBUG("rcven 3\n");
}
/* NOTE: Unless otherwise specified, the values are expressed in MiB */
static void sdram_mmap_regs(struct sysinfo *s)
{
bool reclaim;
u32 mmiosize, tom, tolud, touud, reclaimbase, reclaimlimit;
u32 gfxbase, gfxsize, gttbase, gttsize, tsegbase, tsegsize;
u16 ggc;
u16 ggc_to_uma[10] = {0, 1, 4, 8, 16, 32, 48, 64, 128, 256};
u8 ggc_to_gtt[4] = {0, 1, 0, 0};
reclaimbase = 0;
reclaimlimit = 0;
ggc = pci_read_config16(HOST_BRIDGE, GGC);
printk(BIOS_DEBUG, "GGC = 0x%04x\n", ggc);
gfxsize = ggc_to_uma[(ggc & 0x00f0) >> 4];
gttsize = ggc_to_gtt[(ggc & 0x0300) >> 8];
tom = s->channel_capacity[0];
/* With GTT always being 1M, TSEG 1M is the only setting that can
be covered by SMRR which has alignment requirements. */
tsegsize = 1;
mmiosize = 1024;
reclaim = false;
tolud = MIN(4096 - mmiosize, tom);
if ((tom - tolud) > 64) {
reclaim = true;
}
if (reclaim) {
tolud = tolud & ~0x3f;
tom = tom & ~0x3f;
reclaimbase = MAX(4096, tom);
reclaimlimit = reclaimbase + (MIN(4096, tom) - tolud) - 0x40;
}
touud = tom;
if (reclaim) {
touud = reclaimlimit + 64;
}
gfxbase = tolud - gfxsize;
gttbase = gfxbase - gttsize;
tsegbase = gttbase - tsegsize;
/* Program the regs */
pci_write_config16(HOST_BRIDGE, TOLUD, (u16)(tolud << 4));
pci_write_config16<