blob: dbc373d1fb87a88b66af9d2b23a392cc4a30373e [file] [log] [blame]
/* SPDX-License-Identifier: GPL-2.0-or-later */
#include <cf9_reset.h>
#include <device/mmio.h>
#include <device/pci_ops.h>
#include <device/smbus_host.h>
#include <commonlib/helpers.h>
#include <console/console.h>
#include <delay.h>
#include <lib.h>
#include <southbridge/intel/common/hpet.h>
#include "pineview.h"
#include "raminit.h"
#include <spd.h>
#include <string.h>
/* Debugging macros */
#if CONFIG(DEBUG_RAM_SETUP)
#define PRINTK_DEBUG(x...) printk(BIOS_DEBUG, x)
#else
#define PRINTK_DEBUG(x...)
#endif
#define MAX_TCLK_667 0x30
#define MAX_TCLK_800 0x25
#define MAX_TAC_667 0x45
#define MAX_TAC_800 0x40
#define NOP_CMD (1 << 1)
#define PRE_CHARGE_CMD (1 << 2)
#define MRS_CMD ((1 << 2) | (1 << 1))
#define EMRS_CMD (1 << 3)
#define EMRS1_CMD (EMRS_CMD | (1 << 4))
#define EMRS2_CMD (EMRS_CMD | (1 << 5))
#define EMRS3_CMD (EMRS_CMD | (1 << 5) | (1 << 4))
#define ZQCAL_CMD ((1 << 3) | (1 << 1))
#define CBR_CMD ((1 << 3) | (1 << 2))
#define NORMAL_OP_CMD ((1 << 3) | (1 << 2) | (1 << 1))
#define UBDIMM 1
#define SODIMM 2
#define TOTAL_CHANNELS 1
#define TOTAL_DIMMS 2
#define DIMM_IS_POPULATED(dimms, idx) (dimms[idx].card_type != 0)
#define IF_DIMM_POPULATED(dimms, idx) if (dimms[idx].card_type != 0)
#define ONLY_DIMMA_IS_POPULATED(dimms, ch) (\
(DIMM_IS_POPULATED(dimms, (ch == 0) ? 0 : 2) && \
!DIMM_IS_POPULATED(dimms, (ch == 0) ? 1 : 3)))
#define ONLY_DIMMB_IS_POPULATED(dimms, ch) (\
(DIMM_IS_POPULATED(dimms, (ch == 0) ? 1 : 3) && \
!DIMM_IS_POPULATED(dimms, (ch == 0) ? 0 : 2)))
#define BOTH_DIMMS_ARE_POPULATED(dimms, ch) (\
(DIMM_IS_POPULATED(dimms, (ch == 0) ? 0 : 2) && \
(DIMM_IS_POPULATED(dimms, (ch == 0) ? 1 : 3))))
#define FOR_EACH_DIMM(idx) \
for (idx = 0; idx < TOTAL_DIMMS; ++idx)
#define FOR_EACH_POPULATED_DIMM(dimms, idx) \
FOR_EACH_DIMM(idx) IF_DIMM_POPULATED(dimms, idx)
#define CHANNEL_IS_POPULATED(dimms, idx) ((dimms[idx<<1].card_type != 0) || (dimms[(idx<<1) + 1].card_type != 0))
#define CHANNEL_IS_CARDF(dimms, idx) ((dimms[idx<<1].card_type == 0xf) || (dimms[(idx<<1) + 1].card_type == 0xf))
#define IF_CHANNEL_POPULATED(dimms, idx) if ((dimms[idx<<1].card_type != 0) || (dimms[(idx<<1) + 1].card_type != 0))
#define FOR_EACH_CHANNEL(idx) \
for (idx = 0; idx < TOTAL_CHANNELS; ++idx)
#define FOR_EACH_POPULATED_CHANNEL(dimms, idx) \
FOR_EACH_CHANNEL(idx) IF_CHANNEL_POPULATED(dimms, idx)
#define RANKS_PER_CHANNEL 4
#define FOR_EACH_RANK_IN_CHANNEL(r) \
for (r = 0; r < RANKS_PER_CHANNEL; ++r)
#define FOR_EACH_POPULATED_RANK_IN_CHANNEL(dimms, ch, r) \
FOR_EACH_RANK_IN_CHANNEL(r) if (rank_is_populated(dimms, ch, r))
#define FOR_EACH_RANK(ch, r) \
FOR_EACH_CHANNEL(ch) FOR_EACH_RANK_IN_CHANNEL(r)
#define FOR_EACH_POPULATED_RANK(dimms, ch, r) \
FOR_EACH_RANK(ch, r) if (rank_is_populated(dimms, ch, r))
static bool rank_is_populated(struct dimminfo dimms[], u8 ch, u8 r)
{
return ((dimms[ch<<1].card_type && ((r) < dimms[ch<<1].ranks))
|| (dimms[(ch<<1) + 1].card_type
&& ((r) >= 2)
&& ((r) < (dimms[(ch<<1) + 1].ranks + 2))));
}
static inline void barrier(void)
{
__asm__ __volatile__("": : :"memory");
}
static int decode_spd(struct dimminfo *d, int i)
{
d->type = 0;
if (d->spd_data[20] == 0x2) {
d->type = UBDIMM;
} else if (d->spd_data[20] == 0x4) {
d->type = SODIMM;
}
d->sides = (d->spd_data[5] & 0x7) + 1;
d->banks = (d->spd_data[17] >> 2) - 1;
d->chip_capacity = d->banks;
d->rows = d->spd_data[3];// - 12;
d->cols = d->spd_data[4];// - 9;
d->cas_latencies = 0x78;
d->cas_latencies &= d->spd_data[18];
if (d->cas_latencies == 0)
d->cas_latencies = 7;
d->tAAmin = d->spd_data[26];
d->tCKmin = d->spd_data[25];
d->width = (d->spd_data[13] >> 3) - 1;
d->page_size = (d->width+1) * (1 << d->cols); // Bytes
d->tRAS = d->spd_data[30];
d->tRP = d->spd_data[27];
d->tRCD = d->spd_data[29];
d->tWR = d->spd_data[36];
d->ranks = d->sides; // XXX
#if CONFIG(DEBUG_RAM_SETUP)
const char *ubso[2] = { "UB", "SO" };
#endif
PRINTK_DEBUG("%s-DIMM %d\n", &ubso[d->type][0], i);
PRINTK_DEBUG(" Sides : %d\n", d->sides);
PRINTK_DEBUG(" Banks : %d\n", d->banks);
PRINTK_DEBUG(" Ranks : %d\n", d->ranks);
PRINTK_DEBUG(" Rows : %d\n", d->rows);
PRINTK_DEBUG(" Cols : %d\n", d->cols);
PRINTK_DEBUG(" Page size : %d\n", d->page_size);
PRINTK_DEBUG(" Width : %d\n", (d->width + 1) * 8);
return 0;
}
/*
* RAM Config: DIMMB-DIMMA
* 0 EMPTY-EMPTY
* 1 EMPTY-x16SS
* 2 EMPTY-x16DS
* 3 x16SS-x16SS
* 4 x16DS-x16DS
* 5 EMPTY- x8DS
* 6 x8DS - x8DS
*/
static void find_ramconfig(struct sysinfo *s, u32 chan)
{
if (s->dimms[chan>>1].sides == 0) {
// NC
if (s->dimms[(chan>>1) + 1].sides == 0) {
// NC/NC
s->dimm_config[chan] = 0;
} else if (s->dimms[(chan>>1) + 1].sides == 1) {
// NC/{8,16}SS
s->dimm_config[chan] = 1;
} else {
// NC/DS
if (s->dimms[(chan>>1) + 1].width == 0) {
// NC/8DS
s->dimm_config[chan] = 5;
} else {
// NC/16DS
s->dimm_config[chan] = 2;
}
}
} else if (s->dimms[chan>>1].sides == 1) {
// SS
if (s->dimms[(chan>>1) + 1].sides == 0) {
// {8,16}SS/NC
s->dimm_config[chan] = 1;
} else if (s->dimms[(chan>>1) + 1].sides == 1) {
// SS/SS
if (s->dimms[chan>>1].width == 0) {
if (s->dimms[(chan>>1) + 1].width == 0) {
// 8SS/8SS
s->dimm_config[chan] = 3;
} else {
// 8SS/16SS
die("Mixed Not supported\n");
}
} else {
if (s->dimms[(chan>>1) + 1].width == 0) {
// 16SS/8SS
die("Mixed Not supported\n");
} else {
// 16SS/16SS
s->dimm_config[chan] = 3;
}
}
} else {
// {8,16}SS/8DS
die("Mixed Not supported\n");
}
} else {
// DS
if (s->dimms[(chan>>1) + 1].sides == 0) {
// DS/NC
if (s->dimms[chan>>1].width == 0) {
// 8DS/NC
s->dimm_config[chan] = 5;
} else {
s->dimm_config[chan] = 4;
}
} else if (s->dimms[(chan>>1) + 1].sides == 1) {
// 8DS/{8,16}SS
if (s->dimms[chan>>1].width == 0) {
die("Mixed Not supported\n");
} else {
if (s->dimms[(chan>>1) + 1].width == 0) {
die("Mixed Not supported\n");
} else {
// 16DS/16DS
s->dimm_config[chan] = 4;
}
}
} else {
// DS/DS
if (s->dimms[chan>>1].width == 0 && s->dimms[(chan>>1)+1].width == 0) {
// 8DS/8DS
s->dimm_config[chan] = 6;
}
}
}
}
static void sdram_read_spds(struct sysinfo *s)
{
u8 i, chan;
s->dt0mode = 0;
FOR_EACH_DIMM(i) {
if (i2c_eeprom_read(s->spd_map[i], 0, 64, s->dimms[i].spd_data) != 64)
s->dimms[i].card_type = 0;
s->dimms[i].card_type = s->dimms[i].spd_data[62] & 0x1f;
hexdump(s->dimms[i].spd_data, 64);
}
s->spd_type = 0;
FOR_EACH_POPULATED_DIMM(s->dimms, i) {
switch (s->dimms[i].spd_data[2]) {
case 0x8:
s->spd_type = DDR2;
break;
case 0xb:
default:
die("DIMM type mismatch\n");
break;
}
}
int err = 1;
FOR_EACH_POPULATED_DIMM(s->dimms, i) {
err = decode_spd(&s->dimms[i], i);
s->dt0mode |= (s->dimms[i].spd_data[49] & 0x2) >> 1;
}
if (err) {
die("No memory dimms, halt\n");
}
FOR_EACH_POPULATED_CHANNEL(s->dimms, chan) {
find_ramconfig(s, chan);
PRINTK_DEBUG(" Config[CH%d] : %d\n", chan, s->dimm_config[chan]);
}
}
#if CONFIG(DEBUG_RAM_SETUP)
static u32 fsb_reg_to_mhz(u32 speed)
{
return (speed * 133) + 667;
}
static u32 ddr_reg_to_mhz(u32 speed)
{
return (speed == 0) ? 667 : (speed == 1) ? 800 : 0;
}
#endif
// Return the position of the least significant set bit, 0-indexed.
// 0 does not have a lsb, so return -1 for error.
static int lsbpos(u8 val)
{
for (int i = 0; i < 8; i++)
if (val & (1 << i))
return i;
return -1;
}
// Return the position of the most significant set bit, 0-indexed.
// 0 does not have a msb, so return -1 for error.
static int msbpos(u8 val)
{
for (int i = 7; i >= 0; i--)
if (val & (1 << i))
return i;
return -1;
}
static void sdram_detect_smallest_params(struct sysinfo *s)
{
static const u16 mult[6] = {
3000, // 667
2500, // 800
};
u8 i;
u32 maxtras = 0;
u32 maxtrp = 0;
u32 maxtrcd = 0;
u32 maxtwr = 0;
u32 maxtrfc = 0;
u32 maxtwtr = 0;
u32 maxtrrd = 0;
u32 maxtrtp = 0;
FOR_EACH_POPULATED_DIMM(s->dimms, i) {
maxtras = MAX(maxtras, (s->dimms[i].spd_data[30] * 1000));
maxtrp = MAX(maxtrp, (s->dimms[i].spd_data[27] * 1000) >> 2);
maxtrcd = MAX(maxtrcd, (s->dimms[i].spd_data[29] * 1000) >> 2);
maxtwr = MAX(maxtwr, (s->dimms[i].spd_data[36] * 1000) >> 2);
maxtrfc = MAX(maxtrfc, (s->dimms[i].spd_data[42] * 1000) +
(s->dimms[i].spd_data[40] & 0xf));
maxtwtr = MAX(maxtwtr, (s->dimms[i].spd_data[37] * 1000) >> 2);
maxtrrd = MAX(maxtrrd, (s->dimms[i].spd_data[28] * 1000) >> 2);
maxtrtp = MAX(maxtrtp, (s->dimms[i].spd_data[38] * 1000) >> 2);
}
/*
* TODO: on DDR3 there might be some minimal required values for some
* Timings: MIN_TRAS = 9, MIN_TRP = 3, MIN_TRCD = 3, MIN_TWR = 3,
* MIN_TWTR = 4, MIN_TRRD = 2, MIN_TRTP = 4
*/
s->selected_timings.tRAS = MIN(24, DIV_ROUND_UP(maxtras,
mult[s->selected_timings.mem_clock]));
s->selected_timings.tRP = MIN(10, DIV_ROUND_UP(maxtrp,
mult[s->selected_timings.mem_clock]));
s->selected_timings.tRCD = MIN(10, DIV_ROUND_UP(maxtrcd,
mult[s->selected_timings.mem_clock]));
s->selected_timings.tWR = MIN(15, DIV_ROUND_UP(maxtwr,
mult[s->selected_timings.mem_clock]));
/* Needs to be even */
s->selected_timings.tRFC = 0xfe & (MIN(78, DIV_ROUND_UP(maxtrfc,
mult[s->selected_timings.mem_clock])) + 1);
s->selected_timings.tWTR = MIN(15, DIV_ROUND_UP(maxtwtr,
mult[s->selected_timings.mem_clock]));
s->selected_timings.tRRD = MIN(15, DIV_ROUND_UP(maxtrrd,
mult[s->selected_timings.mem_clock]));
s->selected_timings.tRTP = MIN(15, DIV_ROUND_UP(maxtrtp,
mult[s->selected_timings.mem_clock]));
PRINTK_DEBUG("Selected timings:\n");
PRINTK_DEBUG("\tFSB: %dMHz\n", fsb_reg_to_mhz(s->selected_timings.fsb_clock));
PRINTK_DEBUG("\tDDR: %dMHz\n", ddr_reg_to_mhz(s->selected_timings.mem_clock));
PRINTK_DEBUG("\tCAS: %d\n", s->selected_timings.CAS);
PRINTK_DEBUG("\ttRAS: %d\n", s->selected_timings.tRAS);
PRINTK_DEBUG("\ttRP: %d\n", s->selected_timings.tRP);
PRINTK_DEBUG("\ttRCD: %d\n", s->selected_timings.tRCD);
PRINTK_DEBUG("\ttWR: %d\n", s->selected_timings.tWR);
PRINTK_DEBUG("\ttRFC: %d\n", s->selected_timings.tRFC);
PRINTK_DEBUG("\ttWTR: %d\n", s->selected_timings.tWTR);
PRINTK_DEBUG("\ttRRD: %d\n", s->selected_timings.tRRD);
PRINTK_DEBUG("\ttRTP: %d\n", s->selected_timings.tRTP);
}
static void sdram_detect_ram_speed(struct sysinfo *s)
{
u8 cas, reg8;
u32 reg32;
u32 freq = 0;
u32 fsb = 0;
u8 i;
u8 commoncas = 0;
u8 highcas = 0;
u8 lowcas = 0;
// Core frequency
fsb = (pci_read_config8(HOST_BRIDGE, 0xe3) & 0x70) >> 4;
if (fsb) {
fsb = 5 - fsb;
} else {
fsb = FSB_CLOCK_800MHz;
}
// DDR frequency
freq = (pci_read_config8(HOST_BRIDGE, 0xe3) & 0x80) >> 7;
freq |= (pci_read_config8(HOST_BRIDGE, 0xe4) & 0x03) << 1;
if (freq) {
freq = 6 - freq;
} else {
freq = MEM_CLOCK_800MHz;
}
// Detect a common CAS latency
commoncas = 0xff;
FOR_EACH_POPULATED_DIMM(s->dimms, i) {
commoncas &= s->dimms[i].spd_data[18];
}
if (commoncas == 0) {
die("No common CAS among dimms\n");
}
// commoncas is nonzero, so these calls will not error
u8 msbp = (u8)msbpos(commoncas);
u8 lsbp = (u8)lsbpos(commoncas);
// Start with fastest common CAS
cas = 0;
highcas = msbp;
lowcas = MAX(lsbp, 5);
while (cas == 0 && highcas >= lowcas) {
FOR_EACH_POPULATED_DIMM(s->dimms, i) {
switch (freq) {
case MEM_CLOCK_800MHz:
if ((s->dimms[i].spd_data[9] > 0x25) ||
(s->dimms[i].spd_data[10] > 0x40)) {
// CAS too fast, lower it
highcas--;
break;
} else {
cas = highcas;
}
break;
case MEM_CLOCK_667MHz:
default:
if ((s->dimms[i].spd_data[9] > 0x30) ||
(s->dimms[i].spd_data[10] > 0x45)) {
// CAS too fast, lower it
highcas--;
break;
} else {
cas = highcas;
}
break;
}
}
}
if (highcas < lowcas) {
// Timings not supported by MCH, lower the frequency
if (freq == MEM_CLOCK_800MHz) {
freq--;
PRINTK_DEBUG("Run DDR clock speed reduced due to timings\n");
} else {
die("Timings not supported by MCH\n");
}
cas = 0;
highcas = msbp;
lowcas = lsbp;
while (cas == 0 && highcas >= lowcas) {
FOR_EACH_POPULATED_DIMM(s->dimms, i) {
if ((s->dimms[i].spd_data[9] > 0x30) ||
(s->dimms[i].spd_data[10] > 0x45)) {
// CAS too fast, lower it
highcas--;
} else {
cas = highcas;
}
}
}
if (cas == 0) {
die("Unsupported dimms\n");
}
}
s->selected_timings.CAS = cas;
s->selected_timings.mem_clock = freq;
s->selected_timings.fsb_clock = fsb;
PRINTK_DEBUG("Drive Memory at %dMHz with CAS = %d clocks\n",
ddr_reg_to_mhz(s->selected_timings.mem_clock), s->selected_timings.CAS);
// Set memory frequency
if (s->boot_path == BOOT_PATH_RESET)
return;
mchbar_setbits32(PMSTS, 1 << 0);
reg32 = (mchbar_read32(CLKCFG) & ~0x70) | (1 << 10);
if (s->selected_timings.mem_clock == MEM_CLOCK_800MHz) {
reg8 = 3;
} else {
reg8 = 2;
}
reg32 |= reg8 << 4;
mchbar_write32(CLKCFG, reg32);
s->selected_timings.mem_clock = ((mchbar_read32(CLKCFG) >> 4) & 0x7) - 2;
if (s->selected_timings.mem_clock == MEM_CLOCK_800MHz) {
PRINTK_DEBUG("MCH validated at 800MHz\n");
s->nodll = 0;
s->maxpi = 63;
s->pioffset = 0;
} else if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
PRINTK_DEBUG("MCH validated at 667MHz\n");
s->nodll = 1;
s->maxpi = 15;
s->pioffset = 1;
} else {
PRINTK_DEBUG("MCH set to unknown (%02x)\n",
(uint8_t)s->selected_timings.mem_clock & 0xff);
}
}
static void sdram_clk_crossing(struct sysinfo *s)
{
u8 ddr_freq, fsb_freq;
static const u32 clkcross[2][2][4] = {
{
{0xffffffff, 0x05030305, 0x0000ffff, 0x00000000}, /* FSB = 667, DDR = 667 */
{0x1f1f1f1f, 0x2a1f1fa5, 0x00000000, 0x05000002}, /* FSB = 667, DDR = 800 */
},
{
{0x1f1f1f1f, 0x0d07070b, 0x00000000, 0x00000000}, /* FSB = 800, DDR = 667 */
{0xffffffff, 0x05030305, 0x0000ffff, 0x00000000}, /* FSB = 800, DDR = 800 */
},
};
ddr_freq = s->selected_timings.mem_clock;
fsb_freq = s->selected_timings.fsb_clock;
mchbar_write32(HMCCMP, clkcross[fsb_freq][ddr_freq][0]);
mchbar_write32(HMDCMP, clkcross[fsb_freq][ddr_freq][1]);
mchbar_write32(HMBYPCP, clkcross[fsb_freq][ddr_freq][2]);
mchbar_write32(HMCCPEXT, 0);
mchbar_write32(HMDCPEXT, clkcross[fsb_freq][ddr_freq][3]);
mchbar_setbits32(HMCCMC, 1 << 7);
if ((fsb_freq == 0) && (ddr_freq == 1)) {
mchbar_write8(CLKXSSH2MCBYPPHAS, 0);
mchbar_write32(CLKXSSH2MD, 0);
mchbar_write32(CLKXSSH2MD + 4, 0);
}
static const u32 clkcross2[2][2][8] = {
{
{ // FSB = 667, DDR = 667
0x00000000, 0x08010204, 0x00000000, 0x08010204,
0x00000000, 0x00000000, 0x00000000, 0x04080102,
},
{ // FSB = 667, DDR = 800
0x04080000, 0x10010002, 0x10000000, 0x20010208,
0x00000000, 0x00000004, 0x02040000, 0x08100102,
},
},
{
{ // FSB = 800, DDR = 667
0x10000000, 0x20010208, 0x04080000, 0x10010002,
0x00000000, 0x00000000, 0x08000000, 0x10200204,
},
{ // FSB = 800, DDR = 800
0x00000000, 0x08010204, 0x00000000, 0x08010204,
0x00000000, 0x00000000, 0x00000000, 0x04080102,
},
},
};
mchbar_write32(CLKXSSH2MCBYP, clkcross2[fsb_freq][ddr_freq][0]);
mchbar_write32(CLKXSSH2MCRDQ, clkcross2[fsb_freq][ddr_freq][0]);
mchbar_write32(CLKXSSH2MCRDCST, clkcross2[fsb_freq][ddr_freq][0]);
mchbar_write32(CLKXSSH2MCBYP + 4, clkcross2[fsb_freq][ddr_freq][1]);
mchbar_write32(CLKXSSH2MCRDQ + 4, clkcross2[fsb_freq][ddr_freq][1]);
mchbar_write32(CLKXSSH2MCRDCST + 4, clkcross2[fsb_freq][ddr_freq][1]);
mchbar_write32(CLKXSSMC2H, clkcross2[fsb_freq][ddr_freq][2]);
mchbar_write32(CLKXSSMC2H + 4, clkcross2[fsb_freq][ddr_freq][3]);
mchbar_write32(CLKXSSMC2HALT, clkcross2[fsb_freq][ddr_freq][4]);
mchbar_write32(CLKXSSMC2HALT + 4, clkcross2[fsb_freq][ddr_freq][5]);
mchbar_write32(CLKXSSH2X2MD, clkcross2[fsb_freq][ddr_freq][6]);
mchbar_write32(CLKXSSH2X2MD + 4, clkcross2[fsb_freq][ddr_freq][7]);
}
static void sdram_clkmode(struct sysinfo *s)
{
u8 ddr_freq;
u16 mpll_ctl;
mchbar_clrbits16(CSHRMISCCTL1, 1 << 8);
mchbar_clrbits8(CSHRMISCCTL1, 0x3f);
if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
ddr_freq = 0;
mpll_ctl = 1;
} else {
ddr_freq = 1;
mpll_ctl = (1 << 8) | (1 << 5);
}
if (s->boot_path != BOOT_PATH_RESET)
mchbar_clrsetbits16(MPLLCTL, 0x033f, mpll_ctl);
mchbar_write32(C0GNT2LNCH1, 0x58001117);
mchbar_setbits32(C0STATRDCTRL, 1 << 23);
const u32 cas_to_reg[2][4] = {
{0x00000000, 0x00030100, 0x0c240201, 0x00000000}, /* DDR = 667 */
{0x00000000, 0x00030100, 0x0c240201, 0x10450302} /* DDR = 800 */
};
mchbar_write32(C0GNT2LNCH2, cas_to_reg[ddr_freq][s->selected_timings.CAS - 3]);
}
static void sdram_timings(struct sysinfo *s)
{
u8 i, j, ch, r, ta1, ta2, ta3, ta4, trp, bank, page, flag;
u8 reg8, wl;
u16 reg16;
u32 reg32, reg2;
static const u8 pagetab[2][2] = {
{0x0e, 0x12},
{0x10, 0x14},
};
/* Only consider DDR2 */
wl = s->selected_timings.CAS - 1;
ta1 = ta2 = 6;
ta3 = s->selected_timings.CAS;
ta4 = 8;
s->selected_timings.tRFC = (s->selected_timings.tRFC + 1) & 0xfe;
trp = 0;
bank = 1;
page = 0;
mchbar_write8(C0LATCTRL, (wl - 3) << 4 | (s->selected_timings.CAS - 3));
FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
i = ch << 1;
if (s->dimms[i].banks == 1) {
trp = 1;
bank = 0;
}
if (s->dimms[i].page_size == 2048) {
page = 1;
}
}
PRINTK_DEBUG("trp=%d bank=%d page=%d\n",trp, bank, page);
if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
flag = 0;
} else {
flag = 1;
}
mchbar_setbits8(C0PVCFG, 3);
mchbar_write16(C0CYCTRKPCHG, (wl + 4 + s->selected_timings.tWR) << 6 |
(2 + MAX(s->selected_timings.tRTP, 2)) << 2 | 1);
reg32 = (bank << 21) | (s->selected_timings.tRRD << 17) |
(s->selected_timings.tRP << 13) | ((s->selected_timings.tRP + trp) << 9) |
s->selected_timings.tRFC;
if (bank == 0) {
reg32 |= (pagetab[flag][page] << 22);
}
/* FIXME: Why not do a single dword write? */
mchbar_write16(C0CYCTRKACT + 0, (u16)(reg32));
mchbar_write16(C0CYCTRKACT + 2, (u16)(reg32 >> 16));
/* FIXME: Only applies to DDR2 */
reg16 = (mchbar_read16(C0CYCTRKACT + 2) & 0x0fc0) >> 6;
mchbar_clrsetbits16(SHCYCTRKCKEL, 0x3f << 7, reg16 << 7);
reg16 = (s->selected_timings.tRCD << 12) | (4 << 8) | (ta2 << 4) | ta4;
mchbar_write16(C0CYCTRKWR, reg16);
reg32 = (s->selected_timings.tRCD << 17) | ((wl + 4 + s->selected_timings.tWTR) << 12) |
(ta3 << 8) | (4 << 4) | ta1;
mchbar_write32(C0CYCTRKRD, reg32);
reg16 = ((s->selected_timings.tRP + trp) << 9) | s->selected_timings.tRFC;
/* FIXME: Why not do a single word write? */
mchbar_write8(C0CYCTRKREFR + 0, (u8)(reg16));
mchbar_write8(C0CYCTRKREFR + 1, (u8)(reg16 >> 8));
mchbar_clrsetbits16(C0CKECTRL, 0x1ff << 1, 100 << 1);
mchbar_clrsetbits8(C0CYCTRKPCHG2, 0x3f, s->selected_timings.tRAS);
mchbar_write16(C0ARBCTRL, 0x2310);
mchbar_clrsetbits8(C0ADDCSCTRL, 0x1f, 1);
if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
reg32 = 3000;
} else {
reg32 = 2500;
}
if (s->selected_timings.fsb_clock == FSB_CLOCK_667MHz) {
reg2 = 6000;
} else {
reg2 = 5000;
}
reg16 = (u16)((((s->selected_timings.CAS + 7) * (reg32)) / reg2) << 8);
mchbar_clrsetbits16(C0STATRDCTRL, 0x1f << 8, reg16);
flag = 0;
if (wl > 2) {
flag = 1;
}
reg16 = (u8)(wl - 1 - flag);
reg16 |= reg16 << 4;
reg16 |= flag << 8;
mchbar_clrsetbits16(C0WRDATACTRL, 0x1ff, reg16);
mchbar_write16(C0RDQCTRL, 0x1585);
mchbar_clrbits8(C0PWLRCTRL, 0x1f);
/* rdmodwr_window[5..0] = CL+4+5 265[13..8] (264[21..16]) */
mchbar_clrsetbits16(C0PWLRCTRL, 0x3f << 8, (s->selected_timings.CAS + 9) << 8);
if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
reg16 = 0x0514;
reg32 = 0x0a28;
} else {
reg16 = 0x0618;
reg32 = 0x0c30;
}
mchbar_clrsetbits32(C0REFRCTRL2, 0xfffff << 8, 0x3f << 22 | reg32 << 8);
/* FIXME: Is this weird access necessary? Reference code does it */
mchbar_write8(C0REFRCTRL + 3, 0);
mchbar_clrsetbits16(C0REFCTRL, 0x3fff, reg16);
/* NPUT Static Mode */
mchbar_setbits8(C0DYNRDCTRL, 1 << 0);
mchbar_clrsetbits32(C0STATRDCTRL, 0x7f << 24, 0xb << 25);
i = s->selected_timings.mem_clock;
j = s->selected_timings.fsb_clock;
if (i > j) {
mchbar_setbits32(C0STATRDCTRL, 1 << 24);
}
mchbar_clrbits8(C0RDFIFOCTRL, 3);
mchbar_clrsetbits16(C0WRDATACTRL, 0x1f << 10, (wl + 10) << 10);
mchbar_clrsetbits32(C0CKECTRL, 7 << 24 | 7 << 17, 3 << 24 | 3 << 17);
reg16 = 0x15 << 6;
reg16 |= 0x1f;
reg16 |= (0x6 << 12);
mchbar_clrsetbits16(C0REFRCTRL + 4, 0x7fff, reg16);
reg32 = (0x6 << 27) | (1 << 25); /* FIXME: For DDR3, set BIT26 as well */
mchbar_clrsetbits32(C0REFRCTRL2, 3 << 28, reg32 << 8);
mchbar_clrsetbits8(C0REFRCTRL + 3, 0xfa, reg32 >> 24);
mchbar_clrbits8(C0JEDEC, 1 << 7);
mchbar_clrbits8(C0DYNRDCTRL, 3 << 1);
/* Note: This is a 64-bit register, [34..30] = 0b00110 is split across two writes */
reg32 = ((6 & 3) << 30) | (4 << 25) | (1 << 20) | (8 << 15) | (6 << 10) | (4 << 5) | 1;
mchbar_write32(C0WRWMFLSH, reg32);
mchbar_clrsetbits16(C0WRWMFLSH + 4, 0x1ff, 8 << 3 | 6 >> 2);
mchbar_setbits16(SHPENDREG, 0x1c00 | 0x1f << 5);
/* FIXME: Why not do a single word write? */
mchbar_clrsetbits8(SHPAGECTRL, 0xff, 0x40);
mchbar_clrsetbits8(SHPAGECTRL + 1, 0x07, 0x05);
mchbar_setbits8(SHCMPLWRCMD, 0x1f);
reg8 = (3 << 6);
reg8 |= (s->dt0mode << 4);
reg8 |= 0x0c;
mchbar_clrsetbits8(SHBONUSREG, 0xdf, reg8);
mchbar_clrbits8(CSHRWRIOMLNS, 1 << 1);
mchbar_clrsetbits8(C0MISCTM, 0x07, 0x02);
mchbar_clrsetbits16(C0BYPCTRL, 0xff << 2, 4 << 2);
/* [31..29] = 0b010 for kN = 2 (2N) */
reg32 = (2 << 29) | (1 << 28) | (1 << 23);
mchbar_clrsetbits32(WRWMCONFIG, 0xffb << 20, reg32);
reg8 = (u8)((mchbar_read16(C0CYCTRKACT) & 0xe000) >> 13);
reg8 |= (u8)((mchbar_read16(C0CYCTRKACT + 2) & 1) << 3);
mchbar_clrsetbits8(BYPACTSF, 0xf << 4, reg8 << 4);
reg8 = (u8)((mchbar_read32(C0CYCTRKRD) & 0x000f0000) >> 17);
mchbar_clrsetbits8(BYPACTSF, 0xf, reg8);
/* FIXME: Why not clear everything at once? */
mchbar_clrbits8(BYPKNRULE, 0xfc);
mchbar_clrbits8(BYPKNRULE, 0x03);
mchbar_clrbits8(SHBONUSREG, 0x03);
mchbar_setbits8(C0BYPCTRL, 1 << 0);
mchbar_setbits16(CSHRMISCCTL1, 1 << 9);
for (i = 0; i < 8; i++) {
/* FIXME: Hardcoded for DDR2 SO-DIMMs */
mchbar_clrsetbits32(C0DLLRCVCTLy(i), 0x3f3f3f3f, 0x0c0c0c0c);
}
/* RDCS to RCVEN delay: Program coarse common to all bytelanes to default tCL + 1 */
mchbar_clrsetbits32(C0STATRDCTRL, 0xf << 16, (s->selected_timings.CAS + 1) << 16);
/* Program RCVEN delay with DLL-safe settings */
for (i = 0; i < 8; i++) {
mchbar_clrbits8(C0RXRCVyDLL(i), 0x3f);
mchbar_clrbits16(C0RCVMISCCTL2, 3 << (i * 2));
mchbar_clrbits16(C0RCVMISCCTL1, 3 << (i * 2));
mchbar_clrbits16(C0COARSEDLY0, 3 << (i * 2));
}
mchbar_clrbits8(C0DLLPIEN, 1 << 0); /* Power up receiver */
mchbar_setbits8(C0DLLPIEN, 1 << 1); /* Enable RCVEN DLL */
mchbar_setbits8(C0DLLPIEN, 1 << 2); /* Enable receiver DQS DLL */
mchbar_setbits32(C0COREBONUS, 0x000c0400);
mchbar_setbits32(C0CMDTX1, 1 << 31);
}
/* Program clkset0's register for Kcoarse, Tap, PI, DBEn and DBSel */
static void sdram_p_clkset0(const struct pllparam *pll, u8 f, u8 i)
{
mchbar_clrsetbits16(C0CKTX, 0xc440,
(pll->clkdelay[f][i] << 14) |
(pll->dben[f][i] << 10) |
(pll->dbsel[f][i] << 6));
mchbar_clrsetbits8(C0TXCK0DLL, 0x3f, pll->pi[f][i]);
}
/* Program clkset1's register for Kcoarse, Tap, PI, DBEn and DBSel */
static void sdram_p_clkset1(const struct pllparam *pll, u8 f, u8 i)
{
mchbar_clrsetbits32(C0CKTX, 0x00030880,
(pll->clkdelay[f][i] << 16) |
(pll->dben[f][i] << 11) |
(pll->dbsel[f][i] << 7));
mchbar_clrsetbits8(C0TXCK1DLL, 0x3f, pll->pi[f][i]);
}
/* Program CMD0 and CMD1 registers for Kcoarse, Tap, PI, DBEn and DBSel */
static void sdram_p_cmd(const struct pllparam *pll, u8 f, u8 i)
{
u8 reg8;
/* Clock Group Index 3 */
reg8 = pll->dbsel[f][i] << 5;
reg8 |= pll->dben[f][i] << 6;
mchbar_clrsetbits8(C0CMDTX1, 3 << 5, reg8);
reg8 = pll->clkdelay[f][i] << 4;
mchbar_clrsetbits8(C0CMDTX2, 3 << 4, reg8);
reg8 = pll->pi[f][i];
mchbar_clrsetbits8(C0TXCMD0DLL, 0x3f, reg8);
mchbar_clrsetbits8(C0TXCMD1DLL, 0x3f, reg8);
}
/* Program CTRL registers for Kcoarse, Tap, PI, DBEn and DBSel */
static void sdram_p_ctrl(const struct pllparam *pll, u8 f, u8 i)
{
u8 reg8;
u32 reg32;
/* CTRL0 and CTRL1 */
reg32 = ((u32)pll->dbsel[f][i]) << 20;
reg32 |= ((u32)pll->dben[f][i]) << 21;
reg32 |= ((u32)pll->dbsel[f][i]) << 22;
reg32 |= ((u32)pll->dben[f][i]) << 23;
reg32 |= ((u32)pll->clkdelay[f][i]) << 24;
reg32 |= ((u32)pll->clkdelay[f][i]) << 27;
mchbar_clrsetbits32(C0CTLTX2, 0x01bf0000, reg32);
reg8 = pll->pi[f][i];
mchbar_clrsetbits8(C0TXCTL0DLL, 0x3f, reg8);
mchbar_clrsetbits8(C0TXCTL1DLL, 0x3f, reg8);
/* CTRL2 and CTRL3 */
reg32 = ((u32)pll->dbsel[f][i]) << 12;
reg32 |= ((u32)pll->dben[f][i]) << 13;
reg32 |= ((u32)pll->dbsel[f][i]) << 8;
reg32 |= ((u32)pll->dben[f][i]) << 9;
reg32 |= ((u32)pll->clkdelay[f][i]) << 14;
reg32 |= ((u32)pll->clkdelay[f][i]) << 10;
mchbar_clrsetbits32(C0CMDTX2, 0xff << 8, reg32);
reg8 = pll->pi[f][i];
mchbar_clrsetbits8(C0TXCTL2DLL, 0x3f, reg8);
mchbar_clrsetbits8(C0TXCTL3DLL, 0x3f, reg8);
}
static void sdram_p_dqs(struct pllparam *pll, u8 f, u8 clk)
{
u8 rank, dqs, reg8, j;
u32 reg32;
j = clk - 40;
reg8 = 0;
reg32 = 0;
rank = j % 4;
dqs = j / 4;
reg32 |= ((u32)pll->dben[f][clk]) << (dqs + 9);
reg32 |= ((u32)pll->dbsel[f][clk]) << dqs;
mchbar_clrsetbits32(C0DQSRyTX1(rank), 1 << (dqs + 9) | 1 << dqs, reg32);
reg32 = ((u32)pll->clkdelay[f][clk]) << ((dqs * 2) + 16);
mchbar_clrsetbits32(C0DQSDQRyTX3(rank), 1 << (dqs * 2 + 17) | 1 << (dqs * 2 + 16),
reg32);
reg8 = pll->pi[f][clk];
mchbar_clrsetbits8(C0TXDQS0R0DLL + j, 0x3f, reg8);
}
static void sdram_p_dq(struct pllparam *pll, u8 f, u8 clk)
{
u8 rank, dq, reg8, j;
u32 reg32;
j = clk - 8;
reg8 = 0;
reg32 = 0;
rank = j % 4;
dq = j / 4;
reg32 |= ((u32)pll->dben[f][clk]) << (dq + 9);
reg32 |= ((u32)pll->dbsel[f][clk]) << dq;
mchbar_clrsetbits32(C0DQRyTX1(rank), 1 << (dq + 9) | 1 << dq, reg32);
reg32 = ((u32)pll->clkdelay[f][clk]) << (dq*2);
mchbar_clrsetbits32(C0DQSDQRyTX3(rank), 1 << (dq * 2 + 1) | 1 << (dq * 2), reg32);
reg8 = pll->pi[f][clk];
mchbar_clrsetbits8(C0TXDQ0R0DLL + j, 0x3f, reg8);
}
/* WDLL programming: Perform HPLL/MPLL calibration after write levelization */
static void sdram_calibratepll(struct sysinfo *s, u8 pidelay)
{
struct pllparam pll = {
.pi = {
{ /* DDR = 667 */
3, 3, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7,
7, 7, 7, 7, 4, 4, 4, 4, 4, 4, 4, 4,
4, 4, 4, 4, 4, 4, 4, 4, 5, 5, 5, 5,
7, 7, 7, 7, 3, 3, 3, 3, 3, 3, 3, 3,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 1, 1, 1, 1, 3, 3, 3, 3,
},
{ /* DDR = 800 */
53, 53, 10, 10, 5, 5, 5, 5, 27, 27, 27, 27,
34, 34, 34, 34, 34, 34, 34, 34, 39, 39, 39, 39,
47, 47, 47, 47, 44, 44, 44, 44, 47, 47, 47, 47,
47, 47, 47, 47, 59, 59, 59, 59, 2, 2, 2, 2,
2, 2, 2, 2, 7, 7, 7, 7, 15, 15, 15, 15,
12, 12, 12, 12, 15, 15, 15, 15, 15, 15, 15, 15,
}},
.dben = {
{ /* DDR = 667 */
0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
},
{ /* DDR = 800 */
1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0,
1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0,
}},
.dbsel = {
{ /* DDR = 667 */
0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
},
{ /* DDR = 800 */
0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0,
1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0,
}},
.clkdelay = {
{ /* DDR = 667 */
0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
},
{ /* DDR = 800 */
0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
}}
};
u8 i, f;
if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
f = 0;
} else {
f = 1;
}
for (i = 0; i < 72; i++) {
pll.pi[f][i] += pidelay;
}
/* Disable Dynamic DQS Slave Setting Per Rank */
mchbar_clrbits8(CSHRDQSCMN, 1 << 7);
mchbar_clrsetbits16(CSHRPDCTL4, 0x3fff, 0x1fff);
sdram_p_clkset0(&pll, f, 0);
sdram_p_clkset1(&pll, f, 1);
sdram_p_cmd(&pll, f, 2);
sdram_p_ctrl(&pll, f, 4);
for (i = 0; i < 32; i++) {
sdram_p_dqs(&pll, f, i + 40);
}
for (i = 0; i < 32; i++) {
sdram_p_dq(&pll, f, i + 8);
}
}
/* Perform HMC hardware calibration */
static void sdram_calibratehwpll(struct sysinfo *s)
{
u8 reg8;
s->async = 0;
reg8 = 0;
mchbar_setbits16(CSHRPDCTL, 1 << 15);
mchbar_clrbits8(CSHRPDCTL, 1 << 7);
mchbar_setbits8(CSHRPDCTL, 1 << 3);
mchbar_setbits8(CSHRPDCTL, 1 << 2);
/* Start hardware HMC calibration */
mchbar_setbits8(CSHRPDCTL, 1 << 7);
/* Busy-wait until calibration is done */
while ((mchbar_read8(CSHRPDCTL) & (1 << 2)) == 0)
;
/* If hardware HMC calibration failed */
reg8 = (mchbar_read8(CSHRPDCTL) & (1 << 3)) >> 3;
if (reg8 != 0) {
s->async = 1;
}
}
static void sdram_dlltiming(struct sysinfo *s)
{
u8 reg8, i;
u16 reg16;
u32 reg32;
/* Configure the Master DLL */
if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
reg32 = 0x08014227;
} else {
reg32 = 0x00014221;
}
mchbar_clrsetbits32(CSHRMSTRCTL1, 0x0fffffff, reg32);
mchbar_setbits32(CSHRMSTRCTL1, 1 << 23);
mchbar_setbits32(CSHRMSTRCTL1, 1 << 15);
mchbar_clrbits32(CSHRMSTRCTL1, 1 << 15);
if (s->nodll) {
/* Disable the Master DLLs by setting these bits, IN ORDER! */
mchbar_setbits16(CSHRMSTRCTL0, 1 << 0);
mchbar_setbits16(CSHRMSTRCTL0, 1 << 2);
mchbar_setbits16(CSHRMSTRCTL0, 1 << 4);
mchbar_setbits16(CSHRMSTRCTL0, 1 << 8);
mchbar_setbits16(CSHRMSTRCTL0, 1 << 10);
mchbar_setbits16(CSHRMSTRCTL0, 1 << 12);
mchbar_setbits16(CSHRMSTRCTL0, 1 << 14);
} else {
/* Enable the Master DLLs by clearing these bits, IN ORDER! */
mchbar_clrbits16(CSHRMSTRCTL0, 1 << 0);
mchbar_clrbits16(CSHRMSTRCTL0, 1 << 2);
mchbar_clrbits16(CSHRMSTRCTL0, 1 << 4);
mchbar_clrbits16(CSHRMSTRCTL0, 1 << 8);
mchbar_clrbits16(CSHRMSTRCTL0, 1 << 10);
mchbar_clrbits16(CSHRMSTRCTL0, 1 << 12);
mchbar_clrbits16(CSHRMSTRCTL0, 1 << 14);
}
/* Initialize the Transmit DLL PI values in the following sequence. */
if (s->nodll) {
mchbar_clrsetbits8(CREFPI, 0x3f, 0x07);
} else {
mchbar_clrbits8(CREFPI, 0x3f);
}
sdram_calibratepll(s, 0); // XXX check
/* Enable all modular Slave DLL */
mchbar_setbits16(C0DLLPIEN, 1 << 11);
mchbar_setbits16(C0DLLPIEN, 1 << 12);
for (i = 0; i < 8; i++) {
mchbar_setbits16(C0DLLPIEN, (1 << 10) >> i);
}
/* Enable DQ/DQS output */
mchbar_setbits8(C0SLVDLLOUTEN, 1 << 0);
mchbar_write16(CSPDSLVWT, 0x5005);
mchbar_clrsetbits16(CSHRPDCTL2, 0x1f1f, 0x051a);
mchbar_clrsetbits16(CSHRPDCTL5, 0xbf3f, 0x9010);
if (s->nodll) {
mchbar_clrsetbits8(CSHRPDCTL3, 0x7f, 0x6b);
} else {
mchbar_clrsetbits8(CSHRPDCTL3, 0x7f, 0x55);
sdram_calibratehwpll(s);
}
/* Disable Dynamic Diff Amp */
mchbar_clrbits32(C0STATRDCTRL, 1 << 22);
/* Now, start initializing the transmit FIFO */
mchbar_clrbits8(C0MISCCTL, 1 << 1);
/* Disable (gate) mdclk and mdclkb */
mchbar_setbits8(CSHWRIOBONUS, 3 << 6);
/* Select mdmclk */
mchbar_clrbits8(CSHWRIOBONUS, 1 << 5);
/* Ungate mdclk */
mchbar_clrsetbits8(CSHWRIOBONUS, 3 << 6, 1 << 6);
mchbar_clrsetbits8(CSHRFIFOCTL, 0x3f, 0x1a);
/* Enable the write pointer count */
mchbar_setbits8(CSHRFIFOCTL, 1 << 0);
/* Set the DDR3 Reset Enable bit */
mchbar_setbits8(CSHRDDR3CTL, 1 << 0);
/* Configure DQS-DQ Transmit */
mchbar_write32(CSHRDQSTXPGM, 0x00551803);
reg8 = 0; /* Switch all clocks on anyway */
/* Enable clock groups depending on rank population */
mchbar_clrsetbits32(C0CKTX, 0x3f << 24, reg8 << 24);
/* Enable DDR command output buffers from core */
mchbar_clrbits8(0x594, 1 << 0);
reg16 = 0;
if (!rank_is_populated(s->dimms, 0, 0)) {
reg16 |= (1 << 8) | (1 << 4) | (1 << 0);
}
if (!rank_is_populated(s->dimms, 0, 1)) {
reg16 |= (1 << 9) | (1 << 5) | (1 << 1);
}
if (!rank_is_populated(s->dimms, 0, 2)) {
reg16 |= (1 << 10) | (1 << 6) | (1 << 2);
}
if (!rank_is_populated(s->dimms, 0, 3)) {
reg16 |= (1 << 11) | (1 << 7) | (1 << 3);
}
mchbar_setbits16(C0CTLTX2, reg16);
}
/* Define a shorter name for these to make the lines fit in 96 characters */
#define TABLE static const
/* Loop over each RCOMP group, but skip group 1 because it does not exist */
#define FOR_EACH_RCOMP_GROUP(idx) for (idx = 0; idx < 7; idx++) if (idx != 1)
/* Define accessors for the RCOMP register banks */
#define C0RCOMPCTRLx(x) (rcompctl[(x)] + 0x00)
#define C0RCOMPMULTx(x) (rcompctl[(x)] + 0x04)
#define C0RCOMPOVRx(x) (rcompctl[(x)] + 0x06)
#define C0RCOMPOSVx(x) (rcompctl[(x)] + 0x0a)
#define C0SCOMPVREFx(x) (rcompctl[(x)] + 0x0e)
#define C0SCOMPOVRx(x) (rcompctl[(x)] + 0x10)
#define C0SCOMPOFFx(x) (rcompctl[(x)] + 0x12)
#define C0DCOMPx(x) (rcompctl[(x)] + 0x14)
#define C0SLEWBASEx(x) (rcompctl[(x)] + 0x16)
#define C0SLEWPULUTx(x) (rcompctl[(x)] + 0x18)
#define C0SLEWPDLUTx(x) (rcompctl[(x)] + 0x1c)
#define C0DCOMPOVRx(x) (rcompctl[(x)] + 0x20)
#define C0DCOMPOFFx(x) (rcompctl[(x)] + 0x24)
/* FIXME: This only applies to DDR2 */
static void sdram_rcomp(struct sysinfo *s)
{
u8 i, j, reg8, rcompp, rcompn, srup, srun;
u16 reg16;
u32 reg32, rcomp1, rcomp2;
static const u8 rcompslew = 0x0a;
static const u16 rcompctl[7] = {
C0RCOMPCTRL0,
0, /* This register does not exist */
C0RCOMPCTRL2,
C0RCOMPCTRL3,
C0RCOMPCTRL4,
C0RCOMPCTRL5,
C0RCOMPCTRL6,
};
/* RCOMP settings tables = { NC-NC, x16SS, x16DS, x16SS2, x16DS2, x8DS, x8DS2}; */
TABLE u8 rcompupdate[7] = { 0, 0, 0, 1, 1, 0, 0};
TABLE u8 rcompstr[7] = { 0x66, 0x00, 0xaa, 0x55, 0x55, 0x77, 0x77};
TABLE u16 rcompscomp[7] = {0xa22a, 0x0000, 0xe22e, 0xe22e, 0xe22e, 0xa22a, 0xa22a};
TABLE u8 rcompdelay[7] = { 1, 0, 0, 0, 0, 1, 1};
TABLE u16 rcompf[7] = {0x1114, 0x0000, 0x0505, 0x0909, 0x0909, 0x0a0a, 0x0a0a};
TABLE u8 rcompstr2[7] = { 0x00, 0x55, 0x55, 0xaa, 0xaa, 0x55, 0xaa};
TABLE u16 rcompscomp2[7] = {0x0000, 0xe22e, 0xe22e, 0xe22e, 0x8228, 0xe22e, 0x8228};
TABLE u8 rcompdelay2[7] = { 0, 0, 0, 0, 2, 0, 2};
TABLE u8 rcomplut[64][12] = {
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{ 9, 9, 11, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{10, 9, 12, 11, 2, 2, 5, 5, 6, 6, 5, 5},
{10, 9, 12, 11, 2, 2, 6, 5, 7, 6, 6, 5},
{10, 10, 12, 12, 2, 2, 6, 5, 7, 6, 6, 5},
{10, 10, 12, 12, 2, 2, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 2, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 2, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 2, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 3, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 3, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 3, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 3, 6, 6, 7, 7, 6, 6},
{10, 10, 12, 12, 3, 3, 6, 6, 7, 7, 6, 6},
{11, 10, 12, 12, 3, 3, 6, 6, 7, 7, 6, 6},
{11, 10, 14, 13, 3, 3, 6, 6, 7, 7, 6, 6},
{12, 10, 14, 13, 3, 3, 6, 6, 7, 7, 6, 6},
{12, 12, 14, 13, 3, 3, 7, 6, 7, 7, 7, 6},
{13, 12, 16, 15, 3, 3, 7, 6, 8, 7, 7, 6},
{13, 14, 16, 15, 4, 3, 7, 7, 8, 8, 7, 7},
{14, 14, 16, 17, 4, 3, 7, 7, 8, 8, 7, 7},
{14, 16, 18, 17, 4, 4, 8, 7, 8, 8, 8, 7},
{15, 16, 18, 19, 4, 4, 8, 7, 9, 8, 8, 7},
{15, 18, 18, 19, 4, 4, 8, 8, 9, 9, 8, 8},
{16, 18, 20, 21, 4, 4, 8, 8, 9, 9, 8, 8},
{16, 19, 20, 21, 5, 4, 9, 8, 10, 9, 9, 8},
{16, 19, 20, 23, 5, 5, 9, 9, 10, 10, 9, 9},
{17, 19, 22, 23, 5, 5, 9, 9, 10, 10, 9, 9},
{17, 20, 22, 25, 5, 5, 9, 9, 10, 10, 9, 9},
{17, 20, 22, 25, 5, 5, 9, 9, 10, 10, 9, 9},
{18, 20, 22, 25, 5, 5, 9, 9, 10, 10, 9, 9},
{18, 21, 24, 25, 5, 5, 9, 9, 11, 10, 9, 9},
{19, 21, 24, 27, 5, 5, 9, 9, 11, 11, 9, 9},
{19, 22, 24, 27, 5, 5, 10, 9, 11, 11, 10, 9},
{20, 22, 24, 27, 6, 5, 10, 10, 11, 11, 10, 10},
{20, 23, 26, 27, 6, 6, 10, 10, 12, 12, 10, 10},
{20, 23, 26, 29, 6, 6, 10, 10, 12, 12, 10, 10},
{21, 24, 26, 29, 6, 6, 10, 10, 12, 12, 10, 10},
{21, 24, 26, 29, 6, 6, 11, 10, 12, 13, 11, 10},
{22, 25, 28, 29, 6, 6, 11, 11, 13, 13, 11, 11},
{22, 25, 28, 31, 6, 6, 11, 11, 13, 13, 11, 11},
{22, 26, 28, 31, 6, 6, 11, 11, 13, 14, 11, 11},
{23, 26, 30, 31, 7, 6, 12, 11, 14, 14, 12, 11},
{23, 27, 30, 33, 7, 7, 12, 12, 14, 14, 12, 12},
{23, 27, 30, 33, 7, 7, 12, 12, 14, 15, 12, 12},
{24, 28, 32, 33, 7, 7, 12, 12, 15, 15, 12, 12},
{24, 28, 32, 33, 7, 7, 12, 12, 15, 16, 12, 12},
{24, 29, 32, 35, 7, 7, 12, 12, 15, 16, 12, 12},
{25, 29, 32, 35, 7, 7, 12, 12, 15, 17, 12, 12},
{25, 30, 32, 35, 7, 7, 12, 12, 15, 17, 12, 12},
{25, 30, 32, 35, 7, 7, 12, 12, 15, 17, 12, 12},
};
srup = 0;
srun = 0;
if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
rcomp1 = 0x00050431;
} else {
rcomp1 = 0x00050542;
}
if (s->selected_timings.fsb_clock == FSB_CLOCK_667MHz) {
rcomp2 = 0x14c42827;
} else {
rcomp2 = 0x19042827;
}
FOR_EACH_RCOMP_GROUP(i) {
reg8 = rcompupdate[i];
mchbar_clrsetbits8(C0RCOMPCTRLx(i), 1 << 0, reg8);
mchbar_clrbits8(C0RCOMPCTRLx(i), 1 << 1);
reg16 = rcompslew;
mchbar_clrsetbits16(C0RCOMPCTRLx(i), 0xf << 12, reg16 << 12);
mchbar_write8(C0RCOMPMULTx(i), rcompstr[i]);
mchbar_write16(C0SCOMPVREFx(i), rcompscomp[i]);
mchbar_clrsetbits8(C0DCOMPx(i), 0x03, rcompdelay[i]);
if (i == 2) {
/* FIXME: Why are we rewriting this? */
mchbar_clrsetbits16(C0RCOMPCTRLx(i), 0xf << 12, reg16 << 12);
mchbar_write8(C0RCOMPMULTx(i), rcompstr2[s->dimm_config[0]]);
mchbar_write16(C0SCOMPVREFx(i), rcompscomp2[s->dimm_config[0]]);
mchbar_clrsetbits8(C0DCOMPx(i), 0x03, rcompdelay2[s->dimm_config[0]]);
}
mchbar_clrbits16(C0SLEWBASEx(i), 0x7f7f);
/* FIXME: Why not do a single dword write? */
mchbar_clrbits16(C0SLEWPULUTx(i), 0x3f3f);
mchbar_clrbits16(C0SLEWPULUTx(i) + 2, 0x3f3f);
/* FIXME: Why not do a single dword write? */
mchbar_clrbits16(C0SLEWPDLUTx(i), 0x3f3f);
mchbar_clrbits16(C0SLEWPDLUTx(i) + 2, 0x3f3f);
}
/* FIXME: Hardcoded */
mchbar_clrsetbits8(C0ODTRECORDX, 0x3f, 0x36);
mchbar_clrsetbits8(C0DQSODTRECORDX, 0x3f, 0x36);
FOR_EACH_RCOMP_GROUP(i) {
mchbar_clrbits8(C0RCOMPCTRLx(i), 3 << 5);
mchbar_clrbits16(C0RCOMPCTRLx(i) + 2, 0x0706);
mchbar_clrbits16(C0RCOMPOSVx(i), 0x7f7f);
mchbar_clrbits16(C0SCOMPOFFx(i), 0x3f3f);
mchbar_clrbits16(C0DCOMPOFFx(i), 0x1f1f);
mchbar_clrbits8(C0DCOMPOFFx(i) + 2, 0x1f);
}
mchbar_clrbits16(C0ODTRECORDX, 0xffc0);
mchbar_clrbits16(C0ODTRECORDX + 2, 0x000f);
/* FIXME: Why not do a single dword write? */
mchbar_clrbits16(C0DQSODTRECORDX, 0xffc0);
mchbar_clrbits16(C0DQSODTRECORDX + 2, 0x000f);
FOR_EACH_RCOMP_GROUP(i) {
mchbar_write16(C0SCOMPOVRx(i), rcompf[i]);
/* FIXME: Why not do a single dword write? */
mchbar_write16(C0DCOMPOVRx(i) + 0, 0x1219);
mchbar_write16(C0DCOMPOVRx(i) + 2, 0x000c);
}
mchbar_clrsetbits32(DCMEASBUFOVR, 0x001f1f1f, 0x000c1219);
/* FIXME: Why not do a single word write? */
mchbar_clrsetbits16(XCOMPSDR0BNS, 0x1f << 8, 0x12 << 8);
mchbar_clrsetbits8(XCOMPSDR0BNS, 0x1f << 0, 0x12 << 0);
mchbar_write32(COMPCTRL3, 0x007c9007);
mchbar_write32(OFREQDELSEL, rcomp1);
mchbar_write16(XCOMPCMNBNS, 0x1f7f);
mchbar_write32(COMPCTRL2, rcomp2);
mchbar_clrsetbits16(XCOMPDFCTRL, 0xf, 1);
mchbar_write16(ZQCALCTRL, 0x0134);
mchbar_write32(COMPCTRL1, 0x4c293600);
mchbar_clrsetbits8(COMPCTRL1 + 3, 0x44, 1 << 6 | 1 << 2);
mchbar_clrbits16(XCOMPSDR0BNS, 1 << 13);
mchbar_clrbits8(XCOMPSDR0BNS, 1 << 5);
FOR_EACH_RCOMP_GROUP(i) {
/* POR values are zero */
mchbar_clrbits8(C0RCOMPCTRLx(i) + 2, 0x71);
}
if ((mchbar_read32(COMPCTRL1) & (1 << 30)) == 0) {
/* Start COMP */
mchbar_setbits8(COMPCTRL1, 1 << 0);
/* Wait until COMP is done */
while ((mchbar_read8(COMPCTRL1) & 1) != 0)
;
reg32 = mchbar_read32(XCOMP);
rcompp = (u8)((reg32 & ~(1 << 31)) >> 24);
rcompn = (u8)((reg32 & ~(0xff800000)) >> 16);
FOR_EACH_RCOMP_GROUP(i) {
srup = (mchbar_read8(C0RCOMPCTRLx(i) + 1) & 0xc0) >> 6;
srun = (mchbar_read8(C0RCOMPCTRLx(i) + 1) & 0x30) >> 4;
/* FIXME: Why not do a single word write? */
reg16 = (u16)(rcompp - (1 << (srup + 1))) << 8;
mchbar_clrsetbits16(C0SLEWBASEx(i), 0x7f << 8, reg16);
reg16 = (u16)(rcompn - (1 << (srun + 1)));
mchbar_clrsetbits8(C0SLEWBASEx(i), 0x7f, (u8)reg16);
}
reg8 = rcompp - (1 << (srup + 1));
for (i = 0, j = reg8; i < 4; i++, j += (1 << srup)) {
mchbar_clrsetbits8(C0SLEWPULUTx(0) + i, 0x3f, rcomplut[j][0]);
}
for (i = 0, j = reg8; i < 4; i++, j += (1 << srup)) {
if (s->dimm_config[0] < 3 || s->dimm_config[0] == 5) {
mchbar_clrsetbits8(C0SLEWPULUTx(2) + i, 0x3f, rcomplut[j][10]);
}
}
for (i = 0, j = reg8; i < 4; i++, j += (1 << srup)) {
mchbar_clrsetbits8(C0SLEWPULUTx(3) + i, 0x3f, rcomplut[j][6]);
mchbar_clrsetbits8(C0SLEWPULUTx(4) + i, 0x3f, rcomplut[j][6]);
}
for (i = 0, j = reg8; i < 4; i++, j += (1 << srup)) {
mchbar_clrsetbits8(C0SLEWPULUTx(5) + i, 0x3f, rcomplut[j][8]);
mchbar_clrsetbits8(C0SLEWPULUTx(6) + i, 0x3f, rcomplut[j][8]);
}
reg8 = rcompn - (1 << (srun + 1));
for (i = 0, j = reg8; i < 4; i++, j += (1 << srun)) {
mchbar_clrsetbits8(C0SLEWPDLUTx(0) + i, 0x3f, rcomplut[j][1]);
}
for (i = 0, j = reg8; i < 4; i++, j += (1 << srun)) {
if (s->dimm_config[0] < 3 || s->dimm_config[0] == 5) {
mchbar_clrsetbits8(C0SLEWPDLUTx(2) + i, 0x3f, rcomplut[j][11]);
}
}
for (i = 0, j = reg8; i < 4; i++, j += (1 << srun)) {
mchbar_clrsetbits8(C0SLEWPDLUTx(3) + i, 0x3f, rcomplut[j][7]);
mchbar_clrsetbits8(C0SLEWPDLUTx(4) + i, 0x3f, rcomplut[j][7]);
}
for (i = 0, j = reg8; i < 4; i++, j += (1 << srun)) {
mchbar_clrsetbits8(C0SLEWPDLUTx(5) + i, 0x3f, rcomplut[j][9]);
mchbar_clrsetbits8(C0SLEWPDLUTx(6) + i, 0x3f, rcomplut[j][9]);
}
}
mchbar_setbits8(COMPCTRL1, 1 << 0);
}
/* FIXME: The ODT tables are for DDR2 only! */
static void sdram_odt(struct sysinfo *s)
{
u8 rankindex = 0;
static const u16 odt_rankctrl[16] = {
/* NC_NC, 1R_NC, NV, 2R_NC, NC_1R, 1R_1R, NV, 2R_1R, */
0x0000, 0x0000, 0x0000, 0x0000, 0x0044, 0x1111, 0x0000, 0x1111,
/* NV, NV, NV, NV, NC_2R, 1R_2R, NV, 2R_2R, */
0x0000, 0x0000, 0x0000, 0x0000, 0x0044, 0x1111, 0x0000, 0x1111,
};
static const u16 odt_matrix[16] = {
/* NC_NC, 1R_NC, NV, 2R_NC, NC_1R, 1R_1R, NV, 2R_1R, */
0x0000, 0x0011, 0x0000, 0x0011, 0x0000, 0x4444, 0x0000, 0x4444,
/* NV, NV, NV, NV, NC_2R, 1R_2R, NV, 2R_2R, */
0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x4444, 0x0000, 0x4444,
};
switch (s->dimms[0].ranks) {
case 0:
if (s->dimms[1].ranks == 0) {
rankindex = 0;
} else if (s->dimms[1].ranks == 1) {
rankindex = 4;
} else if (s->dimms[1].ranks == 2) {
rankindex = 12;
}
break;
case 1:
if (s->dimms[1].ranks == 0) {
rankindex = 1;
} else if (s->dimms[1].ranks == 1) {
rankindex = 5;
} else if (s->dimms[1].ranks == 2) {
rankindex = 13;
}
break;
case 2:
if (s->dimms[1].ranks == 0) {
rankindex = 3;
} else if (s->dimms[1].ranks == 1) {
rankindex = 7;
} else if (s->dimms[1].ranks == 2) {
rankindex = 15;
}
break;
}
/* Program the ODT Matrix */
mchbar_write16(C0ODT, odt_matrix[rankindex]);
/* Program the ODT Rank Control */
mchbar_write16(C0ODTRKCTRL, odt_rankctrl[rankindex]);
}
static void sdram_mmap(struct sysinfo *s)
{
TABLE u32 w260[7] = {0, 0x400001, 0xc00001, 0x500000, 0xf00000, 0xc00001, 0xf00000};
TABLE u32 w208[7] = {0, 0x10000, 0x1010000, 0x10001, 0x1010101, 0x1010000, 0x1010101};
TABLE u32 w200[7] = {0, 0, 0, 0x20002, 0x40002, 0, 0x40002};
TABLE u32 w204[7] = {0, 0x20002, 0x40002, 0x40004, 0x80006, 0x40002, 0x80006};
TABLE u16 tolud[7] = {2048, 2048, 4096, 4096, 8192, 4096, 8192};
TABLE u16 tom[7] = { 2, 2, 4, 4, 8, 4, 8};
TABLE u16 touud[7] = { 128, 128, 256, 256, 512, 256, 512};
TABLE u32 gbsm[7] = {1 << 27, 1 << 27, 1 << 28, 1 << 27, 1 << 29, 1 << 28, 1 << 29};
TABLE u32 bgsm[7] = {1 << 27, 1 << 27, 1 << 28, 1 << 27, 1 << 29, 1 << 28, 1 << 29};
TABLE u32 tsegmb[7] = {1 << 27, 1 << 27, 1 << 28, 1 << 27, 1 << 29, 1 << 28, 1 << 29};
if ((s->dimm_config[0] < 3) && rank_is_populated(s->dimms, 0, 0)) {
if (s->dimms[0].sides > 1) {
// 2R/NC
mchbar_clrsetbits32(C0CKECTRL, 1, 0x300001);
mchbar_write32(C0DRA01, 0x00000101);
mchbar_write32(C0DRB0, 0x00040002);
mchbar_write32(C0DRB2, w204[s->dimm_config[0]]);
} else {
// 1R/NC
mchbar_clrsetbits32(C0CKECTRL, 1, 0x100001);
mchbar_write32(C0DRA01, 0x00000001);
mchbar_write32(C0DRB0, 0x00020002);
mchbar_write32(C0DRB2, w204[s->dimm_config[0]]);
}
} else if ((s->dimm_config[0] == 5) && rank_is_populated(s->dimms, 0, 0)) {
mchbar_clrsetbits32(C0CKECTRL, 1, 0x300001);
mchbar_write32(C0DRA01, 0x00000101);
mchbar_write32(C0DRB0, 0x00040002);
mchbar_write32(C0DRB2, 0x00040004);
} else {
mchbar_clrsetbits32(C0CKECTRL, 1, w260[s->dimm_config[0]]);
mchbar_write32(C0DRA01, w208[s->dimm_config[0]]);
mchbar_write32(C0DRB0, w200[s->dimm_config[0]]);
mchbar_write32(C0DRB2, w204[s->dimm_config[0]]);
}
pci_write_config16(HOST_BRIDGE, 0xb0, tolud[s->dimm_config[0]]);
pci_write_config16(HOST_BRIDGE, 0xa0, tom[s->dimm_config[0]]);
pci_write_config16(HOST_BRIDGE, 0xa2, touud[s->dimm_config[0]]);
pci_write_config32(HOST_BRIDGE, 0xa4, gbsm[s->dimm_config[0]]);
pci_write_config32(HOST_BRIDGE, 0xa8, bgsm[s->dimm_config[0]]);
pci_write_config32(HOST_BRIDGE, 0xac, tsegmb[s->dimm_config[0]]);
}
static u8 sdram_checkrcompoverride(void)
{
u32 xcomp;
u8 aa, bb, a, b, c, d;
xcomp = mchbar_read32(XCOMP);
a = (u8)((xcomp & 0x7f000000) >> 24);
b = (u8)((xcomp & 0x007f0000) >> 16);
c = (u8)((xcomp & 0x00003f00) >> 8);
d = (u8)((xcomp & 0x0000003f) >> 0);
if (a > b) {
aa = a - b;
} else {
aa = b - a;
}
if (c > d) {
bb = c - d;
} else {
bb = d - c;
}
if ((aa > 18) || (bb > 7) || (a <= 5) || (b <= 5) || (c <= 5) || (d <= 5) ||
(a >= 0x7a) || (b >= 0x7a) || (c >= 0x3a) || (d >= 0x3a)) {
mchbar_write32(RCMEASBUFXOVR, 0x9718a729);
return 1;
}
return 0;
}
static void sdram_rcompupdate(struct sysinfo *s)
{
u8 i, ok;
u32 reg32a, reg32b;
ok = 0;
mchbar_clrbits8(XCOMPDFCTRL, 1 << 3);
mchbar_clrbits8(COMPCTRL1, 1 << 7);
for (i = 0; i < 3; i++) {
mchbar_setbits8(COMPCTRL1, 1 << 0);
hpet_udelay(1000);
while ((mchbar_read8(COMPCTRL1) & 1) != 0)
;
ok |= sdram_checkrcompoverride();
}
if (!ok) {
reg32a = mchbar_read32(XCOMP);
reg32b = ((reg32a >> 16) & 0x0000ffff);
reg32a = ((reg32a << 16) & 0xffff0000) | reg32b;
reg32a |= (1 << 31) | (1 << 15);
mchbar_write32(RCMEASBUFXOVR, reg32a);
}
mchbar_setbits8(COMPCTRL1, 1 << 0);
hpet_udelay(1000);
while ((mchbar_read8(COMPCTRL1) & 1) != 0)
;
}
static void __attribute__((noinline))
sdram_jedec(struct sysinfo *s, u8 rank, u8 jmode, u16 jval)
{
u32 reg32;
reg32 = jval << 3;
reg32 |= rank * (1 << 27);
mchbar_clrsetbits8(C0JEDEC, 0x3e, jmode);
read32p(reg32);
barrier();
hpet_udelay(1); // 1us
}
static void sdram_zqcl(struct sysinfo *s)
{
if (s->boot_path == BOOT_PATH_RESUME) {
mchbar_setbits32(C0CKECTRL, 1 << 27);
mchbar_clrsetbits8(C0JEDEC, 0x0e, NORMAL_OP_CMD);
mchbar_clrbits8(C0JEDEC, 3 << 4);
mchbar_clrsetbits32(C0REFRCTRL2, 3 << 30, 3 << 30);
}
}
static void sdram_jedecinit(struct sysinfo *s)
{
u8 r, i, ch;
u16 reg16, mrs, rttnom;
struct jedeclist {
char debug[15];
u8 cmd;
u16 val;
};
static const struct jedeclist jedec[12] = {
{ " NOP ", NOP_CMD, 0 },
{ " PRE CHARGE ", PRE_CHARGE_CMD, 0 },
{ " EMRS2 ", EMRS2_CMD, 0 },
{ " EMRS3 ", EMRS3_CMD, 0 },
{ " EMRS1 ", EMRS1_CMD, 0 },
{ " DLL RESET ", MRS_CMD, (1 << 8) },
{ " PRE CHARGE ", PRE_CHARGE_CMD, 0 },
{ " AUTOREFRESH", CBR_CMD, 0 },
{ " AUTOREFRESH", CBR_CMD, 0 },
{ " INITIALISE ", MRS_CMD, 0 },
{ " EMRS1 OCD ", EMRS1_CMD, (1 << 9) | (1 << 8) | (1 << 7) },
{ " EMRS1 EXIT ", EMRS1_CMD, 0 }
};
mrs = (s->selected_timings.CAS << 4) |
((s->selected_timings.tWR - 1) << 9) | (1 << 3) | (1 << 1) | 3;
rttnom = (1 << 2);
if (rank_is_populated(s->dimms, 0, 0) && rank_is_populated(s->dimms, 0, 2)) {
rttnom |= (1 << 6);
}
hpet_udelay(200); // 200us
reg16 = 0;
FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
for (i = 0; i < 12; i++) {
PRINTK_DEBUG("Rank:%d Jedec:%14s...", r, jedec[i].debug);
reg16 = jedec[i].val;
switch (jedec[i].cmd) {
case EMRS1_CMD:
reg16 |= rttnom;
break;
case MRS_CMD:
reg16 |= mrs;
break;
default:
break;
}
sdram_jedec(s, r, jedec[i].cmd, reg16);
PRINTK_DEBUG("done\n");
}
}
}
static void sdram_misc(struct sysinfo *s)
{
u32 reg32;
reg32 = 0;
reg32 |= (4 << 13);
reg32 |= (6 << 8);
mchbar_clrsetbits32(C0DYNRDCTRL, 0x3ff << 8, reg32);
mchbar_clrbits8(C0DYNRDCTRL, 1 << 7);
mchbar_setbits8(C0REFRCTRL + 3, 1 << 0);
if (s->boot_path != BOOT_PATH_RESUME) {
mchbar_clrsetbits8(C0JEDEC, 0x0e, NORMAL_OP_CMD);
mchbar_clrbits8(C0JEDEC, 3 << 4);
} else {
sdram_zqcl(s);
}
}
static void sdram_checkreset(void)
{
u8 pmcon2, pmcon3, reset;
pmcon2 = pci_read_config8(PCI_DEV(0, 0x1f, 0), 0xa2);
pmcon3 = pci_read_config8(PCI_DEV(0, 0x1f, 0), 0xa4);
pmcon3 &= ~0x2;
if (pmcon2 & 0x80) {
pmcon2 &= ~0x80;
reset = 1;
} else {
pmcon2 |= 0x80;
reset = 0;
}
if (pmcon2 & 0x4) {
pmcon2 |= 0x4;
pmcon3 = (pmcon3 & ~0x30) | 0x30;
pmcon3 |= (1 << 3);
}
pci_write_config8(PCI_DEV(0, 0x1f, 0), 0xa2, pmcon2);
pci_write_config8(PCI_DEV(0, 0x1f, 0), 0xa4, pmcon3);
if (reset)
full_reset();
}
static void sdram_dradrb(struct sysinfo *s)
{
u8 i, reg8, ch, r;
u32 reg32, ind, c0dra, c0drb, dra;
u16 addr;
i = 0;
static const u8 dratab[2][2][2][4] =
{{
{
{0xff, 0xff, 0xff, 0xff},
{0xff, 0x00, 0x02, 0xff}
},
{
{0xff, 0x01, 0xff, 0xff},
{0xff, 0x03, 0xff, 0x06}
}
},
{
{
{0xff, 0xff, 0xff, 0xff},
{0xff, 0x04, 0x06, 0x08}
},
{
{0xff, 0xff, 0xff, 0xff},
{0x05, 0x07, 0x09, 0xff}
}
}};
static const u8 dradrb[10][6] = {
//Row Col Bank Width DRB
{0x01, 0x01, 0x00, 0x08, 0, 0x04},
{0x01, 0x00, 0x00, 0x10, 0, 0x02},
{0x02, 0x01, 0x00, 0x08, 1, 0x08},
{0x01, 0x01, 0x00, 0x10, 1, 0x04},
{0x01, 0x01, 0x01, 0x08, 1, 0x08},
{0x00, 0x01, 0x01, 0x10, 1, 0x04},
{0x02, 0x01, 0x01, 0x08, 2, 0x10},
{0x01, 0x01, 0x01, 0x10, 2, 0x08},
{0x03, 0x01, 0x01, 0x08, 3, 0x20},
{0x02, 0x01, 0x01, 0x10, 3, 0x10},
};
reg32 = 0;
FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
i = r / 2;
PRINTK_DEBUG("RANK %d PRESENT\n", r);
dra = dratab
[s->dimms[i].banks]
[s->dimms[i].width]
[s->dimms[i].cols - 9]
[s->dimms[i].rows - 12];
if (s->dimms[i].banks == 1) {
dra |= (1 << 7);
}
reg32 |= (dra << (r * 8));
}
mchbar_write32(C0DRA01, reg32);
c0dra = reg32;
PRINTK_DEBUG("C0DRA = 0x%08x\n", c0dra);
reg32 = 0;
FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
reg32 |= (1 << r);
}
reg8 = (u8)(reg32 << 4) & 0xf0;
mchbar_clrsetbits8(C0CKECTRL + 2, 0xf0, reg8);
if (ONLY_DIMMA_IS_POPULATED(s->dimms, 0) || ONLY_DIMMB_IS_POPULATED(s->dimms, 0)) {
mchbar_setbits8(C0CKECTRL, 1 << 0);
}
addr = C0DRB0;
c0drb = 0;
FOR_EACH_RANK(ch, r) {
if (rank_is_populated(s->dimms, ch, r)) {
ind = (c0dra >> (8 * r)) & 0x7f;
c0drb = (u16)(c0drb + dradrb[ind][5]);
s->channel_capacity[0] += dradrb[ind][5] << 6;
}
mchbar_write16(addr, c0drb);
addr += 2;
}
printk(BIOS_DEBUG, "Total memory = %dMB\n", s->channel_capacity[0]);
}
static u8 sampledqs(u32 dqshighaddr, u32 strobeaddr, u8 highlow, u8 count)
{
u8 dqsmatches = 1;
while (count--) {
mchbar_clrbits8(C0RSTCTL, 1 << 1);
hpet_udelay(1);
mchbar_setbits8(C0RSTCTL, 1 << 1);
hpet_udelay(1);
barrier();
read32p(strobeaddr);
barrier();
hpet_udelay(1);
if (((mchbar_read8(dqshighaddr) & (1 << 6)) >> 6) != highlow) {
dqsmatches = 0;
}
}
return dqsmatches;
}
static void rcvenclock(u8 *coarse, u8 *medium, u8 lane)
{
if (*medium < 3) {
(*medium)++;
mchbar_clrsetbits16(C0RCVMISCCTL2, 3 << (lane * 2), *medium << (lane * 2));
} else {
*medium = 0;
(*coarse)++;
mchbar_clrsetbits32(C0STATRDCTRL, 0xf << 16, *coarse << 16);
mchbar_clrsetbits16(C0RCVMISCCTL2, 3 << (lane * 2), *medium << (lane * 2));
}
}
static void sdram_rcven(struct sysinfo *s)
{
u8 coarse, savecoarse;
u8 medium, savemedium;
u8 pi, savepi;
u8 lane;
u8 lanecoarse[8] = {0};
u8 minlanecoarse = 0xff;
u8 offset;
u8 maxlane = 8;
/* Since dra/drb is already set up we know that at address 0x00000000
we will always find the first available rank */
u32 strobeaddr = 0;
u32 dqshighaddr;
mchbar_clrbits8(C0RSTCTL, 3 << 2);
mchbar_clrbits8(CMNDQFIFORST, 1 << 7);
PRINTK_DEBUG("rcven 0\n");
for (lane = 0; lane < maxlane; lane++) {
PRINTK_DEBUG("rcven lane %d\n", lane);
// trylaneagain:
dqshighaddr = C0MISCCTLy(lane);
coarse = s->selected_timings.CAS + 1;
pi = 0;
medium = 0;
mchbar_clrsetbits32(C0STATRDCTRL, 0xf << 16, coarse << 16);
mchbar_clrsetbits16(C0RCVMISCCTL2, 3 << (lane * 2), medium << (lane * 2));
mchbar_clrbits8(C0RXRCVyDLL(lane), 0x3f);
savecoarse = coarse;
savemedium = medium;
savepi = pi;
PRINTK_DEBUG("rcven 0.1\n");
// XXX comment out
// mchbar_clrsetbits16(C0RCVMISCCTL1, 3 << (lane * 2), 1 << (lane * 2));
while (sampledqs(dqshighaddr, strobeaddr, 0, 3) == 0) {
// printk(BIOS_DEBUG, "coarse=%d medium=%d\n", coarse, medium);
rcvenclock(&coarse, &medium, lane);
if (coarse > 0xf) {
PRINTK_DEBUG("Error: coarse > 0xf\n");
// goto trylaneagain;
break;
}
}
PRINTK_DEBUG("rcven 0.2\n");
savecoarse = coarse;
savemedium = medium;
rcvenclock(&coarse, &medium, lane);
while (sampledqs(dqshighaddr, strobeaddr, 1, 3) == 0) {
savecoarse = coarse;
savemedium = medium;
rcvenclock(&coarse, &medium, lane);
if (coarse > 0xf) {
PRINTK_DEBUG("Error: coarse > 0xf\n");
//goto trylaneagain;
break;
}
}
PRINTK_DEBUG("rcven 0.3\n");
coarse = savecoarse;
medium = savemedium;
mchbar_clrsetbits32(C0STATRDCTRL, 0xf << 16, coarse << 16);
mchbar_clrsetbits16(C0RCVMISCCTL2, 3 << (lane * 2), medium << (lane * 2));
while (sampledqs(dqshighaddr, strobeaddr, 1, 3) == 0) {
savepi = pi;
pi++;
if (pi > s->maxpi) {
// if (s->nodll) {
pi = savepi = s->maxpi;
break;
// }
}
mchbar_clrsetbits8(C0RXRCVyDLL(lane), 0x3f, pi << s->pioffset);
}
PRINTK_DEBUG("rcven 0.4\n");
pi = savepi;
mchbar_clrsetbits8(C0RXRCVyDLL(lane), 0x3f, pi << s->pioffset);
rcvenclock(&coarse, &medium, lane);
if (sampledqs(dqshighaddr, strobeaddr, 1, 1) == 0) {
PRINTK_DEBUG("Error: DQS not high\n");
// goto trylaneagain;
}
PRINTK_DEBUG("rcven 0.5\n");
while (sampledqs(dqshighaddr, strobeaddr, 0, 3) == 0) {
coarse--;
mchbar_clrsetbits32(C0STATRDCTRL, 0xf << 16, coarse << 16);
if (coarse == 0) {
PRINTK_DEBUG("Error: DQS did not hit 0\n");
break;
}
}
PRINTK_DEBUG("rcven 0.6\n");
rcvenclock(&coarse, &medium, lane);
s->pi[lane] = pi;
lanecoarse[lane] = coarse;
}
PRINTK_DEBUG("rcven 1\n");
lane = maxlane;
do {
lane--;
if (minlanecoarse > lanecoarse[lane]) {
minlanecoarse = lanecoarse[lane];
}
} while (lane != 0);
lane = maxlane;
do {
lane--;
offset = lanecoarse[lane] - minlanecoarse;
mchbar_clrsetbits16(C0COARSEDLY0, 3 << (lane * 2), offset << (lane * 2));
} while (lane != 0);
mchbar_clrsetbits32(C0STATRDCTRL, 0xf << 16, minlanecoarse << 16);
s->coarsectrl = minlanecoarse;
s->coarsedelay = mchbar_read16(C0COARSEDLY0);
s->mediumphase = mchbar_read16(C0RCVMISCCTL2);
s->readptrdelay = mchbar_read16(C0RCVMISCCTL1);
PRINTK_DEBUG("rcven 2\n");
mchbar_clrbits8(C0RSTCTL, 7 << 1);
mchbar_setbits8(C0RSTCTL, 1 << 1);
mchbar_setbits8(C0RSTCTL, 1 << 2);
mchbar_setbits8(C0RSTCTL, 1 << 3);
mchbar_setbits8(CMNDQFIFORST, 1 << 7);
mchbar_clrbits8(CMNDQFIFORST, 1 << 7);
mchbar_setbits8(CMNDQFIFORST, 1 << 7);
PRINTK_DEBUG("rcven 3\n");
}
/* NOTE: Unless otherwise specified, the values are expressed in MiB */
static void sdram_mmap_regs(struct sysinfo *s)
{
bool reclaim;
u32 mmiosize, tom, tolud, touud, reclaimbase, reclaimlimit;
u32 gfxbase, gfxsize, gttbase, gttsize, tsegbase, tsegsize;
u16 ggc;
u16 ggc_to_uma[10] = {0, 1, 4, 8, 16, 32, 48, 64, 128, 256};
u8 ggc_to_gtt[4] = {0, 1, 0, 0};
reclaimbase = 0;
reclaimlimit = 0;
ggc = pci_read_config16(HOST_BRIDGE, GGC);
printk(BIOS_DEBUG, "GGC = 0x%04x\n", ggc);
gfxsize = ggc_to_uma[(ggc & 0x00f0) >> 4];
gttsize = ggc_to_gtt[(ggc & 0x0300) >> 8];
tom = s->channel_capacity[0];
/* With GTT always being 1M, TSEG 1M is the only setting that can
be covered by SMRR which has alignment requirements. */
tsegsize = 1;
mmiosize = 1024;
reclaim = false;
tolud = MIN(4096 - mmiosize, tom);
if ((tom - tolud) > 64) {
reclaim = true;
}
if (reclaim) {
tolud = tolud & ~0x3f;
tom = tom & ~0x3f;
reclaimbase = MAX(4096, tom);
reclaimlimit = reclaimbase + (MIN(4096, tom) - tolud) - 0x40;
}
touud = tom;
if (reclaim) {
touud = reclaimlimit + 64;
}
gfxbase = tolud - gfxsize;
gttbase = gfxbase - gttsize;
tsegbase = gttbase - tsegsize;
/* Program the regs */
pci_write_config16(HOST_BRIDGE, TOLUD, (u16)(tolud << 4));
pci_write_config16(HOST_BRIDGE, TOM, (u16)(tom >> 6));
if (reclaim) {
pci_write_config16(HOST_BRIDGE, 0x98, (u16)(reclaimbase >> 6));
pci_write_config16(HOST_BRIDGE, 0x9a, (u16)(reclaimlimit >> 6));
}
pci_write_config16(HOST_BRIDGE, TOUUD, (u16)(touud));
pci_write_config32(HOST_BRIDGE, GBSM, gfxbase << 20);
pci_write_config32(HOST_BRIDGE, BGSM, gttbase << 20);
pci_write_config32(HOST_BRIDGE, TSEG, tsegbase << 20);
u8 reg8 = pci_read_config8(HOST_BRIDGE, ESMRAMC);
reg8 &= ~0x07;
reg8 |= (0 << 1) | (1 << 0); /* 1M and TSEG_Enable */
pci_write_config8(HOST_BRIDGE, ESMRAMC, reg8);
printk(BIOS_DEBUG, "GBSM (igd) = verified %08x (written %08x)\n",
pci_read_config32(HOST_BRIDGE, GBSM), gfxbase << 20);
printk(BIOS_DEBUG, "BGSM (gtt) = verified %08x (written %08x)\n",
pci_read_config32(HOST_BRIDGE, BGSM), gttbase << 20);
printk(BIOS_DEBUG, "TSEG (smm) = verified %08x (written %08x)\n",
pci_read_config32(HOST_BRIDGE, TSEG), tsegbase << 20);
}
static void sdram_enhancedmode(struct sysinfo *s)
{
u8 reg8, ch, r, fsb_freq, ddr_freq;
u32 mask32, reg32;
mchbar_setbits8(C0ADDCSCTRL, 1 << 0);
mchbar_setbits8(C0REFRCTRL + 3, 1 << 0);
mask32 = (0x1f << 15) | (0x1f << 10) | (0x1f << 5) | 0x1f;
reg32 = (0x1e << 15) | (0x10 << 10) | (0x1e << 5) | 0x10;
mchbar_clrsetbits32(WRWMCONFIG, mask32, reg32);
mchbar_write8(C0DITCTRL + 1, 2);
mchbar_write16(C0DITCTRL + 2, 0x0804);
mchbar_write16(C0DITCTRL + 4, 0x2010);
mchbar_write8(C0DITCTRL + 6, 0x40);
mchbar_write16(C0DITCTRL + 8, 0x091c);
mchbar_write8(C0DITCTRL + 10, 0xf2);
mchbar_setbits8(C0BYPCTRL, 1 << 0);
mchbar_setbits8(C0CWBCTRL, 1 << 0);
mchbar_setbits16(C0ARBSPL, 1 << 8);
pci_or_config8(HOST_BRIDGE, 0xf0, 1);
mchbar_write32(SBCTL, 0x00000002);
mchbar_write32(SBCTL2, 0x20310002);
mchbar_write32(SLIMCFGTMG, 0x02020302);
mchbar_write32(HIT0, 0x001f1806);
mchbar_write32(HIT1, 0x01102800);
mchbar_write32(HIT2, 0x07000000);
mchbar_write32(HIT3, 0x01014010);
mchbar_write32(HIT4, 0x0f038000);
pci_and_config8(HOST_BRIDGE, 0xf0, ~1);
u32 nranks, curranksize, maxranksize, dra;
u8 rankmismatch;
static const u8 drbtab[10] = {0x4, 0x2, 0x8, 0x4, 0x8, 0x4, 0x10, 0x8, 0x20, 0x10};
nranks = 0;
curranksize = 0;
maxranksize = 0;
rankmismatch = 0;
FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
nranks++;
dra = (u8)((mchbar_read32(C0DRA01) >> (8 * r)) & 0x7f);
curranksize = drbtab[dra];
if (maxranksize == 0) {
maxranksize = curranksize;
}
if (curranksize != maxranksize) {
rankmismatch = 1;
}
}
reg8 = 0;
switch (nranks) {
case 4:
if (rankmismatch) {
reg8 = 0x64;
} else {
reg8 = 0xa4;
}
break;
case 1:
case 3:
reg8 = 0x64;
break;
case 2:
if (rankmismatch) {
reg8 = 0x64;
} else {
reg8 = 0x24;
}
break;
default:
die("Invalid number of ranks found, halt\n");
break;
}
mchbar_clrsetbits8(CHDECMISC, 0xfc, reg8 & 0xfc);
mchbar_clrbits32(NOACFGBUSCTL, 1 << 31);
mchbar_write32(HTBONUS0, 0xf);
mchbar_setbits8(C0COREBONUS + 4, 1 << 0);
mchbar_clrbits32(HIT3, 7 << 25);
mchbar_clrsetbits32(HIT4, 3 << 18, 1 << 18);
u32 clkcx[2][2][3] = {
{
{0x00000000, 0x0c080302, 0x08010204}, /* FSB = 667, DDR = 667 */
{0x02040000, 0x08100102, 0x00000000}, /* FSB = 667, DDR = 800 */
},
{
{0x18000000, 0x3021060c, 0x20010208}, /* FSB = 800, DDR = 667 */
{0x00000000, 0x0c090306, 0x00000000}, /* FSB = 800, DDR = 800 */
}
};
fsb_freq = s->selected_timings.fsb_clock;
ddr_freq = s->selected_timings.mem_clock;
mchbar_write32(CLKXSSH2X2MD + 0, clkcx[fsb_freq][ddr_freq][0]);
mchbar_write32(CLKXSSH2X2MD + 4, clkcx[fsb_freq][ddr_freq][1]);
mchbar_write32(CLKXSSH2MCBYP + 4, clkcx[fsb_freq][ddr_freq][2]);
mchbar_clrbits8(HIT4, 1 << 1);
}
static void sdram_periodic_rcomp(void)
{
mchbar_clrbits8(COMPCTRL1, 1 << 1);
while ((mchbar_read32(COMPCTRL1) & (1 << 31)) > 0) {
;
}
mchbar_clrbits16(CSHRMISCCTL, 3 << 12);
mchbar_setbits8(CMNDQFIFORST, 1 << 7);
mchbar_clrsetbits16(XCOMPDFCTRL, 0x0f, 0x09);
mchbar_setbits8(COMPCTRL1, 1 << 7 | 1 << 1);
}
static void sdram_new_trd(struct sysinfo *s)
{
u8 pidelay, i, j, k, cc, trd_perphase[5];
u8 bypass, freqgb, trd, reg8, txfifo;
u32 reg32, datadelay, tio, rcvendelay, maxrcvendelay;
u16 tmclk, thclk, buffertocore, postcalib;
static const u8 txfifo_lut[8] = { 0, 7, 6, 5, 2, 1, 4, 3 };
static const u16 trd_adjust[2][2][5] = {
{
{3000, 3000, 0,0,0},
{1000,2000,3000,1500,2500}
},
{
{2000,1000,3000,0,0},
{2500, 2500, 0,0,0}
}};
freqgb = 110;
buffertocore = 5000;
postcalib = (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) ? 1250 : 500;
tmclk = (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) ? 3000 : 2500;
tmclk = tmclk * 100 / freqgb;
thclk = (s->selected_timings.fsb_clock == FSB_CLOCK_667MHz) ? 6000 : 5000;
switch (s->selected_timings.mem_clock) {
case MEM_CLOCK_667MHz:
if (s->selected_timings.fsb_clock == FSB_CLOCK_667MHz) {
cc = 2;
} else {
cc = 3;
}
break;
default:
case MEM_CLOCK_800MHz:
if (s->selected_timings.fsb_clock == FSB_CLOCK_667MHz) {
cc = 5;
} else {
cc = 2;
}
break;
}
tio = (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) ? 2700 : 3240;
maxrcvendelay = 0;
pidelay = (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) ? 24 : 20;
for (i = 0; i < 8; i++) {
rcvendelay = ((u32)((s->coarsedelay >> (i << 1)) & 3) * (u32)(tmclk));
rcvendelay += ((u32)((s->readptrdelay >> (i << 1)) & 3) * (u32)(tmclk) / 2);
rcvendelay += ((u32)((s->mediumphase >> (i << 1)) & 3) * (u32)(tmclk) / 4);
rcvendelay += (u32)(pidelay * s->pi[i]);
maxrcvendelay = MAX(maxrcvendelay, rcvendelay);
}
if ((mchbar_read8(HMBYPCP + 3) == 0xff) && (mchbar_read8(HMCCMC) & (1 << 7))) {
bypass = 1;
} else {
bypass = 0;
}
txfifo = 0;
reg8 = (mchbar_read8(CSHRFIFOCTL) & 0x0e) >> 1;
txfifo = txfifo_lut[reg8] & 0x07;
datadelay = tmclk * (2*txfifo + 4*s->coarsectrl + 4*(bypass-1) + 13) / 4
+ tio + maxrcvendelay + pidelay + buffertocore + postcalib;
if (s->async) {
datadelay += tmclk / 2;
}
j = (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) ? 0 : 1;
k = (s->selected_timings.fsb_clock == FSB_CLOCK_667MHz) ? 0 : 1;
if (j == 0 && k == 0) {
datadelay -= 3084;
}
trd = 0;
for (i = 0; i < cc; i++) {
reg32 = datadelay - (trd_adjust[k][j][i] * 100 / freqgb);
trd_perphase[i] = (u8)(reg32 / thclk) - 2;
trd_perphase[i] += 1;
if (trd_perphase[i] > trd) {
trd = trd_perphase[i];
}
}
mchbar_clrsetbits16(C0STATRDCTRL, 0x1f << 8, trd << 8);
}
static void sdram_powersettings(struct sysinfo *s)
{
u8 j;
u32 reg32;
/* Thermal sensor */
mchbar_write8(TSC1, 0x9b);
mchbar_clrsetbits32(TSTTP, 0x00ffffff, 0x1d00);
mchbar_write8(THERM1, 0x08);
mchbar_write8(TSC3, 0);
mchbar_clrsetbits8(TSC2, 0x0f, 0x04);
mchbar_clrsetbits8(THERM1, 1, 1);
mchbar_clrsetbits8(TCO, 1 << 7, 1 << 7);
/* Clock gating */
mchbar_clrbits32(PMMISC, 1 << 18 | 1 << 0);
mchbar_clrbits8(SBCTL3 + 3, 1 << 7);
mchbar_clrbits8(CISDCTRL + 3, 1 << 7);
mchbar_clrbits16(CICGDIS, 0x1fff);
mchbar_clrbits32(SBCLKGATECTRL, 0x1ffff);
mchbar_clrsetbits16(HICLKGTCTL, 0x03ff, 0x06);
mchbar_clrsetbits32(HTCLKGTCTL, ~0, 0x20);
mchbar_clrbits8(TSMISC, 1 << 0);
mchbar_write8(C0WRDPYN, s->selected_timings.CAS - 1 + 0x15);
mchbar_clrsetbits16(CLOCKGATINGI, 0x07fc, 0x0040);
mchbar_clrsetbits16(CLOCKGATINGII, 0x0fff, 0x0d00);
mchbar_clrbits16(CLOCKGATINGIII, 0x0d80);
mchbar_write16(GTDPCGC + 2, 0xffff);
/* Sequencing */
mchbar_clrsetbits32(HPWRCTL1, 0x1fffffff, 0x1f643fff);
mchbar_clrsetbits32(HPWRCTL2, 0xffffff7f, 0x02010000);
mchbar_clrsetbits16(HPWRCTL3, 7 << 12, 3 << 12);
/* Power */
mchbar_clrsetbits32(GFXC3C4, 0xffff0003, 0x10100000);
mchbar_clrsetbits32(PMDSLFRC, 0x0001bff7, 0x00000078);
if (s->selected_timings.fsb_clock == FSB_CLOCK_667MHz)
mchbar_clrsetbits16(PMMSPMRES, 0x03ff, 0x00c8);
else
mchbar_clrsetbits16(PMMSPMRES, 0x03ff, 0x0100);
j = (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) ? 0 : 1;
mchbar_clrsetbits32(PMCLKRC, 0x01fff37f, 0x10810700);
mchbar_clrsetbits8(PMPXPRC, 7, 1);
mchbar_clrbits8(PMBAK, 1 << 1);
static const u16 ddr2lut[2][4][2] = {
{
{0x0000, 0x0000},
{0x019A, 0x0039},
{0x0099, 0x1049},
{0x0000, 0x0000},
},
{
{0x0000, 0x0000},
{0x019A, 0x0039},
{0x0099, 0x1049},
{0x0099, 0x2159},
},
};
mchbar_write16(C0C2REG, 0x7a89);
mchbar_write8(SHC2REGII, 0xaa);
mchbar_write16(SHC2REGII + 1, ddr2lut[j][s->selected_timings.CAS - 3][1]);
mchbar_clrsetbits16(SHC2REGI, 0x7fff, ddr2lut[j][s->selected_timings.CAS - 3][0]);
mchbar_clrsetbits16(CLOCKGATINGIII, 0xf000, 0xf000);
mchbar_clrsetbits8(CSHWRIOBONUSX, 0x77, 4 << 4 | 4);
reg32 = s->nodll ? 0x30000000 : 0;
mchbar_clrsetbits32(C0COREBONUS, 0xf << 24, 1 << 29 | reg32);
mchbar_clrsetbits32(CLOCKGATINGI, 0xf << 20, 0xf << 20);
mchbar_clrsetbits32(CLOCKGATINGII - 1, 0x001ff000, 0xbf << 20);
mchbar_clrsetbits16(SHC3C4REG2, 0x1f7f, 0x0b << 8 | 7 << 4 | 0x0b);
mchbar_write16(SHC3C4REG3, 0x3264);
mchbar_clrsetbits16(SHC3C4REG4, 0x3f3f, 0x14 << 8 | 0x0a);
mchbar_setbits32(C1COREBONUS, 1 << 31 | 1 << 13);
}
static void sdram_programddr(void)
{
mchbar_clrsetbits16(CLOCKGATINGII, 0x03ff, 0x0100);
mchbar_clrsetbits16(CLOCKGATINGIII, 0x003f, 0x0010);
mchbar_clrsetbits16(CLOCKGATINGI, 0x7000, 0x2000);
mchbar_clrbits8(CSHRPDCTL, 7 << 1);
mchbar_clrbits8(CSHRWRIOMLNS, 3 << 2);
mchbar_clrbits8(C0MISCCTLy(0), 7 << 1);
mchbar_clrbits8(C0MISCCTLy(1), 7 << 1);
mchbar_clrbits8(C0MISCCTLy(2), 7 << 1);
mchbar_clrbits8(C0MISCCTLy(3), 7 << 1);
mchbar_clrbits8(C0MISCCTLy(4), 7 << 1);
mchbar_clrbits8(C0MISCCTLy(5), 7 << 1);
mchbar_clrbits8(C0MISCCTLy(6), 7 << 1);
mchbar_clrbits8(C0MISCCTLy(7), 7 << 1);
mchbar_clrbits8(CSHRWRIOMLNS, 1 << 1);
mchbar_clrbits16(CSHRMISCCTL, 1 << 10);
mchbar_clrbits16(CLOCKGATINGIII, 0x0dc0);
mchbar_clrbits8(C0WRDPYN, 1 << 7);
mchbar_clrbits32(C0COREBONUS, 1 << 22);
mchbar_clrbits16(CLOCKGATINGI, 0x80fc);
mchbar_clrbits16(CLOCKGATINGII, 0x0c00);
mchbar_clrbits8(CSHRPDCTL, 0x0d);
mchbar_clrbits8(C0MISCCTLy(0), 1 << 0);
mchbar_clrbits8(C0MISCCTLy(1), 1 << 0);
mchbar_clrbits8(C0MISCCTLy(2), 1 << 0);
mchbar_clrbits8(C0MISCCTLy(3), 1 << 0);
mchbar_clrbits8(C0MISCCTLy(4), 1 << 0);
mchbar_clrbits8(C0MISCCTLy(5), 1 << 0);
mchbar_clrbits8(C0MISCCTLy(6), 1 << 0);
mchbar_clrbits8(C0MISCCTLy(7), 1 << 0);
mchbar_clrsetbits32(C0STATRDCTRL, 7 << 20, 3 << 20);
mchbar_clrbits32(C0COREBONUS, 1 << 20);
mchbar_setbits8(C0DYNSLVDLLEN, 0x1e);
mchbar_setbits8(C0DYNSLVDLLEN2, 0x03);
mchbar_clrsetbits32(SHCYCTRKCKEL, 3 << 26, 1 << 26);
mchbar_setbits16(C0STATRDCTRL, 3 << 13);
mchbar_setbits32(C0CKECTRL, 1 << 16);
mchbar_setbits8(C0COREBONUS, 1 << 4);
mchbar_setbits32(CLOCKGATINGI - 1, 0xf << 24);
mchbar_setbits8(CSHWRIOBONUS, 7);
mchbar_setbits8(C0DYNSLVDLLEN, 3 << 6);
mchbar_setbits8(SHC2REGIII, 7);
mchbar_clrsetbits16(SHC2MINTM, ~0, 1 << 7);
mchbar_clrsetbits8(SHC2IDLETM, 0xff, 0x10);
mchbar_setbits16(C0COREBONUS, 0xf << 5);
mchbar_setbits8(CSHWRIOBONUS, 3 << 3);
mchbar_setbits8(CSHRMSTDYNDLLENB, 0x0d);
mchbar_setbits16(SHC3C4REG1, 0x0a3f);
mchbar_setbits8(C0STATRDCTRL, 3);
mchbar_clrsetbits8(C0REFRCTRL2, 0xff, 0x4a);
mchbar_clrbits8(C0COREBONUS + 4, 3 << 5);
mchbar_setbits16(C0DYNSLVDLLEN, 0x0321);
}
static void sdram_programdqdqs(struct sysinfo *s)
{
u16 mdclk, tpi, refclk, dqdqs_out, dqdqs_outdelay, dqdqs_delay;
u32 coretomcp, txdelay, tmaxunmask, tmaxpi;
u8 repeat, halfclk, feature, reg8, push;
u16 cwb, pimdclk;
u32 reg32;
static const u8 txfifotab[8] = {0, 7, 6, 5, 2, 1, 4, 3};
tpi = 3000;
dqdqs_out = 4382;
dqdqs_outdelay = 5083;
dqdqs_delay = 4692;
coretomcp = 0;
txdelay = 0;
halfclk = 0;
tmaxunmask = 0;
tmaxpi = 0;
repeat = 2;
feature = 0;
cwb = 0;
pimdclk = 0;
reg32 = 0;
push = 0;
reg8 = 0;
mdclk = (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) ? 3000 : 2500;
refclk = 3000 - mdclk;
coretomcp = ((mchbar_read8(C0ADDCSCTRL) >> 2) & 0x3) + 1;
coretomcp *= mdclk;
reg8 = (mchbar_read8(CSHRFIFOCTL) & 0x0e) >> 1;
while (repeat) {
txdelay = mdclk * (
((mchbar_read16(C0GNT2LNCH1) >> 8) & 0x7) +
(mchbar_read8(C0WRDATACTRL) & 0xf) +
(mchbar_read8(C0WRDATACTRL + 1) & 0x1)
) +
txfifotab[reg8]*(mdclk / 2) +
coretomcp +
refclk +
cwb;
halfclk = (mchbar_read8(C0MISCCTL) >> 1) & 0x1;
if (halfclk) {
txdelay -= mdclk / 2;
reg32 = dqdqs_outdelay + coretomcp - mdclk / 2;
} else {
reg32 = dqdqs_outdelay + coretomcp;
}
tmaxunmask = txdelay - mdclk - dqdqs_out;
tmaxpi = tmaxunmask - tpi;
if ((tmaxunmask >= reg32) && tmaxpi >= dqdqs_delay) {
if (repeat == 2) {
mchbar_clrbits32(C0COREBONUS, 1 << 23);
}
feature = 1;
repeat = 0;
} else {
repeat--;
mchbar_setbits32(C0COREBONUS, 1 << 23);
cwb = 2 * mdclk;
}
}
if (!feature) {
mchbar_clrbits8(CLOCKGATINGI, 3);
return;
}
mchbar_setbits8(CLOCKGATINGI, 3);
mchbar_clrsetbits16(CLOCKGATINGIII, 0xf << 12, pimdclk << 12);
mchbar_clrsetbits8(CSHWRIOBONUSX, 0x77, push << 4 | push);
mchbar_clrsetbits32(C0COREBONUS, 0xf << 24, 3 << 24);
}
/**
* @param boot_path: 0 = normal, 1 = reset, 2 = resume from s3
*/
void sdram_initialize(int boot_path, const u8 *spd_addresses)
{
struct sysinfo si;
const char *boot_str[] = {"Normal", "Reset", "Resume"};
PRINTK_DEBUG("Setting up RAM controller.\n");
memset(&si, 0, sizeof(si));
si.boot_path = boot_path;
printk(BIOS_DEBUG, "Boot path: %s\n", boot_str[boot_path]);
si.spd_map[0] = spd_addresses[0];
si.spd_map[1] = spd_addresses[1];
si.spd_map[2] = spd_addresses[2];
si.spd_map[3] = spd_addresses[3];
sdram_read_spds(&si);
/* Choose Common Frequency */
sdram_detect_ram_speed(&si);
/* Determine smallest common tRAS, tRP, tRCD, etc */
sdram_detect_smallest_params(&si);
/* Enable HPET */
enable_hpet();
mchbar_setbits16(CPCTL, 1 << 15);
sdram_clk_crossing(&si);
sdram_checkreset();
PRINTK_DEBUG("Done checkreset\n");
sdram_clkmode(&si);
PRINTK_DEBUG("Done clkmode\n");
sdram_timings(&si);
PRINTK_DEBUG("Done timings (dqs dll enabled)\n");
if (si.boot_path != BOOT_PATH_RESET) {
sdram_dlltiming(&si);
PRINTK_DEBUG("Done dlltiming\n");
}
if (si.boot_path != BOOT_PATH_RESET) {
sdram_rcomp(&si);
PRINTK_DEBUG("Done RCOMP\n");
}
sdram_odt(&si);
PRINTK_DEBUG("Done odt\n");
if (si.boot_path != BOOT_PATH_RESET) {
while ((mchbar_read8(COMPCTRL1) & 1) != 0)
;
}
sdram_mmap(&si);
PRINTK_DEBUG("Done mmap\n");
/* Enable DDR IO buffer */
mchbar_clrsetbits8(C0IOBUFACTCTL, 0x3f, 0x08);
mchbar_setbits8(C0RSTCTL, 1 << 0);
sdram_rcompupdate(&si);
PRINTK_DEBUG("Done RCOMP update\n");
mchbar_setbits8(HIT4, 1 << 1);
if (si.boot_path != BOOT_PATH_RESUME) {
mchbar_setbits32(C0CKECTRL, 1 << 27);
sdram_jedecinit(&si);
PRINTK_DEBUG("Done MRS\n");
}
sdram_misc(&si);
PRINTK_DEBUG("Done misc\n");
sdram_zqcl(&si);
PRINTK_DEBUG("Done zqcl\n");
if (si.boot_path != BOOT_PATH_RESUME) {
mchbar_setbits32(C0REFRCTRL2, 3 << 30);
}
sdram_dradrb(&si);
PRINTK_DEBUG("Done dradrb\n");
sdram_rcven(&si);
PRINTK_DEBUG("Done rcven\n");
sdram_new_trd(&si);
PRINTK_DEBUG("Done tRD\n");
sdram_mmap_regs(&si);
PRINTK_DEBUG("Done mmap regs\n");
sdram_enhancedmode(&si);
PRINTK_DEBUG("Done enhanced mode\n");
sdram_powersettings(&si);
PRINTK_DEBUG("Done power settings\n");
sdram_programddr();
PRINTK_DEBUG("Done programming ddr\n");
sdram_programdqdqs(&si);
PRINTK_DEBUG("Done programming dqdqs\n");
sdram_periodic_rcomp();
PRINTK_DEBUG("Done periodic RCOMP\n");
/* Set init done */
mchbar_setbits32(C0REFRCTRL2, 1 << 30);
/* Tell ICH7 that we're done */
pci_and_config8(PCI_DEV(0, 0x1f, 0), 0xa2, (u8)~(1 << 7));
/* Tell northbridge we're done */
pci_or_config8(HOST_BRIDGE, 0xf4, 1);
printk(BIOS_DEBUG, "RAM initialization finished.\n");
}