[coreboot-gerrit] Patch set updated for coreboot: northbridge/intel/x4x: Native raminit (WIP)
Damien Zammit (damien@zamaudio.com)
gerrit at coreboot.org
Thu Dec 10 01:06:49 CET 2015
Damien Zammit (damien at zamaudio.com) just uploaded a new patch set to gerrit, which you can find at https://review.coreboot.org/11307
-gerrit
commit 783731868c0b0584b757f1b7f6b15213525be9e1
Author: Damien Zammit <damien at zamaudio.com>
Date: Thu Aug 20 00:37:05 2015 +1000
northbridge/intel/x4x: Native raminit (WIP)
Passes ram_check() @ 0x200000
Need to get jump to ramstage working so we can run memtest86+
Change-Id: Ib34d862cb48b49c054a505fffcba1c17aeb39436
Signed-off-by: Damien Zammit <damien at zamaudio.com>
---
src/northbridge/intel/x4x/Makefile.inc | 5 +-
src/northbridge/intel/x4x/bootblock.c | 32 +-
src/northbridge/intel/x4x/debug.h | 13 +
src/northbridge/intel/x4x/delay.c | 7 +-
src/northbridge/intel/x4x/delay.h | 2 +
src/northbridge/intel/x4x/early_init.c | 15 +
src/northbridge/intel/x4x/raminit.c | 520 ++++++++
src/northbridge/intel/x4x/raminit_ddr2.c | 2117 ++++++++++++++++++++++++++++++
src/northbridge/intel/x4x/x4x.h | 139 +-
9 files changed, 2804 insertions(+), 46 deletions(-)
diff --git a/src/northbridge/intel/x4x/Makefile.inc b/src/northbridge/intel/x4x/Makefile.inc
index 0c979b8..3c92c87 100644
--- a/src/northbridge/intel/x4x/Makefile.inc
+++ b/src/northbridge/intel/x4x/Makefile.inc
@@ -21,8 +21,9 @@ ifeq ($(CONFIG_NORTHBRIDGE_INTEL_X4X),y)
romstage-y += early_init.c
#romstage-y += early_reset.c
-#romstage-y += delay.c
-#romstage-y += raminit.c
+romstage-y += delay.c
+romstage-y += raminit.c
+romstage-y += raminit_ddr2.c
#romstage-y += raminit_rcomp_calibration.c
#romstage-y += raminit_receive_enable_calibration.c
#romstage-y += raminit_read_write_training.c
diff --git a/src/northbridge/intel/x4x/bootblock.c b/src/northbridge/intel/x4x/bootblock.c
index fb40b94..c1a42c5 100644
--- a/src/northbridge/intel/x4x/bootblock.c
+++ b/src/northbridge/intel/x4x/bootblock.c
@@ -4,9 +4,24 @@
#define D0F0_PCIEXBAR_LO 0x60
#define D0F0_PCIEXBAR_HI 0x64
+#define EARLYRCBA 0xd0000
+#define ERCBA8(x) *((volatile u8 *)(EARLYRCBA + x))
+#define ERCBA16(x) *((volatile u16 *)(EARLYRCBA + x))
+#define ERCBA32(x) *((volatile u32 *)(EARLYRCBA + x))
+
+#define EARLYMCH 0xfed14000
+#define EMCH8(x) *((volatile u8 *)(EARLYMCH + x))
+#define EMCH16(x) *((volatile u16 *)(EARLYMCH + x))
+#define EMCH32(x) *((volatile u32 *)(EARLYMCH + x))
+
+#define TPMBASE 0xfed40000
+#define TPM8(x) *((volatile u8 *)(TPMBASE + x))
+
static void bootblock_northbridge_init(void)
{
uint32_t reg;
+ uint32_t reg2;
+ uint8_t reg8;
/*
* The "io" variant of the config access is explicitly used to
@@ -20,8 +35,21 @@ static void bootblock_northbridge_init(void)
* The PCIEXBAR is assumed to live in the memory mapped IO space under
* 4GiB.
*/
- reg = 0;
- pci_io_write_config32(PCI_DEV(0,0,0), D0F0_PCIEXBAR_HI, reg);
+
+ // Do some magic early with RCBA
+ reg = pci_io_read_config32(PCI_DEV(0, 0x1f, 0), 0xf0);
+ pci_io_write_config32(PCI_DEV(0, 0x1f, 0), 0xf0, EARLYRCBA | 1);
+
+ ERCBA8(0x3410) = ERCBA8(0x3410) | 0x24;
+ ERCBA8(0x3400) = ERCBA8(0x3400) | 0x4;
+ outb(0xce, 0x80);
+ reg8 = ERCBA8(0x3411);
+ pci_io_write_config32(PCI_DEV(0, 0x1f, 0), 0xf0, 0xfed1c000 | 1);
+
+ // Do some magic early with TPM
+ reg8 = TPM8(0);
+
+ pci_io_write_config32(PCI_DEV(0,0,0), D0F0_PCIEXBAR_HI, 0);
reg = CONFIG_MMCONF_BASE_ADDRESS | (2 << 1) | 1; /* 64MiB - 0-63 buses. */
pci_io_write_config32(PCI_DEV(0,0,0), D0F0_PCIEXBAR_LO, reg);
}
diff --git a/src/northbridge/intel/x4x/debug.h b/src/northbridge/intel/x4x/debug.h
new file mode 100644
index 0000000..94bea08
--- /dev/null
+++ b/src/northbridge/intel/x4x/debug.h
@@ -0,0 +1,13 @@
+/* Debugging macros. */
+#if 1 //CONFIG_DEBUG_RAM_SETUP
+#define PRINTK_DEBUG(x...) printk(BIOS_DEBUG, x)
+#else
+#define PRINTK_DEBUG(x...)
+#endif
+
+#if 0 //CONFIG_DEBUG_RAM_SETUP
+#define PRINTK_VERBOSE(x...) printk(BIOS_DEBUG, x)
+#else
+#define PRINTK_VERBOSE(x...)
+#endif
+
diff --git a/src/northbridge/intel/x4x/delay.c b/src/northbridge/intel/x4x/delay.c
index 1060dc3..2fbb001 100644
--- a/src/northbridge/intel/x4x/delay.c
+++ b/src/northbridge/intel/x4x/delay.c
@@ -84,11 +84,16 @@ static void _udelay(const u32 us, const u32 numerator, const int total)
|| ((tsc.hi == tsc1.hi) && (tsc.lo < tsc1.lo)));
}
-void udelay(const u32 us)
+void microdelay(const u32 us)
{
_udelay(us, 1, 0);
}
+void ns10delay(const u32 ns10)
+{
+ _udelay(ns10, 100, 0);
+}
+
void ns100delay(const u32 ns100)
{
_udelay(ns100, 10, 0);
diff --git a/src/northbridge/intel/x4x/delay.h b/src/northbridge/intel/x4x/delay.h
index c8ee9ce..181e576 100644
--- a/src/northbridge/intel/x4x/delay.h
+++ b/src/northbridge/intel/x4x/delay.h
@@ -22,7 +22,9 @@
#include <delay.h>
+void microdelay(u32);
void ns100delay(u32);
+void ns10delay(u32);
void udelay_from_reset(u32);
#endif /* __NORTHBRIDGE_INTEL_GM45_DELAY_H__ */
diff --git a/src/northbridge/intel/x4x/early_init.c b/src/northbridge/intel/x4x/early_init.c
index e489e90..7a151dc 100644
--- a/src/northbridge/intel/x4x/early_init.c
+++ b/src/northbridge/intel/x4x/early_init.c
@@ -23,6 +23,8 @@
void x4x_early_init(void)
{
+ u16 reg16;
+
const device_t d0f0 = PCI_DEV(0, 0, 0);
/* Setup MCHBAR. */
@@ -34,8 +36,14 @@ void x4x_early_init(void)
/* Setup EPBAR. */
pci_write_config32(d0f0, D0F0_EPBAR_LO, DEFAULT_EPBAR | 1);
+ /* Setup PMBASE */
pci_write_config32(d0f0, D0F0_PMBASE, DEFAULT_PMBASE | 1);
+ /* Setup HECIBAR */
+ pci_write_config32(PCI_DEV(0,3,0), 0x10, DEFAULT_HECIBAR);
+ reg16 = pci_read_config16(PCI_DEV(0,3,0), 0x4);
+ pci_write_config16(PCI_DEV(0,3,0), 0x4, reg16 | 0x6);
+
/* Set C0000-FFFFF to access RAM on both reads and writes */
pci_write_config8(d0f0, D0F0_PAM(0), 0x30);
pci_write_config8(d0f0, D0F0_PAM(1), 0x33);
@@ -44,4 +52,11 @@ void x4x_early_init(void)
pci_write_config8(d0f0, D0F0_PAM(4), 0x33);
pci_write_config8(d0f0, D0F0_PAM(5), 0x33);
pci_write_config8(d0f0, D0F0_PAM(6), 0x33);
+
+ /* Enable internal GFX */
+ reg16 = pci_read_config16(d0f0, 0x52);
+ pci_write_config16(d0f0, 0x52, reg16 | 0x802); // GTT = 2, UMA = 32
+
+ reg16 = pci_read_config16(d0f0, 0x54);
+ pci_write_config16(d0f0, 0x54, reg16 | 0x8);
}
diff --git a/src/northbridge/intel/x4x/raminit.c b/src/northbridge/intel/x4x/raminit.c
new file mode 100644
index 0000000..564356c
--- /dev/null
+++ b/src/northbridge/intel/x4x/raminit.c
@@ -0,0 +1,520 @@
+/*
+ * This file is part of the coreboot project.
+ *
+ * Copyright (C) 2015 Damien Zammit <damien at zamaudio.com>
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License as
+ * published by the Free Software Foundation; version 2 of
+ * the License.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc.
+ */
+
+#include <arch/io.h>
+#include <cbmem.h>
+#include <console/console.h>
+#include <cpu/x86/cache.h>
+#include <cpu/x86/mtrr.h>
+#include <delay.h>
+#include <halt.h>
+#include <lib.h>
+#include <northbridge/intel/x4x/x4x.h>
+#include <pc80/mc146818rtc.h>
+#include <spd.h>
+#include <string.h>
+#include "debug.h"
+
+static inline int spd_read_byte(unsigned device, unsigned address)
+{
+ return smbus_read_byte(device, address);
+}
+
+static void sdram_read_spds(sysinfo_t *s)
+{
+ u8 i, j, chan;
+ int status = 0;
+ FOR_EACH_DIMM(i) {
+ for (j = 0; j < 64; j++) {
+ status = spd_read_byte(s->spd_map[i], j);
+ if (status < 0) {
+ s->dimms[i].card_type = 0;
+ break;
+ }
+ s->dimms[i].spd_data[j] = (u8) status;
+ PRINTK_DEBUG("%02x ", (u8) status);
+ if (j % 16 == 15)
+ PRINTK_DEBUG("\n");
+ if (j == 62)
+ s->dimms[i].card_type = ((u8) status) & 0x1f;
+ }
+ PRINTK_DEBUG("\n");
+ }
+
+/*
+ if (ONLY_DIMMB_IS_POPULATED(s->dimms, 0)) {
+ // Swap dimm info on ch 0
+ dimminfo_t tmp;
+ memcpy(&tmp, &s->dimms[0], sizeof(dimminfo_t));
+ memcpy(&s->dimms[0], &s->dimms[1], sizeof(dimminfo_t));
+ memcpy(&s->dimms[1], &tmp, sizeof(dimminfo_t));
+ }
+ if (ONLY_DIMMB_IS_POPULATED(s->dimms, 1)) {
+ // Swap dimm info on ch 1
+ dimminfo_t tmp;
+ memcpy(&tmp, &s->dimms[2], sizeof(dimminfo_t));
+ memcpy(&s->dimms[2], &s->dimms[3], sizeof(dimminfo_t));
+ memcpy(&s->dimms[3], &tmp, sizeof(dimminfo_t));
+ }
+*/
+
+ s->spd_type = 0;
+ int fail = 1;
+ FOR_EACH_POPULATED_DIMM(s->dimms, i) {
+ switch (s->dimms[i].spd_data[2]) {
+ case 0x8:
+ if (s->spd_type == 0) {
+ s->spd_type = DDR2;
+ } else if (s->spd_type == DDR3) {
+ die("DIMM type mismatch\n");
+ }
+ break;
+ case 0xb:
+ default:
+ if (s->spd_type == 0) {
+ s->spd_type = DDR3;
+ } else if (s->spd_type == DDR2) {
+ die("DIMM type mismatch\n");
+ }
+ break;
+ }
+ }
+ if (s->spd_type == DDR3) {
+ FOR_EACH_POPULATED_DIMM(s->dimms, i) {
+ s->dimms[i].sides = (s->dimms[i].spd_data[5] & 0x0f) + 1;
+ s->dimms[i].ranks = ((s->dimms[i].spd_data[7] >> 3) & 0x7) + 1;
+ s->dimms[i].chip_capacity = (s->dimms[i].spd_data[4] & 0xf);
+ s->dimms[i].banks = 8;
+ s->dimms[i].rows = ((s->dimms[i].spd_data[5] >> 3) & 0x7) + 12;
+ s->dimms[i].cols = (s->dimms[i].spd_data[5] & 0x7) + 9;
+ s->dimms[i].cas_latencies = 0xfe;
+ s->dimms[i].cas_latencies &= (s->dimms[i].spd_data[14] << 1);
+ if (s->dimms[i].cas_latencies == 0)
+ s->dimms[i].cas_latencies = 0x40;
+ s->dimms[i].tAAmin = s->dimms[i].spd_data[16];
+ s->dimms[i].tCKmin = s->dimms[i].spd_data[12];
+ s->dimms[i].width = s->dimms[i].spd_data[7] & 0x7;
+ s->dimms[i].page_size = s->dimms[i].width * (1 << s->dimms[i].cols); // Bytes
+ s->dimms[i].tRAS = ((s->dimms[i].spd_data[21] & 0xf) << 8) |
+ s->dimms[i].spd_data[22];
+ s->dimms[i].tRP = s->dimms[i].spd_data[20];
+ s->dimms[i].tRCD = s->dimms[i].spd_data[18];
+ s->dimms[i].tWR = s->dimms[i].spd_data[17];
+ fail = 0;
+ }
+ } else if (s->spd_type == DDR2) {
+ FOR_EACH_POPULATED_DIMM(s->dimms, i) {
+ s->dimms[i].sides = (s->dimms[i].spd_data[5] & 0x7) + 1;
+ s->dimms[i].banks = (s->dimms[i].spd_data[17] >> 2) - 1;
+ s->dimms[i].chip_capacity = s->dimms[i].banks;
+ s->dimms[i].rows = s->dimms[i].spd_data[3];// - 12;
+ s->dimms[i].cols = s->dimms[i].spd_data[4];// - 9;
+ s->dimms[i].cas_latencies = 0x78;
+ s->dimms[i].cas_latencies &= s->dimms[i].spd_data[18];
+ if (s->dimms[i].cas_latencies == 0)
+ s->dimms[i].cas_latencies = 7;
+ s->dimms[i].tAAmin = s->dimms[i].spd_data[26];
+ s->dimms[i].tCKmin = s->dimms[i].spd_data[25];
+ s->dimms[i].width = (s->dimms[i].spd_data[13] >> 3) - 1;
+ s->dimms[i].page_size = (s->dimms[i].width+1) * (1 << s->dimms[i].cols); // Bytes
+ s->dimms[i].tRAS = s->dimms[i].spd_data[30];
+ s->dimms[i].tRP = s->dimms[i].spd_data[27];
+ s->dimms[i].tRCD = s->dimms[i].spd_data[29];
+ s->dimms[i].tWR = s->dimms[i].spd_data[36];
+ s->dimms[i].ranks = s->dimms[i].sides; // XXX
+
+ PRINTK_DEBUG("DIMM %d\n", i);
+ PRINTK_DEBUG(" Sides : %d\n", s->dimms[i].sides);
+ PRINTK_DEBUG(" Banks : %d\n", s->dimms[i].banks);
+ PRINTK_DEBUG(" Ranks : %d\n", s->dimms[i].ranks);
+ PRINTK_DEBUG(" Rows : %d\n", s->dimms[i].rows);
+ PRINTK_DEBUG(" Cols : %d\n", s->dimms[i].cols);
+ PRINTK_DEBUG(" Page size : %d\n", s->dimms[i].page_size);
+ PRINTK_DEBUG(" Width : %d\n", (s->dimms[i].width+1)*8);
+ fail = 0;
+ }
+ }
+ if (fail) {
+ die("No memory dimms, halt\n");
+ }
+
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, chan) {
+ if (s->dimms[chan>>1].sides == 0) {
+ // NC
+ if (s->dimms[(chan>>1) + 1].sides == 0) {
+ // NC/NC
+ s->dimm_config[chan] = 0;
+ } else if (s->dimms[(chan>>1) + 1].sides == 1) {
+ // NC/SS
+ if (s->dimms[(chan>>1) + 1].width == 0) {
+ // NC/8SS
+ s->dimm_config[chan] = 4;
+ } else {
+ // NC/16SS
+ s->dimm_config[chan] = 12;
+ }
+ } else {
+ // NC/DS
+ if (s->dimms[(chan>>1) + 1].width == 0) {
+ // NC/8DS
+ s->dimm_config[chan] = 8;
+ } else {
+ // NOT SUPPORTED
+ die("16DS Not supported\n");
+ }
+ }
+ } else if (s->dimms[chan>>1].sides == 1) {
+ // SS
+ if (s->dimms[(chan>>1) + 1].sides == 0) {
+ // SS/NC
+ if (s->dimms[chan>>1].width == 0) {
+ // 8SS/NC
+ s->dimm_config[chan] = 1;
+ } else {
+ // 16SS/NC
+ s->dimm_config[chan] = 3;
+ }
+ } else if (s->dimms[(chan>>1) + 1].sides == 1) {
+ // SS/SS
+ if (s->dimms[chan>>1].width == 0) {
+ if (s->dimms[(chan>>1) + 1].width == 0) {
+ // 8SS/8SS
+ s->dimm_config[chan] = 5;
+ } else {
+ // 8SS/16SS
+ s->dimm_config[chan] = 13;
+ }
+ } else {
+ if (s->dimms[(chan>>1) + 1].width == 0) {
+ // 16SS/8SS
+ s->dimm_config[chan] = 7;
+ } else {
+ // 16SS/16SS
+ s->dimm_config[chan] = 15;
+ }
+ }
+ } else {
+ // SS/DS
+ if (s->dimms[chan>>1].width == 0) {
+ if (s->dimms[(chan>>1) + 1].width == 0) {
+ // 8SS/8DS
+ s->dimm_config[chan] = 9;
+ } else {
+ die("16DS not supported\n");
+ }
+ } else {
+ if (s->dimms[(chan>>1) + 1].width == 0) {
+ // 16SS/8DS
+ s->dimm_config[chan] = 11;
+ } else {
+ die("16DS not supported\n");
+ }
+ }
+ }
+ } else {
+ // DS
+ if (s->dimms[(chan>>1) + 1].sides == 0) {
+ // DS/NC
+ if (s->dimms[chan>>1].width == 0) {
+ // 8DS/NC
+ s->dimm_config[chan] = 2;
+ } else {
+ die("16DS not supported\n");
+ }
+ } else if (s->dimms[(chan>>1) + 1].sides == 1) {
+ // DS/SS
+ if (s->dimms[chan>>1].width == 0) {
+ if (s->dimms[(chan>>1) + 1].width == 0) {
+ // 8DS/8SS
+ s->dimm_config[chan] = 6;
+ } else {
+ // 8DS/16SS
+ s->dimm_config[chan] = 14;
+ }
+ } else {
+ die("16DS not supported\n");
+ }
+ } else {
+ // DS/DS
+ if (s->dimms[chan>>1].width == 0 && s->dimms[(chan>>1)+1].width == 0) {
+ // 8DS/8DS
+ s->dimm_config[chan] = 10;
+ }
+ }
+ }
+ PRINTK_DEBUG(" Config[CH%d] : %d\n", chan, s->dimm_config[chan]);
+ }
+}
+
+static u8 lsbpos(u8 val) //Forward
+{
+ u8 i;
+ for (i = 0; (i < 8) && ((val & (1 << i)) == 0); i++);
+ return i;
+}
+
+static u8 msbpos(u8 val) //Reverse
+{
+ u8 i;
+ for (i = 7; (i >= 0) && ((val & (1 << i)) == 0); i--);
+ return i;
+}
+
+static void mchinfo_ddr2(sysinfo_t *s)
+{
+ const u32 eax = cpuid_ext(0x04, 0).eax;
+ s->cores = ((eax >> 26) & 0x3f) + 1;
+ printk(BIOS_SPEW, "%d CPU cores\n", s->cores);
+
+ u32 capid = pci_read_config16(PCI_DEV(0,0,0), 0xe8);
+ if (!(capid & (1<<(79-64)))) {
+ printk(BIOS_SPEW, "iTPM enabled\n");
+ }
+
+ capid = pci_read_config32(PCI_DEV(0, 0, 0), 0xe4);
+ if (!(capid & (1<<(57-32)))) {
+ printk(BIOS_SPEW, "ME enabled\n");
+ }
+
+ if (!(capid & (1<<(56-32)))) {
+ printk(BIOS_SPEW, "AMT enabled\n");
+ }
+
+ s->max_ddr2_mhz = (capid & (1<<(53-32)))?667:800;
+ printk(BIOS_SPEW, "Capable of DDR2 of %d MHz or lower\n", s->max_ddr2_mhz);
+
+ if (!(capid & (1<<(48-32)))) {
+ printk(BIOS_SPEW, "VT-d enabled\n");
+ }
+}
+
+static void sdram_detect_ram_speed(sysinfo_t *s)
+{
+ u8 i;
+ u8 commoncas = 0;
+ u8 cas;
+ u8 lowcas;
+ u8 highcas;
+ u8 maxfreq;
+ u8 freq = 0;
+
+ // Find max FSB speed
+ switch (MCHBAR32(0xc00) & 0x7) {
+ case 0x0:
+ s->max_fsb = FSB_CLOCK_1066MHz;
+ break;
+ case 0x2:
+ s->max_fsb = FSB_CLOCK_800MHz;
+ break;
+ case 0x4:
+ s->max_fsb = FSB_CLOCK_1333MHz;
+ break;
+ default:
+ die("Can't find FSB\n");
+ break;
+ }
+
+ // Find RAM speed
+ maxfreq = (u8) ((pci_read_config16(PCI_DEV(0,0,0), 0xea) >> 4) & 0x3f);
+ if (s->spd_type == DDR2) {
+
+ // Limit frequency for MCH
+ maxfreq &= 0x7;
+ freq = MEM_CLOCK_800MHz;
+ if (maxfreq) {
+ freq = maxfreq;
+ }
+ if (freq > MEM_CLOCK_800MHz) {
+ freq = MEM_CLOCK_800MHz;
+ }
+
+ // Detect a common CAS latency
+ commoncas = 0xff;
+ FOR_EACH_POPULATED_DIMM(s->dimms, i) {
+ commoncas &= s->dimms[i].spd_data[18];
+ }
+ if (commoncas == 0) {
+ die("No common CAS among dimms\n");
+ }
+
+ // Start with fastest common CAS
+ cas = 0;
+ highcas = msbpos(commoncas);
+ lowcas = lsbpos(commoncas);
+
+ while (cas == 0 && highcas >= lowcas) {
+ FOR_EACH_POPULATED_DIMM(s->dimms, i) {
+ switch (freq) {
+ case MEM_CLOCK_800MHz:
+ if ((s->dimms[i].spd_data[9] > 0x25) ||
+ (s->dimms[i].spd_data[10] > 0x40)) {
+ // CAS too fast, lower it
+ highcas--;
+ break;
+ } else {
+ cas = highcas;
+ }
+ break;
+ case MEM_CLOCK_667MHz:
+ default:
+ if ((s->dimms[i].spd_data[9] > 0x30) ||
+ (s->dimms[i].spd_data[10] > 0x45)) {
+ // CAS too fast, lower it
+ highcas--;
+ break;
+ } else {
+ cas = highcas;
+ }
+ break;
+ }
+ }
+ }
+ if (highcas < lowcas) {
+ // Timings not supported by MCH, lower the frequency
+ freq--;
+ cas = 0;
+ highcas = msbpos(commoncas);
+ lowcas = lsbpos(commoncas);
+ while (cas == 0 && highcas >= lowcas) {
+ FOR_EACH_POPULATED_DIMM(s->dimms, i) {
+ switch (freq) {
+ case MEM_CLOCK_800MHz:
+ if ((s->dimms[i].spd_data[23] > 0x25) ||
+ (s->dimms[i].spd_data[24] > 0x40)) {
+ // CAS too fast, lower it
+ highcas--;
+ break;
+ } else {
+ cas = highcas;
+ }
+ break;
+ case MEM_CLOCK_667MHz:
+ default:
+ if ((s->dimms[i].spd_data[23] > 0x30) ||
+ (s->dimms[i].spd_data[24] > 0x45)) {
+ // CAS too fast, lower it
+ highcas--;
+ break;
+ } else {
+ cas = highcas;
+ }
+ break;
+ }
+ }
+ }
+ }
+ s->selected_timings.mem_clock = freq;
+ s->selected_timings.CAS = cas;
+
+ } else { // DDR3
+ // Limit frequency for MCH
+ maxfreq >>= 3;
+ freq = MEM_CLOCK_1333MHz;
+ if (maxfreq) {
+ freq = maxfreq + 2;
+ }
+ if (freq > MEM_CLOCK_1333MHz) {
+ freq = MEM_CLOCK_1333MHz;
+ }
+
+ // Limit DDR speed to FSB speed
+ switch (s->max_fsb) {
+ case FSB_CLOCK_800MHz:
+ if (freq > MEM_CLOCK_800MHz) {
+ freq = MEM_CLOCK_800MHz;
+ }
+ break;
+ case FSB_CLOCK_1066MHz:
+ if (freq > MEM_CLOCK_1066MHz) {
+ freq = MEM_CLOCK_1066MHz;
+ }
+ break;
+ case FSB_CLOCK_1333MHz:
+ if (freq > MEM_CLOCK_1333MHz) {
+ freq = MEM_CLOCK_1333MHz;
+ }
+ break;
+ default:
+ die("Invalid FSB\n");
+ break;
+ }
+
+ // TODO: CAS detection for DDR3
+ }
+}
+
+/**
+ * @param boot_path: 0 = normal, 1 = reset, 2 = resume from s3
+ */
+void sdram_initialize(int boot_path, const u8 *spd_map)
+{
+ sysinfo_t sysinfo;
+ u8 reg8;
+
+ PRINTK_DEBUG("Setting up RAM controller.\n");
+
+ pci_write_config8(PCI_DEV(0,0,0), 0xdf, 0xff);
+
+ memset(&sysinfo, 0, sizeof(sysinfo));
+
+ sysinfo.boot_path = boot_path;
+ sysinfo.spd_map[0] = spd_map[0];
+ sysinfo.spd_map[1] = spd_map[1];
+ sysinfo.spd_map[2] = spd_map[2];
+ sysinfo.spd_map[3] = spd_map[3];
+
+ /* Detect dimms per channel */
+ sysinfo.dimms_per_ch = 2;
+ reg8 = pci_read_config8(PCI_DEV(0,0,0), 0xe9);
+ if (reg8 & 0x10) {
+ sysinfo.dimms_per_ch = 1;
+ }
+ PRINTK_DEBUG("Dimms per channel: %d\n", sysinfo.dimms_per_ch);
+
+ mchinfo_ddr2(&sysinfo);
+
+ sdram_read_spds(&sysinfo);
+
+ /* Choose Common Frequency */
+ sdram_detect_ram_speed(&sysinfo);
+
+ sysinfo.enable_igd = 1;
+ igd_compute_ggc(&sysinfo);
+ init_igd(&sysinfo);
+
+ switch (sysinfo.spd_type) {
+ case DDR2:
+ raminit_ddr2(&sysinfo);
+ break;
+ case DDR3:
+ //raminit_ddr3(&sysinfo);
+ break;
+ default:
+ die("Unknown DDR type\n");
+ break;
+ }
+
+ reg8 = pci_read_config8(PCI_DEV(0, 0x1f, 0), 0xa2);
+ pci_write_config8(PCI_DEV(0, 0x1f, 0), 0xa2, reg8 & ~0x80);
+
+ reg8 = pci_read_config8(PCI_DEV(0,0,0), 0xf4);
+ pci_write_config8(PCI_DEV(0,0,0), 0xf4, reg8 | 1);
+ printk(BIOS_DEBUG, "RAM initialization finished.\n");
+}
diff --git a/src/northbridge/intel/x4x/raminit_ddr2.c b/src/northbridge/intel/x4x/raminit_ddr2.c
new file mode 100644
index 0000000..590b502
--- /dev/null
+++ b/src/northbridge/intel/x4x/raminit_ddr2.c
@@ -0,0 +1,2117 @@
+/*
+ * This file is part of the coreboot project.
+ *
+ * Copyright (C) 2015 Damien Zammit <damien at zamaudio.com>
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; version 2 of the License.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc.
+ */
+
+#include <stdint.h>
+#include <arch/io.h>
+#include <arch/cpu.h>
+#include <console/console.h>
+#include "delay.h"
+#include "x4x.h"
+#include "debug.h"
+
+#define max(a, b) ((a) > (b) ? (a) : (b))
+#define min(a, b) ((a) < (b) ? (a) : (b))
+#define barrier() __asm__ __volatile__("": : :"memory")
+
+static u32 fsb2mhz(u32 speed)
+{
+ return (speed * 267) + 800;
+}
+
+static u32 ddr2mhz(u32 speed)
+{
+ u32 mhz;
+ mhz = (speed == 2) ? 667 :
+ (speed == 3) ? 800 :
+ (speed == 4) ? 1067 :
+ (speed == 5) ? 1333 :
+ 0;
+ return mhz;
+}
+
+static u8 msbpos(u8 val) //Reverse
+{
+ u8 i;
+ for (i = 7; (i >= 0) && ((val & (1 << i)) == 0); i--);
+ return i;
+}
+
+static void sdram_detect_smallest_params2(sysinfo_t *s)
+{
+ u16 mult[6] = {
+ 5000, // 400
+ 3750, // 533
+ 3000, // 667
+ 2500, // 800
+ 1875, // 1066
+ 1500, // 1333
+ };
+
+ u8 i;
+ u32 tmp;
+ u32 maxtras = 0;
+ u32 maxtrp = 0;
+ u32 maxtrcd = 0;
+ u32 maxtwr = 0;
+ u32 maxtrfc = 0;
+ u32 maxtwtr = 0;
+ u32 maxtrrd = 0;
+ u32 maxtrtp = 0;
+
+ FOR_EACH_POPULATED_DIMM(s->dimms, i) {
+ maxtras = max(maxtras, s->dimms[i].spd_data[30] * 1000);
+ maxtrp = max(maxtrp, (s->dimms[i].spd_data[27] * 1000) >> 2);
+ maxtrcd = max(maxtrcd, (s->dimms[i].spd_data[29] * 1000) >> 2);
+ maxtwr = max(maxtwr, (s->dimms[i].spd_data[36] * 1000) >> 2);
+ maxtrfc = max(maxtrfc, s->dimms[i].spd_data[42] * 1000 +
+ (s->dimms[i].spd_data[40] & 0xf));
+ maxtwtr = max(maxtwtr, (s->dimms[i].spd_data[37] * 1000) >> 2);
+ maxtrrd = max(maxtrrd, (s->dimms[i].spd_data[28] * 1000) >> 2);
+ maxtrtp = max(maxtrtp, (s->dimms[i].spd_data[38] * 1000) >> 2);
+ }
+ for (i = 9; i < 24; i++) { // 16
+ tmp = mult[s->selected_timings.mem_clock] * i;
+ if (tmp >= maxtras) {
+ s->selected_timings.tRAS = i;
+ break;
+ }
+ }
+ for (i = 3; i < 10; i++) {
+ tmp = mult[s->selected_timings.mem_clock] * i;
+ if (tmp >= maxtrp) {
+ s->selected_timings.tRP = i;
+ break;
+ }
+ }
+ for (i = 3; i < 10; i++) {
+ tmp = mult[s->selected_timings.mem_clock] * i;
+ if (tmp >= maxtrcd) {
+ s->selected_timings.tRCD = i;
+ break;
+ }
+ }
+ for (i = 3; i < 15; i++) {
+ tmp = mult[s->selected_timings.mem_clock] * i;
+ if (tmp >= maxtwr) {
+ s->selected_timings.tWR = i;
+ break;
+ }
+ }
+ for (i = 15; i < 78; i++) {
+ tmp = mult[s->selected_timings.mem_clock] * i;
+ if (tmp >= maxtrfc) {
+ s->selected_timings.tRFC = ((i + 16) & 0xfe) - 15;
+ break;
+ }
+ }
+ for (i = 4; i < 15; i++) {
+ tmp = mult[s->selected_timings.mem_clock] * i;
+ if (tmp >= maxtwtr) {
+ s->selected_timings.tWTR = i;
+ break;
+ }
+ }
+ for (i = 2; i < 15; i++) {
+ tmp = mult[s->selected_timings.mem_clock] * i;
+ if (tmp >= maxtrrd) {
+ s->selected_timings.tRRD = i;
+ break;
+ }
+ }
+ for (i = 4; i < 15; i++) {
+ tmp = mult[s->selected_timings.mem_clock] * i;
+ if (tmp >= maxtrtp) {
+ s->selected_timings.tRTP = i;
+ break;
+ }
+ }
+
+ s->selected_timings.fsb_clock = s->max_fsb;
+
+ PRINTK_DEBUG("Selected timings:\n");
+ PRINTK_DEBUG(" FSB: %dMHz\n", fsb2mhz(s->selected_timings.fsb_clock));
+ PRINTK_DEBUG(" DDR: %dMHz\n", ddr2mhz(s->selected_timings.mem_clock));
+
+ PRINTK_DEBUG(" CAS: %d\n", s->selected_timings.CAS);
+ PRINTK_DEBUG(" tRAS: %d\n", s->selected_timings.tRAS);
+ PRINTK_DEBUG(" tRP: %d\n", s->selected_timings.tRP);
+ PRINTK_DEBUG(" tRCD: %d\n", s->selected_timings.tRCD);
+ PRINTK_DEBUG(" tWR: %d\n", s->selected_timings.tWR);
+ PRINTK_DEBUG(" tRFC: %d\n", s->selected_timings.tRFC);
+ PRINTK_DEBUG(" tWTR: %d\n", s->selected_timings.tWTR);
+ PRINTK_DEBUG(" tRRD: %d\n", s->selected_timings.tRRD);
+ PRINTK_DEBUG(" tRTP: %d\n", s->selected_timings.tRTP);
+}
+
+static void clkcross_ddr2(sysinfo_t *s)
+{
+ u32 c04, c50, c54, x6d8, x6dc, x6e8, x6ec, x6f8, x6fc, x700, x704, x708, x70c;
+
+ MCHBAR16(0xc1c) = MCHBAR16(0xc1c) | (1 << 15);
+
+ if ((s->selected_timings.fsb_clock == FSB_CLOCK_800MHz) &&
+ (s->selected_timings.mem_clock == MEM_CLOCK_667MHz)) {
+ c04 = 0x1f1f1f1f;
+ c50 = 0x1a07070b;
+ c54 = 0x0;
+ x6d8 = 0x10000000;
+ x6dc = 0x20010208;
+ x6e8 = 0x04080000;
+ x6ec = 0x10010002;
+ x6f8 = 0x0;
+ x6fc = 0x0;
+ x700 = 0x02000000;
+ x704 = 0x04000100;
+ x708 = 0x08000000;
+ x70c = 0x10200204;
+ } else if ((s->selected_timings.fsb_clock == FSB_CLOCK_800MHz) &&
+ (s->selected_timings.mem_clock == MEM_CLOCK_800MHz)) {
+ c04 = 0xffffffff;
+ c50 = 0x05030305;
+ c54 = 0x0000ffff;
+ x6d8 = 0x0;
+ x6dc = 0x08010204;
+ x6e8 = 0x0;
+ x6ec = 0x08010204;
+ x6f8 = 0x0;
+ x6fc = 0x0;
+ x700 = 0x0;
+ x704 = 0x00020001;
+ x708 = 0x0;
+ x70c = 0x04080102;
+ } else if ((s->selected_timings.fsb_clock == FSB_CLOCK_1066MHz) &&
+ (s->selected_timings.mem_clock == MEM_CLOCK_667MHz)) {
+ c04 = 0x6d5b1f1f;
+ c50 = 0x0f0f0f0f;
+ c54 = 0x0;
+ x6d8 = 0x20000000;
+ x6dc = 0x80020410;
+ x6e8 = 0x02040008;
+ x6ec = 0x10000100;
+ x6f8 = 0x0;
+ x6fc = 0x0;
+ x700 = 0x04000000;
+ x704 = 0x08000102;
+ x708 = 0x20000000;
+ x70c = 0x40010208;
+ } else if ((s->selected_timings.fsb_clock == FSB_CLOCK_1066MHz) &&
+ (s->selected_timings.mem_clock == MEM_CLOCK_800MHz)) {
+ c04 = 0x07070707;
+ c50 = 0x06030303;
+ c54 = 0x0;
+ x6d8 = 0x0;
+ x6dc = 0x08010200;
+ x6e8 = 0x0;
+ x6ec = 0x04000102;
+ x6f8 = 0x0;
+ x6fc = 0x0;
+ x700 = 0x0;
+ x704 = 0x00020001;
+ x708 = 0x0;
+ x70c = 0x02040801;
+ } else if ((s->selected_timings.fsb_clock == FSB_CLOCK_1066MHz) &&
+ (s->selected_timings.mem_clock == MEM_CLOCK_1066MHz)) {
+ c04 = 0xffffffff;
+ c50 = 0x05030305;
+ c54 = 0x0000ffff;
+ x6d8 = 0x0;
+ x6dc = 0x04080102;
+ x6e8 = 0x0;
+ x6ec = 0x08010204;
+ x6f8 = 0x0;
+ x6fc = 0x0;
+ x700 = 0x0;
+ x704 = 0x00020001;
+ x708 = 0x0;
+ x70c = 0x02040801;
+ } else if ((s->selected_timings.fsb_clock == FSB_CLOCK_1333MHz) &&
+ (s->selected_timings.mem_clock == MEM_CLOCK_667MHz)) {
+ c04 = 0x05050303;
+ c50 = 0xffffffff;
+ c54 = 0xffff0000;
+ x6d8 = 0x0;
+ x6dc = 0x08020000;
+ x6e8 = 0x0;
+ x6ec = 0x00020001;
+ x6f8 = 0x0;
+ x6fc = 0x0;
+ x700 = 0x0;
+ x704 = 0x08010204;
+ x708 = 0x0;
+ x70c = 0x04010000;
+ } else if ((s->selected_timings.fsb_clock == FSB_CLOCK_1333MHz) &&
+ (s->selected_timings.mem_clock == MEM_CLOCK_800MHz)) {
+ c04 = 0x0d0b0707;
+ c50 = 0x3e1f1f2f;
+ c54 = 0x01010000;
+ x6d8 = 0x0;
+ x6dc = 0x10020400;
+ x6e8 = 0x02000000;
+ x6ec = 0x00040100;
+ x6f8 = 0x0;
+ x6fc = 0x0;
+ x700 = 0x04080000;
+ x704 = 0x00100102;
+ x708 = 0x0;
+ x70c = 0x08100200;
+ } else if ((s->selected_timings.fsb_clock == FSB_CLOCK_1333MHz) &&
+ (s->selected_timings.mem_clock == MEM_CLOCK_1066MHz)) {
+ c04 = 0x0f0f0f0f;
+ c50 = 0x5b1f1f6d;
+ c54 = 0x0;
+ x6d8 = 0x0;
+ x6dc = 0x08010204;
+ x6e8 = 0x04000000;
+ x6ec = 0x00080102;
+ x6f8 = 0x0;
+ x6fc = 0x0;
+ x700 = 0x02000408;
+ x704 = 0x00100001;
+ x708 = 0x0;
+ x70c = 0x04080102;
+ } else if ((s->selected_timings.fsb_clock == FSB_CLOCK_1333MHz) &&
+ (s->selected_timings.mem_clock == MEM_CLOCK_1333MHz)) {
+ c04 = 0xffffffff;
+ c50 = 0x05030305;
+ c54 = 0x0000ffff;
+ x6d8 = 0x0;
+ x6dc = 0x04080102;
+ x6e8 = 0x0;
+ x6ec = 0x04080102;
+ x6f8 = 0x0;
+ x6fc = 0x0;
+ x700 = 0x0;
+ x704 = 0x0;
+ x708 = 0x0;
+ x70c = 0x02040801;
+ } else {
+ die("Unsupported DDR/FSB configuration\n");
+ }
+
+ MCHBAR32(0xc04) = c04;
+ MCHBAR32(0xc50) = c50;
+ MCHBAR32(0xc54) = c54;
+ MCHBAR8(0xc08) = MCHBAR8(0xc08) | (1 << 7);
+
+ MCHBAR32(0x6d8) = x6d8;
+ MCHBAR32(0x6e0) = x6d8;
+ MCHBAR32(0x6dc) = x6dc;
+ MCHBAR32(0x6e4) = x6dc;
+ MCHBAR32(0x6e8) = x6e8;
+ MCHBAR32(0x6f0) = x6e8;
+ MCHBAR32(0x6ec) = x6ec;
+ MCHBAR32(0x6f4) = x6ec;
+ MCHBAR32(0x6f8) = x6f8;
+ MCHBAR32(0x6fc) = x6fc;
+ MCHBAR32(0x708) = x708;
+ MCHBAR32(0x70c) = x70c;
+}
+
+static void checkreset_ddr2(sysinfo_t *s)
+{
+ u8 pmcon2;
+ u8 reset = 0;
+
+// MCHBAR32(0xc00) = (MCHBAR32(0xc00) & ~0xf0000) | 0x10000;
+
+ pmcon2 = pci_read_config8(PCI_DEV(0, 0x1f, 0), 0xa2);
+ if (!(pmcon2 & 0x80)) {
+ pmcon2 |= 0x80;
+ pci_write_config8(PCI_DEV(0, 0x1f, 0), 0xa2, pmcon2);
+ reset = 1;
+
+ /* do magic 0xf0 thing. */
+ u8 reg8 = pci_read_config8(PCI_DEV(0, 0, 0), 0xf0);
+ pci_write_config8(PCI_DEV(0, 0, 0), 0xf0, reg8 & ~(1 << 2));
+ reg8 = pci_read_config8(PCI_DEV(0, 0, 0), 0xf0);
+ pci_write_config8(PCI_DEV(0, 0, 0), 0xf0, reg8 | (1 << 2));
+ }
+ if (reset) {
+ PRINTK_DEBUG("Reset...\n");
+ outb(0xe, 0xcf9);
+ //outb(0x02, 0xcf9); /* Set system reset bit. */
+ //outb(0x06, 0xcf9); /* Set cpu reset bit, too. */
+ asm ("hlt");
+ }
+ pci_write_config8(PCI_DEV(0, 0x1f, 0), 0xa2, pmcon2 | 0x80);
+}
+
+static void setioclk_ddr2(sysinfo_t *s)
+{
+ MCHBAR32(0x1bc) = 0x08060402;
+ MCHBAR16(0x1c0) = MCHBAR16(0x1c0) | 0x200;
+ MCHBAR16(0x1c0) = MCHBAR16(0x1c0) | 0x100;
+ MCHBAR16(0x1c0) = MCHBAR16(0x1c0) | 0x20;
+ MCHBAR16(0x1c0) = MCHBAR16(0x1c0) & ~1;
+ switch (s->selected_timings.mem_clock) {
+ default:
+ case MEM_CLOCK_800MHz:
+ case MEM_CLOCK_1066MHz:
+ MCHBAR8(0x5d9) = (MCHBAR8(0x5d9) & ~0x2) | 0x2;
+ MCHBAR8(0x9d9) = (MCHBAR8(0x9d9) & ~0x2) | 0x2;
+ MCHBAR8(0x189) = (MCHBAR8(0x189) & ~0xf0) | 0xc0;
+ MCHBAR8(0x189) = (MCHBAR8(0x189) & ~0xf0) | 0xe0;
+ MCHBAR8(0x189) = (MCHBAR8(0x189) & ~0xf0) | 0xa0;
+ break;
+ case MEM_CLOCK_667MHz:
+ case MEM_CLOCK_1333MHz:
+ MCHBAR8(0x5d9) = MCHBAR8(0x5d9) & ~0x2;
+ MCHBAR8(0x9d9) = MCHBAR8(0x9d9) & ~0x2;
+ MCHBAR8(0x189) = (MCHBAR8(0x189) & ~0xf0) | 0x40;
+ break;
+ }
+ MCHBAR32(0x594) = MCHBAR32(0x594) | (1 << 31);
+ MCHBAR32(0x994) = MCHBAR32(0x994) | (1 << 31);
+}
+
+static void launch_ddr2(sysinfo_t *s)
+{
+ u8 i;
+ u32 launch1 = 0x58001117;
+ u32 launch2 = 0;
+ u32 launch3 = 0;
+
+ if (s->selected_timings.CAS == 5) {
+ launch2 = 0x00220201;
+ } else if ((s->selected_timings.mem_clock == MEM_CLOCK_800MHz) &&
+ (s->selected_timings.CAS == 6)) {
+ launch2 = 0x00230302;
+ } else {
+ die("Unsupported CAS & Frequency combination detected\n");
+ }
+
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
+ MCHBAR32(0x400*i + 0x220) = launch1;
+ MCHBAR32(0x400*i + 0x224) = launch2;
+ MCHBAR32(0x400*i + 0x21c) = launch3;
+ MCHBAR32(0x400*i + 0x248) = MCHBAR32(0x400*i + 0x248) | (1 << 23);
+ }
+
+ MCHBAR32(0x2c0) = (MCHBAR32(0x2c0) & ~0x58000000) | 0x48000000;
+ MCHBAR32(0x2c0) = MCHBAR32(0x2c0) | 0x1e0;
+ MCHBAR32(0x2c4) = (MCHBAR32(0x2c4) & ~0xf) | 0xc;
+}
+
+static void clkset0(u8 ch, u8 setting[5])
+{
+ MCHBAR16(0x400*ch + 0x5a0) = (MCHBAR16(0x400*ch + 0x5a0) & ~0xc440) |
+ (setting[4] << 14) |
+ (setting[3] << 6) |
+ (setting[2] << 10);
+ MCHBAR8(0x400*ch + 0x581) = (MCHBAR8(0x400*ch + 0x581) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x581) = (MCHBAR8(0x400*ch + 0x581) & ~0xf) |
+ setting[0];
+}
+
+static void clkset1(u8 ch, u8 setting[5])
+{
+ MCHBAR32(0x400*ch + 0x5a0) = (MCHBAR32(0x400*ch + 0x5a0) & ~0x30880) |
+ (setting[4] << 16) |
+ (setting[3] << 7) |
+ (setting[2] << 11);
+ MCHBAR8(0x400*ch + 0x582) = (MCHBAR8(0x400*ch + 0x582) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x582) = (MCHBAR8(0x400*ch + 0x582) & ~0xf) |
+ setting[0];
+}
+
+static void ctrlset0(u8 ch, u8 setting[5])
+{
+ MCHBAR32(0x400*ch + 0x59c) = (MCHBAR32(0x400*ch + 0x59c) & ~0x3300000) |
+ (setting[4] << 24) |
+ (setting[3] << 20) |
+ (setting[2] << 21);
+ MCHBAR8(0x400*ch + 0x584) = (MCHBAR8(0x400*ch + 0x584) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x584) = (MCHBAR8(0x400*ch + 0x584) & ~0xf) |
+ setting[0];
+}
+
+static void ctrlset1(u8 ch, u8 setting[5])
+{
+ MCHBAR32(0x400*ch + 0x59c) = (MCHBAR32(0x400*ch + 0x59c) & ~0x18c00000) |
+ (setting[4] << 27) |
+ (setting[3] << 22) |
+ (setting[2] << 23);
+ MCHBAR8(0x400*ch + 0x585) = (MCHBAR8(0x400*ch + 0x585) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x585) = (MCHBAR8(0x400*ch + 0x585) & ~0xf) |
+ setting[0];
+}
+
+static void ctrlset2(u8 ch, u8 setting[5])
+{
+ MCHBAR32(0x400*ch + 0x598) = (MCHBAR32(0x400*ch + 0x598) & ~0x18c00000) |
+ (setting[4] << 14) |
+ (setting[3] << 12) |
+ (setting[2] << 13);
+ MCHBAR8(0x400*ch + 0x586) = (MCHBAR8(0x400*ch + 0x586) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x586) = (MCHBAR8(0x400*ch + 0x586) & ~0xf) |
+ setting[0];
+}
+
+static void ctrlset3(u8 ch, u8 setting[5])
+{
+ MCHBAR32(0x400*ch + 0x598) = (MCHBAR32(0x400*ch + 0x598) & ~0x18c00000) |
+ (setting[4] << 10) |
+ (setting[3] << 8) |
+ (setting[2] << 9);
+ MCHBAR8(0x400*ch + 0x587) = (MCHBAR8(0x400*ch + 0x587) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x587) = (MCHBAR8(0x400*ch + 0x587) & ~0xf) |
+ setting[0];
+}
+
+static void cmdset(u8 ch, u8 setting[5])
+{
+ MCHBAR8(0x400*ch + 0x598) = (MCHBAR8(0x400*ch + 0x598) & ~0x30) |
+ (setting[4] << 4);
+ MCHBAR8(0x400*ch + 0x594) = (MCHBAR8(0x400*ch + 0x594) & ~0x60) |
+ (setting[3] << 5) |
+ (setting[2] << 6);
+ MCHBAR8(0x400*ch + 0x580) = (MCHBAR8(0x400*ch + 0x580) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x580) = (MCHBAR8(0x400*ch + 0x580) & ~0xf) |
+ setting[0];
+}
+
+static void dqsset(u8 ch, u8 lane, u8 setting[5])
+{
+ MCHBAR32(0x400*ch + 0x5fc) = MCHBAR32(0x400*ch + 0x5fc) & ~(2 << (lane*4));
+
+ MCHBAR32(0x400*ch + 0x5b4) = (MCHBAR32(0x400*ch + 0x5b4) & ~(0x201 << lane)) |
+ (setting[2] << (9 + lane)) |
+ (setting[3] << lane);
+ MCHBAR32(0x400*ch + 0x5b8) = (MCHBAR32(0x400*ch + 0x5b8) & ~(0x201 << lane)) |
+ (setting[2] << (9 + lane)) |
+ (setting[3] << lane);
+ MCHBAR32(0x400*ch + 0x5bc) = (MCHBAR32(0x400*ch + 0x5bc) & ~(0x201 << lane)) |
+ (setting[2] << (9 + lane)) |
+ (setting[3] << lane);
+ MCHBAR32(0x400*ch + 0x5c0) = (MCHBAR32(0x400*ch + 0x5c0) & ~(0x201 << lane)) |
+ (setting[2] << (9 + lane)) |
+ (setting[3] << lane);
+
+ MCHBAR32(0x400*ch + 0x5c8) = (MCHBAR32(0x400*ch + 0x5c8) & ~(0x3 << (16+lane*2))) |
+ (setting[4] << (16+lane*2));
+ MCHBAR32(0x400*ch + 0x5cc) = (MCHBAR32(0x400*ch + 0x5cc) & ~(0x3 << (16+lane*2))) |
+ (setting[4] << (16+lane*2));
+ MCHBAR32(0x400*ch + 0x5d0) = (MCHBAR32(0x400*ch + 0x5d0) & ~(0x3 << (16+lane*2))) |
+ (setting[4] << (16+lane*2));
+ MCHBAR32(0x400*ch + 0x5d4) = (MCHBAR32(0x400*ch + 0x5d4) & ~(0x3 << (16+lane*2))) |
+ (setting[4] << (16+lane*2));
+
+ MCHBAR8(0x400*ch + 0x520 + lane*4) = (MCHBAR8(0x400*ch + 0x520 + lane*4) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x520 + lane*4) = (MCHBAR8(0x400*ch + 0x520 + lane*4) & ~0xf) |
+ setting[0];
+ MCHBAR8(0x400*ch + 0x521 + lane*4) = (MCHBAR8(0x400*ch + 0x521 + lane*4) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x521 + lane*4) = (MCHBAR8(0x400*ch + 0x521 + lane*4) & ~0xf) |
+ setting[0];
+ MCHBAR8(0x400*ch + 0x522 + lane*4) = (MCHBAR8(0x400*ch + 0x522 + lane*4) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x522 + lane*4) = (MCHBAR8(0x400*ch + 0x522 + lane*4) & ~0xf) |
+ setting[0];
+ MCHBAR8(0x400*ch + 0x523 + lane*4) = (MCHBAR8(0x400*ch + 0x523 + lane*4) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x523 + lane*4) = (MCHBAR8(0x400*ch + 0x523 + lane*4) & ~0xf) |
+ setting[0];
+}
+
+static void dqset(u8 ch, u8 lane, u8 setting[5])
+{
+ MCHBAR32(0x400*ch + 0x5fc) = MCHBAR32(0x400*ch + 0x5fc) & ~(1 << (lane*4));
+
+ MCHBAR32(0x400*ch + 0x5a4) = (MCHBAR32(0x400*ch + 0x5a4) & ~(0x201 << lane)) |
+ (setting[2] << (9+lane)) |
+ (setting[3] << lane);
+ MCHBAR32(0x400*ch + 0x5a8) = (MCHBAR32(0x400*ch + 0x5a8) & ~(0x201 << lane)) |
+ (setting[2] << (9+lane)) |
+ (setting[3] << lane);
+ MCHBAR32(0x400*ch + 0x5ac) = (MCHBAR32(0x400*ch + 0x5ac) & ~(0x201 << lane)) |
+ (setting[2] << (9+lane)) |
+ (setting[3] << lane);
+ MCHBAR32(0x400*ch + 0x5b0) = (MCHBAR32(0x400*ch + 0x5b0) & ~(0x201 << lane)) |
+ (setting[2] << (9+lane)) |
+ (setting[3] << lane);
+
+ MCHBAR32(0x400*ch + 0x5c8) = (MCHBAR32(0x400*ch + 0x5c8) & ~(0x3 << (lane*2))) |
+ (setting[4] << (2*lane));
+ MCHBAR32(0x400*ch + 0x5cc) = (MCHBAR32(0x400*ch + 0x5cc) & ~(0x3 << (lane*2))) |
+ (setting[4] << (2*lane));
+ MCHBAR32(0x400*ch + 0x5d0) = (MCHBAR32(0x400*ch + 0x5d0) & ~(0x3 << (lane*2))) |
+ (setting[4] << (2*lane));
+ MCHBAR32(0x400*ch + 0x5d4) = (MCHBAR32(0x400*ch + 0x5d4) & ~(0x3 << (lane*2))) |
+ (setting[4] << (2*lane));
+
+ MCHBAR8(0x400*ch + 0x500 + lane*4) = (MCHBAR8(0x400*ch + 0x500 + lane*4) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x500 + lane*4) = (MCHBAR8(0x400*ch + 0x500 + lane*4) & ~0xf) |
+ setting[0];
+ MCHBAR8(0x400*ch + 0x501 + lane*4) = (MCHBAR8(0x400*ch + 0x501 + lane*4) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x501 + lane*4) = (MCHBAR8(0x400*ch + 0x501 + lane*4) & ~0xf) |
+ setting[0];
+ MCHBAR8(0x400*ch + 0x502 + lane*4) = (MCHBAR8(0x400*ch + 0x502 + lane*4) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x502 + lane*4) = (MCHBAR8(0x400*ch + 0x502 + lane*4) & ~0xf) |
+ setting[0];
+ MCHBAR8(0x400*ch + 0x503 + lane*4) = (MCHBAR8(0x400*ch + 0x503 + lane*4) & ~0x70) |
+ (setting[1] << 4);
+ MCHBAR8(0x400*ch + 0x503 + lane*4) = (MCHBAR8(0x400*ch + 0x503 + lane*4) & ~0xf) |
+ setting[0];
+}
+
+static void timings_ddr2(sysinfo_t *s)
+{
+ u8 i;
+ u8 twl, ta1, ta2, ta3, ta4;
+ u8 reg8;
+ u8 flag1 = 0;
+ u8 flag2 = 0;
+ u16 reg16;
+ u32 reg32;
+ u16 ddr, fsb;
+ u8 trpmod = 0;
+ u8 bankmod = 1;
+ u8 pagemod = 0;
+
+ u16 fsb2ps[3] = {
+ 5000, // 800
+ 3750, // 1067
+ 3000 // 1333
+ };
+
+ u16 ddr2ps[6] = {
+ 5000, // 400
+ 3750, // 533
+ 3000, // 667
+ 2500, // 800
+ 1875, // 1067
+ 1500 // 1333
+ };
+
+ u16 lut1[6] = {
+ 0,
+ 0,
+ 2600,
+ 3120,
+ 4171,
+ 5200
+ };
+
+ ta1 = 6;
+ ta2 = 6;
+ ta3 = 5;
+ ta4 = 8;
+
+ twl = s->selected_timings.CAS - 1;
+
+ FOR_EACH_POPULATED_DIMM(s->dimms, i) {
+ if (s->dimms[i].banks == 1) { // 8 banks
+ trpmod = 1;
+ bankmod = 0;
+ }
+ if (s->dimms[i].page_size == 2048) {
+ pagemod = 1;
+ }
+ }
+
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
+ MCHBAR8(0x400*i + 0x2f6) = MCHBAR8(0x400*i + 0x2f6) | 0x3;
+ MCHBAR8(0x400*i + 0x228) = (MCHBAR8(0x400*i + 0x228) & ~0x7) | 0x2;
+ MCHBAR8(0x400*i + 0x240) = (MCHBAR8(0x400*i + 0x240) & ~0xf0) | (twl << 4);
+ MCHBAR8(0x400*i + 0x240) = (MCHBAR8(0x400*i + 0x240) & ~0xf) |
+ s->selected_timings.CAS;
+ MCHBAR16(0x400*i + 0x265) = (MCHBAR16(0x400*i + 0x265) & ~0x3f00) |
+ ((s->selected_timings.CAS + 9) << 8);
+
+ reg16 = (s->selected_timings.tRAS << 11) |
+ ((twl + 4 + s->selected_timings.tWR) << 6) |
+ ((2 + max(s->selected_timings.tRTP, 2)) << 2) | 1;
+ MCHBAR16(0x400*i + 0x250) = reg16;
+
+ reg32 = (bankmod << 21) |
+ (s->selected_timings.tRRD << 17) |
+ (s->selected_timings.tRP << 13) |
+ ((s->selected_timings.tRP + trpmod) << 9) |
+ s->selected_timings.tRFC;
+ reg8 = (MCHBAR8(0x400*i + 0x26f) >> 1) & 1;
+ if (bankmod) {
+ switch (s->selected_timings.mem_clock) {
+ default:
+ case MEM_CLOCK_667MHz:
+ if (reg8) {
+ if (pagemod) {
+ reg32 |= 16 << 22;
+ } else {
+ reg32 |= 12 << 22;
+ }
+ } else {
+ if (pagemod) {
+ reg32 |= 18 << 22;
+ } else {
+ reg32 |= 14 << 22;
+ }
+ }
+ break;
+ case MEM_CLOCK_800MHz:
+ if (reg8) {
+ if (pagemod) {
+ reg32 |= 18 << 22;
+ } else {
+ reg32 |= 14 << 22;
+ }
+ } else {
+ if (pagemod) {
+ reg32 |= 20 << 22;
+ } else {
+ reg32 |= 16 << 22;
+ }
+ }
+ break;
+ }
+ }
+ MCHBAR32(0x400*i + 0x252) = reg32;
+
+ MCHBAR16(0x400*i + 0x256) = (s->selected_timings.tRCD << 12) |
+ (0x4 << 8) | (ta2 << 4) | ta4;
+
+ MCHBAR32(0x400*i + 0x258) = (s->selected_timings.tRCD << 17) |
+ ((twl + 4 + s->selected_timings.tWTR) << 12) |
+ (ta3 << 8) | (4 << 4) | ta1;
+
+ MCHBAR16(0x400*i + 0x25b) = ((s->selected_timings.tRP + trpmod) << 9) |
+ s->selected_timings.tRFC;
+
+ MCHBAR16(0x400*i + 0x260) = (MCHBAR16(0x400*i + 0x260) & ~0x3fe) | (100 << 1);
+ MCHBAR8(0x400*i + 0x264) = 0xff;
+ MCHBAR8(0x400*i + 0x25d) = (MCHBAR8(0x400*i + 0x25d) & ~0x3f) |
+ s->selected_timings.tRAS;
+ MCHBAR16(0x400*i + 0x244) = 0x2310;
+
+ switch (s->selected_timings.mem_clock) {
+ case MEM_CLOCK_667MHz:
+ reg8 = 0;
+ break;
+ default:
+ reg8 = 1;
+ break;
+ }
+
+ MCHBAR8(0x400*i + 0x246) = (MCHBAR8(0x400*i + 0x246) & ~0x1f) |
+ (reg8 << 2) | 1;
+
+ fsb = fsb2ps[s->selected_timings.fsb_clock];
+ ddr = ddr2ps[s->selected_timings.mem_clock];
+ reg32 = (u32)((s->selected_timings.CAS + 7 + reg8) * ddr);
+ reg32 = (u32)((reg32 / fsb) << 8);
+ reg32 |= 0x0e000000;
+ if ((fsb2mhz(s->selected_timings.fsb_clock) /
+ ddr2mhz(s->selected_timings.mem_clock)) > 2) {
+ reg32 |= 1 << 24;
+ }
+ MCHBAR32(0x400*i + 0x248) = (MCHBAR32(0x400*i + 0x248) & ~0x0f001f00) |
+ reg32;
+
+ if (twl > 2) {
+ flag1 = 1;
+ }
+ if (s->selected_timings.mem_clock >= MEM_CLOCK_800MHz) {
+ flag2 = 1;
+ }
+ reg16 = (u8)(twl - 1 - flag1 - flag2);
+ reg16 |= reg16 << 4;
+ if (s->selected_timings.mem_clock == MEM_CLOCK_1333MHz) {
+ if (reg16) {
+ reg16--;
+ }
+ }
+ reg16 |= flag1 << 8;
+ reg16 |= flag2 << 9;
+ MCHBAR16(0x400*i + 0x24d) = (MCHBAR16(0x400*i + 0x24d) & ~0x1ff) | reg16;
+ MCHBAR16(0x400*i + 0x25e) = 0x15a5;
+ MCHBAR32(0x400*i + 0x265) = MCHBAR32(0x400*i + 0x265) & ~0x1f;
+ MCHBAR32(0x400*i + 0x269) = (MCHBAR32(0x400*i + 0x269) & ~0x000fffff) |
+ (0x3f << 14) | lut1[s->selected_timings.mem_clock];
+ MCHBAR8(0x400*i + 0x274) = MCHBAR8(0x400*i + 0x274) | 1;
+ MCHBAR8(0x400*i + 0x24c) = MCHBAR8(0x400*i + 0x24c) & ~0x3;
+
+ reg16 = 0;
+ switch (s->selected_timings.mem_clock) {
+ default:
+ case MEM_CLOCK_667MHz:
+ reg16 = 0x99;
+ break;
+ case MEM_CLOCK_800MHz:
+ if (s->selected_timings.CAS == 5) {
+ reg16 = 0x19a;
+ } else if (s->selected_timings.CAS == 6) {
+ reg16 = 0x9a;
+ }
+ break;
+ }
+ reg16 &= 0x7;
+ reg16 += twl + 9;
+ reg16 <<= 10;
+ MCHBAR16(0x400*i + 0x24d) = (MCHBAR16(0x400*i + 0x24d) & ~0x7c00) | reg16;
+ MCHBAR8(0x400*i + 0x267) = (MCHBAR8(0x400*i + 0x267) & ~0x3f) | 0x13;
+ MCHBAR8(0x400*i + 0x268) = (MCHBAR8(0x400*i + 0x268) & ~0xff) | 0x4a;
+
+ reg16 = (MCHBAR16(0x400*i + 0x269) & 0xc000) >> 2;
+ reg16 += 2 << 12;
+ reg16 |= (0x15 << 6) | 0x1f;
+ MCHBAR16(0x400*i + 0x26d) = (MCHBAR16(0x400*i + 0x26d) & ~0x7fff) | reg16;
+
+ reg32 = (1 << 25) | (6 << 27);
+ MCHBAR32(0x400*i + 0x269) = (MCHBAR32(0x400*i + 0x269) & ~0xfa300000) | reg32;
+ MCHBAR8(0x400*i + 0x271) = MCHBAR8(0x400*i + 0x271) & ~0x80;
+ MCHBAR8(0x400*i + 0x274) = MCHBAR8(0x400*i + 0x274) & ~0x6;
+ } // END EACH POPULATED CHANNEL
+
+ reg16 = 0x1f << 5;
+ reg16 |= 0xe << 10;
+ MCHBAR16(0x125) = (MCHBAR16(0x125) & ~0x3fe0) | reg16;
+ MCHBAR16(0x127) = (MCHBAR16(0x127) & ~0x7ff) | 0x540;
+ MCHBAR8(0x129) = MCHBAR8(0x129) | 0x1f;
+ MCHBAR8(0x12c) = MCHBAR8(0x12c) | 0xa0;
+ MCHBAR32(0x241) = (MCHBAR32(0x241) & ~0x1ffff) | 0x11;
+ MCHBAR32(0x641) = (MCHBAR32(0x641) & ~0x1ffff) | 0x11;
+ MCHBAR8(0x246) = MCHBAR8(0x246) & ~0x10;
+ MCHBAR8(0x646) = MCHBAR8(0x646) & ~0x10;
+ MCHBAR32(0x120) = (2 << 29) | (1 << 28) | (1 << 23) | 0xd7f5f;
+ reg8 = (u8)((MCHBAR32(0x252) & 0x1e000) >> 13);
+ MCHBAR8(0x12d) = (MCHBAR8(0x12d) & ~0xf0) | (reg8 << 4);
+ reg8 = (u8)((MCHBAR32(0x258) & ~0x1e0000) >> 17);
+ MCHBAR8(0x12d) = (MCHBAR8(0x12d) & ~0xf) | reg8;
+ MCHBAR8(0x12f) = 0x4c;
+ reg32 = (1 << 31) | (0x80 << 14) | (1 << 13) | (0xa << 9);
+ MCHBAR32(0x6c0) = (MCHBAR32(0x6c0) & ~0xffffff00) | reg32;
+ MCHBAR8(0x6c4) = (MCHBAR8(0x6c4) & ~0x7) | 0x2;
+}
+
+static void dll_ddr2(sysinfo_t *s)
+{
+ u8 i, j, r, reg8, clk, async;
+ u16 reg16 = 0;
+ u32 reg32 = 0;
+ u8 lane;
+
+ MCHBAR16(0x180) = (MCHBAR16(0x180) & ~0x7e06) | 0xc04;
+ MCHBAR16(0x182) = (MCHBAR16(0x182) & ~0x3ff) | 0xc8;
+ MCHBAR16(0x18a) = (MCHBAR16(0x18a) & ~0x1f1f) | 0x0f0f;
+ MCHBAR16(0x1b4) = (MCHBAR16(0x1b4) & ~0x8020) | 0x100;
+ MCHBAR8(0x194) = (MCHBAR8(0x194) & ~0x77) | 0x33;
+ switch (s->selected_timings.mem_clock) {
+ default:
+ case MEM_CLOCK_667MHz:
+ reg16 = (0xa << 9) | 0xa;
+ break;
+ case MEM_CLOCK_800MHz:
+ reg16 = (0x9 << 9) | 0x9;
+ break;
+ }
+ MCHBAR16(0x19c) = (MCHBAR16(0x19c) & ~0x1e0f) | reg16;
+ MCHBAR16(0x19c) = (MCHBAR16(0x19c) & ~0x2030) | 0x2010;
+ microdelay(1);
+ MCHBAR16(0x198) = MCHBAR16(0x198) & ~0x100;
+
+ MCHBAR16(0x1c8) = (MCHBAR16(0x1c8) & ~0x1f) | 0xd;
+
+ microdelay(1);
+ MCHBAR8(0x190) = MCHBAR8(0x190) & ~1;
+ ns10delay(54); // 533ns
+ MCHBAR32(0x198) = MCHBAR32(0x198) & ~0x11554000;
+ microdelay(1);
+ MCHBAR32(0x198) = MCHBAR32(0x198) & ~0x1455;
+ microdelay(1);
+ MCHBAR8(0x583) = MCHBAR8(0x583) & ~0x1c;
+ MCHBAR8(0x983) = MCHBAR8(0x983) & ~0x1c;
+ ns10delay(54); // 533ns
+ MCHBAR8(0x583) = MCHBAR8(0x583) & ~0x3;
+ MCHBAR8(0x983) = MCHBAR8(0x983) & ~0x3;
+ ns10delay(54); // 533ns
+
+ // ME related
+ MCHBAR32(0x1a0) = (MCHBAR32(0x1a0) & ~0x7ffffff) | 0x551803;
+
+ MCHBAR16(0x1b4) = MCHBAR16(0x1b4) & ~0x800;
+ MCHBAR8(0x1a8) = MCHBAR8(0x1a8) | 0xf0;
+
+ FOR_EACH_CHANNEL(i) {
+ reg16 = 0;
+ MCHBAR16(0x400*i + 0x59c) = MCHBAR16(0x400*i + 0x59c) & ~0x3000;
+
+ reg32 = 0;
+ FOR_EACH_RANK_IN_CHANNEL(r) if (!RANK_IS_POPULATED(s->dimms, i, r)) {
+ reg32 |= 0x111 << r;
+ }
+ MCHBAR32(0x400*i + 0x59c) = (MCHBAR32(0x400*i + 0x59c) & ~0xfff) | reg32;
+ MCHBAR8(0x400*i + 0x594) = MCHBAR8(0x400*i + 0x594) & ~1;
+
+ if (!CHANNEL_IS_POPULATED(s->dimms, i)) {
+ PRINTK_DEBUG("No dimms in channel %d\n", i);
+ reg8 = 0x3f;
+ } else if(ONLY_DIMMA_IS_POPULATED(s->dimms, i)) {
+ PRINTK_DEBUG("DimmA populated only in channel %d\n", i);
+ reg8 = 0x38;
+ } else if(ONLY_DIMMB_IS_POPULATED(s->dimms, i)) {
+ PRINTK_DEBUG("DimmB populated only in channel %d\n", i);
+ reg8 = 0x7;
+ } else if(BOTH_DIMMS_ARE_POPULATED(s->dimms, i)) {
+ PRINTK_DEBUG("Both dimms populated in channel %d\n", i);
+ reg8 = 0;
+ } else {
+ die("Unhandled case\n");
+ }
+
+ //reg8 = 0x00; // FIXME dont switch on all clocks anyway
+
+ MCHBAR32(0x400*i + 0x5a0) = (MCHBAR32(0x400*i + 0x5a0) & ~0x3f000000) |
+ ((u32)(reg8 << 24));
+ } // END EACH CHANNEL
+
+ MCHBAR8(0x1a8) = MCHBAR8(0x1a8) | 1;
+ MCHBAR8(0x1a8) = MCHBAR8(0x1a8) & ~0x4;
+
+ // Update DLL timing
+ MCHBAR8(0x1a4) = MCHBAR8(0x1a4) & ~0x80;
+ MCHBAR8(0x1a4) = MCHBAR8(0x1a4) | 0x40;
+ MCHBAR16(0x5f0) = (MCHBAR16(0x5f0) & ~0x400) | 0x400;
+
+ u8 dll_setting_667[23][5] = {
+ // tap pi db delay
+ {13, 0, 1,0, 0},
+ {4, 1, 0,0, 0},
+ {13, 0, 1,0, 0},
+ {4, 5, 0,0, 0},
+ {4, 1, 0,0, 0},
+ {4, 1, 0,0, 0},
+ {4, 1, 0,0, 0},
+ {1, 5, 1,1, 1},
+ {1, 6, 1,1, 1},
+ {2, 0, 1,1, 1},
+ {2, 1, 1,1, 1},
+ {2, 1, 1,1, 1},
+ {14, 6, 1,0, 0},
+ {14, 3, 1,0, 0},
+ {14, 0, 1,0, 0},
+ {9, 0, 0,0, 1},
+ {9, 1, 0,0, 1},
+ {9, 2, 0,0, 1},
+ {9, 2, 0,0, 1},
+ {9, 1, 0,0, 1},
+ {6, 4, 0,0, 1},
+ {6, 2, 0,0, 1},
+ {5, 4, 0,0, 1}
+ };
+
+ u8 dll_setting_800[23][5] = {
+ // tap pi db delay
+ {11, 5, 1,0, 0},
+ {0, 5, 1,1, 0},
+ {11, 5, 1,0, 0},
+ {1, 4, 1,1, 0},
+ {0, 5, 1,1, 0},
+ {0, 5, 1,1, 0},
+ {0, 5, 1,1, 0},
+ {2, 5, 1,1, 1},
+ {2, 6, 1,1, 1},
+ {3, 0, 1,1, 1},
+ {3, 0, 1,1, 1},
+ {3, 3, 1,1, 1},
+ {2, 0, 1,1, 1},
+ {1, 3, 1,1, 1},
+ {0, 3, 1,1, 1},
+ {9, 3, 0,0, 1},
+ {9, 4, 0,0, 1},
+ {9, 5, 0,0, 1},
+ {9, 6, 0,0, 1},
+ {10, 0, 0,0, 1},
+ {8, 1, 0,0, 1},
+ {7, 5, 0,0, 1},
+ {6, 2, 0,0, 1}
+ };
+
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
+ MCHBAR16(0x400*i + 0x5f0) = (MCHBAR16(0x400*i + 0x5f0) & ~0x3fc) | 0x3fc;
+ MCHBAR32(0x400*i + 0x5fc) = MCHBAR32(0x400*i + 0x5fc) & ~0xcccccccc;
+ MCHBAR8(0x400*i + 0x5d9) = (MCHBAR8(0x400*i + 0x5d9) & ~0xf0) | 0x70;
+ MCHBAR16(0x400*i + 0x590) = (MCHBAR16(0x400*i + 0x590) & ~0xffff) | 0x5555;
+ }
+
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
+ if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
+ clkset0(i, &dll_setting_667[CLKSET0][0]);
+ clkset1(i, &dll_setting_667[CLKSET1][0]);
+ ctrlset0(i, &dll_setting_667[CTRL0][0]);
+ ctrlset1(i, &dll_setting_667[CTRL1][0]);
+ ctrlset2(i, &dll_setting_667[CTRL2][0]);
+ ctrlset3(i, &dll_setting_667[CTRL3][0]);
+ cmdset(i, &dll_setting_667[CMD][0]);
+ } else {
+ clkset0(i, &dll_setting_800[CLKSET0][0]);
+ clkset1(i, &dll_setting_800[CLKSET1][0]);
+ ctrlset0(i, &dll_setting_800[CTRL0][0]);
+ ctrlset1(i, &dll_setting_800[CTRL1][0]);
+ ctrlset2(i, &dll_setting_800[CTRL2][0]);
+ ctrlset3(i, &dll_setting_800[CTRL3][0]);
+ cmdset(i, &dll_setting_800[CMD][0]);
+ }
+ }
+
+ // XXX if not async mode
+ MCHBAR16(0x180) = MCHBAR16(0x180) & ~0x8200;
+ MCHBAR8(0x180) = MCHBAR8(0x180) | 0x4;
+ j = 0;
+ for (i = 0; i < 16; i++) {
+ MCHBAR8(0x1c8) = (MCHBAR8(0x1c8) & ~0x1f) | i;
+ MCHBAR8(0x180) = MCHBAR8(0x180) | 0x10;
+ while (MCHBAR8(0x180) & 0x10);
+ if (MCHBAR32(0x184) == 0xffffffff) {
+ j++;
+ if (j >= 2)
+ break;
+
+ if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
+ j = 2;
+ break;
+ }
+ } else {
+ j = 0;
+ }
+ }
+ if (i == 1 || ((i == 0) && s->selected_timings.mem_clock == MEM_CLOCK_667MHz)) {
+ j = 0;
+ i++;
+ for (; i < 16; i++) {
+ MCHBAR8(0x1c8) = (MCHBAR8(0x1c8) & ~0x1f) | i;
+ MCHBAR8(0x180) = MCHBAR8(0x180) | 0x4;
+ while (MCHBAR8(0x180) & 0x10);
+ if (MCHBAR32(0x184) == 0) {
+ i++;
+ break;
+ }
+ }
+ for (; i < 16; i++) {
+ MCHBAR8(0x1c8) = (MCHBAR8(0x1c8) & ~0x1f) | i;
+ MCHBAR8(0x180) = MCHBAR8(0x180) | 0x10;
+ while (MCHBAR8(0x180) & 0x10);
+ if (MCHBAR32(0x184) == 0xffffffff) {
+ j++;
+ if (j >= 2)
+ break;
+ } else {
+ j = 0;
+ }
+ }
+ if (j < 2) {
+ MCHBAR8(0x1c8) = MCHBAR8(0x1c8) & ~0x1f;
+ MCHBAR8(0x180) = MCHBAR8(0x180) | 0x10;
+ while (MCHBAR8(0x180) & 0x10);
+ j = 2;
+ }
+ }
+
+ if (j < 2) {
+ MCHBAR8(0x1c8) = MCHBAR8(0x1c8) & ~0x1f;
+ async = 1;
+ }
+
+ clk = 0x1a;
+ if (async != 1) {
+ reg8 = MCHBAR8(0x188) & 0x1e;
+ if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz &&
+ s->selected_timings.fsb_clock == FSB_CLOCK_800MHz) {
+ clk = 0x10;
+ } else if (s->selected_timings.mem_clock == MEM_CLOCK_800MHz) {
+ clk = 0x10;
+ } else {
+ clk = 0x1a;
+ }
+ }
+ MCHBAR8(0x180) = MCHBAR8(0x180) & ~0x80;
+
+ if ((s->selected_timings.fsb_clock == FSB_CLOCK_800MHz) &&
+ (s->selected_timings.mem_clock == MEM_CLOCK_667MHz)) {
+ i = MCHBAR8(0x180) & 0xf;
+ i = (i + 10) % 14;
+ MCHBAR8(0x1c8) = (MCHBAR8(0x1c8) & ~0x1f) | i;
+ MCHBAR8(0x180) = MCHBAR8(0x180) | 0x10;
+ while(MCHBAR8(0x180) & 0x10);
+ }
+
+ reg8 = MCHBAR8(0x188) & ~1;
+ MCHBAR8(0x188) = reg8;
+ reg8 &= ~0x3e;
+ reg8 |= clk;
+ MCHBAR8(0x188) = reg8;
+ reg8 |= 1;
+ MCHBAR8(0x188) = reg8;
+
+ if (s->selected_timings.mem_clock == MEM_CLOCK_1333MHz) {
+ MCHBAR8(0x18c) = MCHBAR8(0x18c) | 1;
+ }
+
+ // Program DQ/DQS dll settings
+ reg32 = 0;
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
+ for (lane = 0; lane < 8; lane++) {
+ if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
+ reg32 = 0x06db7777;
+ } else if (s->selected_timings.mem_clock == MEM_CLOCK_800MHz) {
+ reg32 = 0x00007777;
+ }
+ MCHBAR32(0x400*i + 0x540 + lane*4) =
+ (MCHBAR32(0x400*i + 0x540 + lane*4) & 0x0fffffff) |
+ reg32;
+ }
+ }
+
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
+ if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
+ for (lane = 0; lane < 8; lane++) {
+ dqsset(i, lane, &dll_setting_667[DQS1+lane][0]);
+ }
+ for (lane = 0; lane < 8; lane++) {
+ dqset(i, lane, &dll_setting_667[DQ1+lane][0]);
+ }
+ } else {
+ for (lane = 0; lane < 8; lane++) {
+ dqsset(i, lane, &dll_setting_800[DQS1+lane][0]);
+ }
+ for (lane = 0; lane < 8; lane++) {
+ dqset(i, lane, &dll_setting_800[DQ1+lane][0]);
+ }
+ }
+ }
+}
+
+static void rcomp_ddr2(sysinfo_t *s)
+{
+ u8 i, j, k;
+ u32 x32a[8] = { 0x04040404, 0x06050505, 0x09090807, 0x0D0C0B0A, 0x04040404, 0x08070605, 0x0C0B0A09, 0x100F0E0D };
+ u16 x378[6] = { 0, 0xAAAA, 0x7777, 0x7777, 0x7777, 0x7777 };
+ u32 x382[6] = { 0, 0x02020202, 0x02020202, 0x02020202, 0x04030303, 0x04030303 };
+ u32 x386[6] = { 0, 0x03020202, 0x03020202, 0x03020202, 0x05040404, 0x05040404 };
+ u32 x38a[6] = { 0, 0x04040303, 0x04040303, 0x04040303, 0x07070605, 0x07070605 };
+ u32 x38e[6] = { 0, 0x06060505, 0x06060505, 0x06060505, 0x09090808, 0x09090808 };
+ u32 x392[6] = { 0, 0x02020202, 0x02020202, 0x02020202, 0x03030202, 0x03030202 };
+ u32 x396[6] = { 0, 0x03030202, 0x03030202, 0x03030202, 0x05040303, 0x05040303 };
+ u32 x39a[6] = { 0, 0x04040403, 0x04040403, 0x04040403, 0x07070605, 0x07070605 };
+ u32 x39e[6] = { 0, 0x06060505, 0x06060505, 0x06060505, 0x08080808, 0x08080808 };
+ u16 addr[6] = { 0x31c, 0x374, 0x3a2, 0x3d0, 0x3fe, 0x42c };
+ u8 bit[6] = { 0, 0, 1, 1, 0, 0 };
+
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
+ for (j = 0; j < 6; j++) {
+ if (j == 0) {
+ MCHBAR32(0x400*i + addr[j]) =
+ (MCHBAR32(0x400*i + addr[j]) & ~0xff000) | 0xaa000;
+ MCHBAR16(0x400*i + 0x320) = (MCHBAR16(0x400*i + 0x320) & ~0xffff) | 0x6666;
+ for (k = 0; k < 8; k++) {
+ MCHBAR32(0x400*i + addr[j] + 0xe + (k << 2)) =
+ (MCHBAR32(0x400*i + addr[j] + 0xe + (k << 2)) & ~0x3f3f3f3f) | x32a[k];
+ MCHBAR32(0x400*i + addr[j] + 0x2e + (k << 2)) =
+ (MCHBAR32(0x400*i + addr[j] + 0x2e + (k << 2)) & ~0x3f3f3f3f) | x32a[k];
+ }
+ } else {
+ MCHBAR16(0x400*i + addr[j]) = (MCHBAR16(0x400*i + addr[j]) & ~0xf000) | 0xa000;
+ MCHBAR16(0x400*i + addr[j] + 4) = (MCHBAR16(0x400*i + addr[j] + 4) & ~0xffff) |
+ x378[j];
+ MCHBAR32(0x400*i + addr[j] + 0xe) =
+ (MCHBAR32(0x400*i + addr[j] + 0xe) & ~0x3f3f3f3f) | x382[j];
+ MCHBAR32(0x400*i + addr[j] + 0x12) =
+ (MCHBAR32(0x400*i + addr[j] + 0x12) & ~0x3f3f3f3f) | x386[j];
+ MCHBAR32(0x400*i + addr[j] + 0x16) =
+ (MCHBAR32(0x400*i + addr[j] + 0x16) & ~0x3f3f3f3f) | x38a[j];
+ MCHBAR32(0x400*i + addr[j] + 0x1a) =
+ (MCHBAR32(0x400*i + addr[j] + 0x1a) & ~0x3f3f3f3f) | x38e[j];
+ MCHBAR32(0x400*i + addr[j] + 0x1e) =
+ (MCHBAR32(0x400*i + addr[j] + 0x1e) & ~0x3f3f3f3f) | x392[j];
+ MCHBAR32(0x400*i + addr[j] + 0x22) =
+ (MCHBAR32(0x400*i + addr[j] + 0x22) & ~0x3f3f3f3f) | x396[j];
+ MCHBAR32(0x400*i + addr[j] + 0x26) =
+ (MCHBAR32(0x400*i + addr[j] + 0x26) & ~0x3f3f3f3f) | x39a[j];
+ MCHBAR32(0x400*i + addr[j] + 0x2a) =
+ (MCHBAR32(0x400*i + addr[j] + 0x2a) & ~0x3f3f3f3f) | x39e[j];
+ }
+ MCHBAR8(0x400*i + addr[j]) = (MCHBAR8(0x400*i + addr[j]) & ~1) | bit[j];
+ }
+ MCHBAR8(0x400*i + 0x45a) = (MCHBAR8(0x400*i + 0x45a) & ~0x3f) | 0x12;
+ MCHBAR8(0x400*i + 0x45e) = (MCHBAR8(0x400*i + 0x45e) & ~0x3f) | 0x12;
+ MCHBAR8(0x400*i + 0x462) = (MCHBAR8(0x400*i + 0x462) & ~0x3f) | 0x12;
+ MCHBAR8(0x400*i + 0x466) = (MCHBAR8(0x400*i + 0x466) & ~0x3f) | 0x12;
+ } // END EACH POPULATED CHANNEL
+
+ MCHBAR32(0x134) = (MCHBAR32(0x134) & ~0x63c00) | 0x63c00;
+ MCHBAR16(0x174) = (MCHBAR16(0x174) & ~0x63ff) | 0x63ff;
+ MCHBAR16(0x178) = 0x0135;
+ MCHBAR32(0x130) = (MCHBAR32(0x130) & ~0x7bdffe0) | 0x7a9ffa0;
+
+ if (!CHANNEL_IS_POPULATED(s->dimms, 0)) {
+ MCHBAR32(0x130) = MCHBAR32(0x130) & ~(1 << 27);
+ }
+ if (!CHANNEL_IS_POPULATED(s->dimms, 1)) {
+ MCHBAR32(0x130) = MCHBAR32(0x130) & ~(1 << 28);
+ }
+
+ MCHBAR8(0x130) = MCHBAR8(0x130) | 1;
+}
+
+static void odt_ddr2(sysinfo_t *s)
+{
+ u8 i;
+ u16 odt[16][2] = {
+ { 0x0000,0x0000 }, // NC_NC
+ { 0x0000,0x0001 }, // x8SS_NC
+ { 0x0000,0x0011 }, // x8DS_NC
+ { 0x0000,0x0001 }, // x16SS_NC
+ { 0x0004,0x0000 }, // NC_x8SS
+ { 0x0101,0x0404 }, // x8SS_x8SS
+ { 0x0101,0x4444 }, // x8DS_x8SS
+ { 0x0101,0x0404 }, // x16SS_x8SS
+ { 0x0044,0x0000 }, // NC_x8DS
+ { 0x1111,0x0404 }, // x8SS_x8DS
+ { 0x1111,0x4444 }, // x8DS_x8DS
+ { 0x1111,0x0404 }, // x16SS_x8DS
+ { 0x0004,0x0000 }, // NC_x16SS
+ { 0x0101,0x0404 }, // x8SS_x16SS
+ { 0x0101,0x4444 }, // x8DS_x16SS
+ { 0x0101,0x0404 }, // x16SS_x16SS
+ };
+
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, i) {
+ MCHBAR16(0x400*i + 0x298) = odt[s->dimm_config[i]][1];
+ MCHBAR16(0x400*i + 0x294) = odt[s->dimm_config[i]][0];
+ MCHBAR16(0x400*i + 0x29c) = (MCHBAR16(0x400*i + 0x29c) & ~0xfff) | 0x66b;
+ MCHBAR32(0x400*i + 0x260) = (MCHBAR32(0x400*i + 0x260) & ~0x70e3c00) | 0x3063c00;
+ }
+}
+
+static void dojedec_ddr2(u8 r, u8 ch, u8 cmd, u16 val)
+{
+ u32 addr = (ch << 29) | (r*0x08000000);
+ volatile u32 rubbish;
+
+ MCHBAR8(0x271) = (MCHBAR8(0x271) & ~0x3e) | cmd;
+ MCHBAR8(0x671) = (MCHBAR8(0x671) & ~0x3e) | cmd;
+ rubbish = read32((void*)((val<<3) | addr));
+ microdelay(10);
+ MCHBAR8(0x271) = (MCHBAR8(0x271) & ~0x3e) | NORMALOP_CMD;
+ MCHBAR8(0x671) = (MCHBAR8(0x671) & ~0x3e) | NORMALOP_CMD;
+}
+
+static void jedec_ddr2(sysinfo_t *s)
+{
+ u8 i;
+ u16 mrsval, ch, r, v;
+
+ u8 odt[16][4] = {
+ {0x00, 0x00, 0x00, 0x00},
+ {0x01, 0x00, 0x00, 0x00},
+ {0x01, 0x01, 0x00, 0x00},
+ {0x01, 0x00, 0x00, 0x00},
+ {0x00, 0x00, 0x01, 0x00},
+ {0x11, 0x00, 0x11, 0x00},
+ {0x11, 0x11, 0x11, 0x00},
+ {0x11, 0x00, 0x11, 0x00},
+ {0x00, 0x00, 0x01, 0x01},
+ {0x11, 0x00, 0x11, 0x11},
+ {0x11, 0x11, 0x11, 0x11},
+ {0x11, 0x00, 0x11, 0x11},
+ {0x00, 0x00, 0x01, 0x00},
+ {0x11, 0x00, 0x11, 0x00},
+ {0x11, 0x11, 0x11, 0x00},
+ {0x11, 0x00, 0x11, 0x00}
+ };
+
+ u16 jedec[12][2] = {
+ {NOP_CMD, 0x0},
+ {PRECHARGE_CMD, 0x0},
+ {EMRS2_CMD, 0x0},
+ {EMRS3_CMD, 0x0},
+ {EMRS1_CMD, 0x0},
+ {MRS_CMD, 0x100}, // DLL Reset
+ {PRECHARGE_CMD, 0x0},
+ {CBR_CMD, 0x0},
+ {CBR_CMD, 0x0},
+ {MRS_CMD, 0x0}, // DLL out of reset
+ {EMRS1_CMD, 0x380}, // OCD calib default
+ {EMRS1_CMD, 0x0}
+ };
+
+ mrsval = (s->selected_timings.CAS << 4) | ((s->selected_timings.tWR - 1) << 9) | 0xb;
+
+ PRINTK_DEBUG("MRS...\n");
+
+ microdelay(200);
+
+ FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
+ PRINTK_DEBUG("CH%d: Found Rank %d\n", ch, r);
+ for (i = 0; i < 12; i++) {
+ v = jedec[i][1];
+ switch (jedec[i][0]) {
+ case EMRS1_CMD:
+ v |= (odt[s->dimm_config[ch]][r] << 2);
+ break;
+ case MRS_CMD:
+ v |= mrsval;
+ break;
+ default:
+ break;
+ }
+ dojedec_ddr2(r + ch*4, ch, jedec[i][0], v);
+ microdelay(1);
+ //PRINTK_DEBUG("Jedec step %d\n", i);
+ }
+ }
+ PRINTK_DEBUG("MRS done\n");
+}
+
+static u8 sampledqs(u16 mchloc, u32 addr, u8 hilow, u8 repeat)
+{
+ u8 dqsmatch = 1;
+ volatile u32 strobe;
+
+ while (repeat-- > 0) {
+ MCHBAR8(0x5d8) = MCHBAR8(0x5d8) & ~0x2;
+ microdelay(2);
+ MCHBAR8(0x5d8) = MCHBAR8(0x5d8) | 0x2;
+ microdelay(2);
+ MCHBAR8(0x9d8) = MCHBAR8(0x9d8) & ~0x2;
+ microdelay(2);
+ MCHBAR8(0x9d8) = MCHBAR8(0x9d8) | 0x2;
+ microdelay(2);
+ barrier();
+ strobe = read32((u32 *)addr);
+ barrier();
+ if (((MCHBAR32(mchloc) & 0x40) >> 6) != hilow) {
+ dqsmatch = 0;
+ }
+ }
+ return dqsmatch;
+}
+
+static void rcven_ddr2(sysinfo_t *s)
+{
+ u8 i, reg8, ch, lane;
+ u32 addr;
+ u8 tap = 0;
+ u8 savecc, savemedium, savetap, coarsecommon, medium;
+ u8 lanecoarse[8] = {0};
+ u8 mincoarse = 0xff;
+ u8 pitap[2][8];
+ u16 coarsectrl[2];
+ u16 coarsedelay[2];
+ u16 mediumphase[2];
+ u16 readdelay[2];
+ u16 mchbar;
+ MCHBAR8(0x5d8) = MCHBAR8(0x5d8) & ~0xc;
+ MCHBAR8(0x9d8) = MCHBAR8(0x9d8) & ~0xc;
+ MCHBAR8(0x5dc) = MCHBAR8(0x5dc) & ~0x80;
+
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, ch) {
+ addr = (ch << 29);
+ for (i = 0; !RANK_IS_POPULATED(s->dimms, ch, i); i++) {
+ addr += 128*1024*1024;
+ }
+ for (lane = 0; lane < 8; lane++) {
+ PRINTK_DEBUG("Channel %d, Lane %d addr=0x%08x\n", ch, lane, addr);
+//trylaneagain:
+ coarsecommon = (s->selected_timings.CAS - 1);
+ switch (lane) {
+ case 0: case 1: medium = 0; break;
+ case 2: case 3: medium = 1; break;
+ case 4: case 5: medium = 2; break;
+ case 6: case 7: medium = 3; break;
+ default: medium = 0; break;
+ }
+ mchbar = 0x400*ch + 0x561 + (lane << 2);
+ tap = 0;
+ MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) & ~0xf0000) |
+ (coarsecommon << 16);
+ MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) & ~(3 << (lane*2))) |
+ (medium << (lane*2));
+ MCHBAR8(0x400*ch + 0x560 + lane*4) = MCHBAR8(0x400*ch + 0x560 + lane*4) & ~0xf;
+ MCHBAR8(0x400*ch + 0x560 + lane*4) = MCHBAR8(0x400*ch + 0x560 + lane*4) & ~0x70;
+ savecc = coarsecommon;
+ savemedium = medium;
+ savetap = 0;
+
+ MCHBAR16(0x400*ch + 0x588) = (MCHBAR16(0x400*ch + 0x588) & ~(3 << (lane*2))) |
+ (1 << (lane*2));
+
+ PRINTK_VERBOSE("rcven 0.1 coarse=%d\n", coarsecommon);
+ while (sampledqs(mchbar, addr, 1, 1) == 1) {
+ if (medium < 3) {
+ medium++;
+ MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
+ ~(3 << (lane*2))) | (medium << (lane*2));
+ } else {
+ medium = 0;
+ coarsecommon++;
+ MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) &
+ ~0xf0000) | (coarsecommon << 16);
+ MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
+ ~(3 << (lane*2))) | (medium << (lane*2));
+ }
+ if (coarsecommon > 16) {
+ die("Coarse > 16: DQS tuning failed, halt\n");
+ break;
+ }
+ }
+ PRINTK_VERBOSE(" GOT IT (high -> low transition) coarse=%d medium=%d\n", coarsecommon, medium);
+
+ savemedium = medium;
+ savecc = coarsecommon;
+ if (medium < 3) {
+ medium++;
+ MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
+ ~(3 << (lane*2))) | (medium << (lane*2));
+ } else {
+ medium = 0;
+ coarsecommon++;
+
+ MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) & ~0xf0000) |
+ (coarsecommon << 16);
+ MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) & ~(3 << (lane*2))) |
+ (medium << (lane*2));
+ }
+
+ PRINTK_VERBOSE("rcven 0.2\n");
+ while (sampledqs(mchbar, addr, 0, 1) == 1) {
+ savemedium = medium;
+ savecc = coarsecommon;
+ if (medium < 3) {
+ medium++;
+ MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
+ ~(3 << (lane*2))) | (medium << (lane*2));
+ } else {
+ medium = 0;
+ coarsecommon++;
+ MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) &
+ ~0xf0000) | (coarsecommon << 16);
+ MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
+ ~(3 << (lane*2))) | (medium << (lane*2));
+ }
+ if (coarsecommon > 16) {
+ die("Coarse DQS tuning 2 failed, halt\n");
+ break;
+ }
+ }
+ PRINTK_VERBOSE(" GOT IT (low -> high transition) coarse=%d medium=%d\n", coarsecommon, medium);
+
+
+ coarsecommon = savecc;
+ medium = savemedium;
+ MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) &
+ ~0xf0000) | (coarsecommon << 16);
+ MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
+ ~(3 << (lane*2))) | (medium << (lane*2));
+
+ PRINTK_VERBOSE("rcven 0.3\n");
+ tap = 0;
+ while (sampledqs(mchbar, addr, 1, 1) == 0) {
+ savetap = tap;
+ tap++;
+ if (tap > 14) {
+ break;
+ }
+ MCHBAR8(0x400*ch + 0x560 + (lane*4)) =
+ (MCHBAR8(0x400*ch + 0x560 + (lane*4)) & ~0xf) | tap;
+ }
+
+ tap = savetap;
+ MCHBAR8(0x400*ch + 0x560 + (lane*4)) =
+ (MCHBAR8(0x400*ch + 0x560 + (lane*4)) & ~0xf) | tap;
+ MCHBAR8(0x400*ch + 0x560 + (lane*4)) =
+ (MCHBAR8(0x400*ch + 0x560 + (lane*4)) & ~0x70) | 0x30;
+ if (medium < 3) {
+ medium++;
+ MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
+ ~(3 << (lane*2))) | (medium << (lane*2));
+ } else {
+ medium = 0;
+ coarsecommon++;
+ MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) &
+ ~0xf0000) | (coarsecommon << 16);
+ MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
+ ~(3 << (lane*2))) | (medium << (lane*2));
+ }
+ if (sampledqs(mchbar, addr, 1, 1) == 0) {
+ die("Not at DQS high, doh\n");
+ }
+
+ PRINTK_VERBOSE("rcven 0.4\n");
+ while (sampledqs(mchbar, addr, 1, 1) == 1) {
+ coarsecommon--;
+ MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) &
+ ~0xf0000) | (coarsecommon << 16);
+ if (coarsecommon == 0) {
+ die("Couldn't find DQS-high 0 indicator, halt\n");
+ break;
+ }
+ }
+ PRINTK_VERBOSE(" GOT IT (high -> low transition) coarse=%d medium=%d\n", coarsecommon, medium);
+
+ PRINTK_VERBOSE("rcven 0.5\n");
+ while (sampledqs(mchbar, addr, 0, 1) == 1) {
+ savemedium = medium;
+ savecc = coarsecommon;
+ if (medium < 3) {
+ medium++;
+ MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
+ ~(3 << (lane*2))) | (medium << (lane*2));
+ } else {
+ medium = 0;
+ coarsecommon++;
+ MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) &
+ ~0xf0000) | (coarsecommon << 16);
+ MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
+ ~(3 << (lane*2))) | (medium << (lane*2));
+ }
+ if (coarsecommon > 16) {
+ die("Coarse DQS tuning 5 failed, halt\n");
+ break;
+ }
+ }
+ PRINTK_VERBOSE(" GOT IT (low -> high transition) coarse=%d medium=%d\n", coarsecommon, medium);
+
+ PRINTK_VERBOSE("rcven 0.6\n");
+ coarsecommon = savecc;
+ medium = savemedium;
+ MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) &
+ ~0xf0000) | (coarsecommon << 16);
+ MCHBAR16(0x400*ch + 0x58c) = (MCHBAR16(0x400*ch + 0x58c) &
+ ~(3 << (lane*2))) | (medium << (lane*2));
+ while (sampledqs(mchbar, addr, 1, 1) == 0) {
+ savetap = tap;
+ tap++;
+ if (tap > 14) {
+ break;
+ }
+ MCHBAR8(0x400*ch + 0x560 + lane*4) =
+ (MCHBAR8(0x400*ch + 0x560 + lane*4) & ~0xf) | tap;
+ }
+ tap = savetap;
+ MCHBAR8(0x400*ch + 0x560 + lane*4) =
+ (MCHBAR8(0x400*ch + 0x560 + lane*4) & ~0xf) | tap;
+ MCHBAR8(0x400*ch + 0x560 + lane*4) =
+ (MCHBAR8(0x400*ch + 0x560 + lane*4) & ~0x70) | 0x70;
+
+ pitap[ch][lane] = 0x70 | tap;
+
+ MCHBAR16(0x400*ch + 0x588) = MCHBAR16(0x400*ch + 0x588) & ~(3 << (lane*2));
+ lanecoarse[lane] = coarsecommon;
+ PRINTK_VERBOSE("rcven 0.7\n");
+ } // END EACH LANE
+
+ // Find minimum coarse value
+ for (lane = 0; lane < 8; lane++) {
+ if (mincoarse > lanecoarse[lane]) {
+ mincoarse = lanecoarse[lane];
+ }
+ }
+
+ PRINTK_DEBUG("Found min coarse value = %d\n", mincoarse);
+
+ for (lane = 0; lane < 8; lane++) {
+ reg8 = (lanecoarse[lane] == 0) ? 0 : lanecoarse[lane] - mincoarse;
+ MCHBAR16(0x400*ch + 0x5fa) = (MCHBAR16(0x400*ch + 0x5fa) & ~(3 << (lane*2))) |
+ (reg8 << (lane*2));
+ }
+ MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) & ~0xf0000) | (mincoarse << 16);
+ coarsectrl[ch] = mincoarse;
+ coarsedelay[ch] = MCHBAR16(0x400*ch + 0x5fa);
+ mediumphase[ch] = MCHBAR16(0x400*ch + 0x58c);
+ readdelay[ch] = MCHBAR16(0x400*ch + 0x588);
+ } // END EACH POPULATED CHANNEL
+
+/* Resume support */
+ FOR_EACH_CHANNEL(ch) {
+ for (lane = 0; lane < 8; lane++) {
+ MCHBAR8(0x400*ch + 0x560 + (lane*4)) =
+ (MCHBAR8(0x400*ch + 0x560 + (lane*4)) & ~0xf) | pitap[ch][lane];
+ }
+ MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) & ~0xf0000) |
+ (coarsectrl[ch] << 16);
+ MCHBAR16(0x400*ch + 0x5fa) = coarsedelay[ch];
+ MCHBAR16(0x400*ch + 0x58c) = mediumphase[ch];
+ }
+ PRINTK_DEBUG("End rcven\n");
+}
+
+static void dradrb_ddr2(sysinfo_t *s)
+{
+ u8 map, i, ch, r, rankpop0, rankpop1;
+ u32 c0dra = 0;
+ u32 c1dra = 0;
+ u32 c0drb = 0;
+ u32 c1drb = 0;
+ u32 dra;
+ u32 dra0;
+ u32 dra1;
+ u16 totalmemorymb;
+ u16 size, offset;
+ u8 dratab[2][2][2][4] = {
+ {
+ {
+ {0xff, 0xff, 0xff, 0xff},
+ {0xff, 0x00, 0x02, 0xff}
+ },
+ {
+ {0xff, 0x01, 0xff, 0xff},
+ {0xff, 0x03, 0xff, 0xff}
+ }
+ },
+ {
+ {
+ {0xff, 0xff, 0xff, 0xff},
+ {0xff, 0x04, 0x06, 0x08}
+ },
+ {
+ {0xff, 0xff, 0xff, 0xff},
+ {0x05, 0x07, 0x09, 0xff}
+ }
+ }
+ };
+
+ u8 drbtab[10] = {0x04, 0x02, 0x08, 0x04, 0x08, 0x04, 0x10, 0x08, 0x20, 0x10};
+
+ // DRA
+ rankpop0 = 0;
+ rankpop1 = 0;
+ FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
+ if ((s->dimms[ch<<1].card_type && ((r) < s->dimms[ch<<1].ranks))) {
+ i = ch << 1;
+ } else {
+ i = (ch << 1) + 1;
+ }
+ dra = dratab[s->dimms[i].banks]
+ [s->dimms[i].width]
+ [s->dimms[i].cols-9]
+ [s->dimms[i].rows-12];
+ if (s->dimms[i].banks == 1) {
+ dra |= 0x80;
+ }
+ if (ch == 0) {
+ c0dra |= dra << (r*8);
+ rankpop0 |= 1 << r;
+ } else {
+ c1dra |= dra << (r*8);
+ rankpop1 |= 1 << r;
+ }
+ }
+ MCHBAR32(0x208) = c0dra;
+ MCHBAR32(0x608) = c1dra;
+
+ MCHBAR8(0x262) = (MCHBAR8(0x262) & ~0xf0) | ((rankpop0 << 4) & 0xf0);
+ MCHBAR8(0x662) = (MCHBAR8(0x662) & ~0xf0) | ((rankpop1 << 4) & 0xf0);
+
+ if (ONLY_DIMMA_IS_POPULATED(s->dimms, 0) || ONLY_DIMMB_IS_POPULATED(s->dimms, 0)) {
+ MCHBAR8(0x260) = MCHBAR8(0x260) | 1;
+ }
+ if (ONLY_DIMMA_IS_POPULATED(s->dimms, 1) || ONLY_DIMMB_IS_POPULATED(s->dimms, 1)) {
+ MCHBAR8(0x660) = MCHBAR8(0x660) | 1;
+ }
+
+ // DRB
+ FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
+ if ((s->dimms[ch<<1].card_type && ((r) < s->dimms[ch<<1].ranks))) {
+ i = ch << 1;
+ } else {
+ i = (ch << 1) + 1;
+ }
+ if (ch == 0) {
+ dra0 = (c0dra >> (8*r)) & 0x7f;
+ c0drb = (u16)(c0drb + drbtab[dra0]);
+ s->dimms[i].rank_capacity_mb = drbtab[dra0] << 6;
+ MCHBAR16(0x200 + 2*r) = c0drb;
+ } else {
+ dra1 = (c1dra >> (8*r)) & 0x7f;
+ c1drb = (u16)(c1drb + drbtab[dra1]);
+ s->dimms[i].rank_capacity_mb = drbtab[dra1] << 6;
+ MCHBAR16(0x600 + 2*r) = c1drb;
+ }
+ }
+
+ s->channel_capacity[0] = c0drb << 6;
+ s->channel_capacity[1] = c1drb << 6;
+ totalmemorymb = s->channel_capacity[0] + s->channel_capacity[1];
+ PRINTK_DEBUG("Total memory: %d + %d = %dMiB\n",
+ s->channel_capacity[0], s->channel_capacity[1], totalmemorymb);
+
+ rankpop1 >>= 4;
+ if (rankpop1) {
+ MCHBAR16(0x600 + 2*msbpos(rankpop1)) = c0drb + c1drb;
+ MCHBAR16(0x602 + 2*msbpos(rankpop1)) = c0drb + c1drb;
+ MCHBAR16(0x604 + 2*msbpos(rankpop1)) = c0drb + c1drb;
+ MCHBAR16(0x606 + 2*msbpos(rankpop1)) = c0drb + c1drb;
+ }
+
+ MCHBAR8(0x111) = MCHBAR8(0x111) | 0x2;
+ MCHBAR16(0x104) = 0;
+ size = s->channel_capacity[0] + s->channel_capacity[1];
+ MCHBAR16(0x102) = size;
+ map = 0;
+ if (s->channel_capacity[0] == 0) {
+ map = 0;
+ } else if (s->channel_capacity[1] == 0) {
+ map |= 0x20;
+ } else {
+ map |= 0x40;
+ }
+ map |= 0x18;
+ if (s->channel_capacity[0] <= s->channel_capacity[1]) {
+ map |= 0x5;
+ } else if (s->channel_capacity[0] > s->channel_capacity[1]) {
+ map |= 0x4;
+ }
+ MCHBAR8(0x110) = map;
+ MCHBAR16(0x10e) = 0;
+ if (s->channel_capacity[1] != 0) {
+ offset = 0;
+ } else if (s->channel_capacity[0] > s->channel_capacity[1]) {
+ offset = size;
+ } else {
+ offset = 0;
+ }
+ MCHBAR16(0x108) = offset;
+ MCHBAR16(0x10a) = 0;
+}
+
+static void mmap_ddr2(sysinfo_t *s)
+{
+ u32 gfxsize, gttsize, tsegsize, mmiosize, tom, tolud, touud, gfxbase, gttbase, tsegbase;
+ u16 ggc;
+ u16 ggc2uma[14] = { 0, 0, 0, 0, 0, 32, 48, 64, 128, 256, 96, 160, 224, 352 };
+ u8 ggc2gtt[12] = { 0, 1, 0, 2, 0, 0, 0, 0, 0, 2, 3, 4};
+
+ ggc = pci_read_config16(PCI_DEV(0,0,0), 0x52);
+ gfxsize = ggc2uma[(ggc & 0xf0) >> 4];
+ gttsize = ggc2gtt[(ggc & 0xf00) >> 8];
+ tsegsize = 0; // 1MB TSEG
+ mmiosize = 0x400; // 1GB MMIO
+ tom = s->channel_capacity[0] + s->channel_capacity[1];
+ tolud = min(0x1000 - mmiosize, tom);
+ touud = tom;
+ gfxbase = tolud - gfxsize;
+ gttbase = gfxbase - gttsize;
+ tsegbase = gttbase - tsegsize;
+
+ pci_write_config16(PCI_DEV(0,0,0), 0xb0, tolud << 4);
+ pci_write_config16(PCI_DEV(0,0,0), 0xa0, tom >> 6);
+ pci_write_config16(PCI_DEV(0,0,0), 0xa2, touud);
+ pci_write_config32(PCI_DEV(0,0,0), 0xa4, gfxbase << 20);
+ pci_write_config32(PCI_DEV(0,0,0), 0xa8, gttbase << 20);
+ pci_write_config32(PCI_DEV(0,0,0), 0xac, tsegbase << 20);
+}
+
+static void enhanced_ddr2(sysinfo_t *s)
+{
+ u8 ch, reg8;
+
+ MCHBAR32(0xfb0) = 0x1000d024;
+ MCHBAR32(0xfb4) = 0xc842;
+ MCHBAR32(0xfbc) = 0xf;
+ MCHBAR32(0xfc4) = 0xfe22244;
+ MCHBAR8(0x12f) = 0x5c;
+ MCHBAR8(0xfb0) = (MCHBAR8(0xfb0) & ~1) | 1;
+ MCHBAR8(0x12f) = MCHBAR8(0x12f) | 0x2;
+ MCHBAR8(0x6c0) = (MCHBAR8(0x6c0) & ~0xf0) | 0xa0;
+ MCHBAR32(0xfa8) = 0x30d400;
+
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, ch) {
+ MCHBAR8(0x400*ch + 0x26c) = MCHBAR8(0x400*ch + 0x26c) | 1;
+ MCHBAR32(0x400*ch + 0x278) = 0x88141881;
+ MCHBAR16(0x400*ch + 0x27c) = 0x0041;
+ MCHBAR8(0x400*ch + 0x292) = 0xf2;
+ MCHBAR16(0x400*ch + 0x272) = MCHBAR16(0x400*ch + 0x272) | 0x100;
+ MCHBAR8(0x400*ch + 0x243) = (MCHBAR8(0x400*ch + 0x243) & ~0x2) | 1;
+ MCHBAR32(0x400*ch + 0x288) = 0x8040200;
+ MCHBAR32(0x400*ch + 0x28c) = 0xff402010;
+ MCHBAR32(0x400*ch + 0x290) = 0x4f2091c;
+ }
+
+ reg8 = pci_read_config8(PCI_DEV(0,0,0), 0xf0);
+ pci_write_config8(PCI_DEV(0,0,0), 0xf0, reg8 | 1);
+ MCHBAR32(0xfa0) = (MCHBAR32(0xfa0) & ~0x20002) | 0x2;
+ MCHBAR32(0xfa4) = (MCHBAR32(0xfa4) & ~0x219100c3) | 0x219100c2;
+ MCHBAR32(0x2c) = 0x44a53;
+ MCHBAR32(0x30) = 0x1f5a86;
+ MCHBAR32(0x34) = 0x1902810;
+ MCHBAR32(0x38) = 0xf7000000;
+ MCHBAR32(0x3c) = 0x23014410;
+ MCHBAR32(0x40) = (MCHBAR32(0x40) & ~0x8f038000) | 0x8f038000;
+ MCHBAR32(0x20) = 0x33001;
+ pci_write_config8(PCI_DEV(0,0,0), 0xf0, reg8 & ~1);
+}
+
+static void power_ddr2(sysinfo_t *s)
+{
+ u32 reg1, reg2, reg3, reg4, clkgate, x592;
+ u8 lane, ch;
+ u8 twl = 0;
+ u16 x264, x23c;
+
+ twl = s->selected_timings.CAS - 1;
+ x264 = 0x78;
+ switch (s->selected_timings.mem_clock) {
+ default:
+ case MEM_CLOCK_667MHz:
+ reg1 = 0x99;
+ reg2 = 0x1048a9;
+ clkgate = 0x230000;
+ x23c = 0x7a89;
+ break;
+ case MEM_CLOCK_800MHz:
+ if (s->selected_timings.CAS == 5) {
+ reg1 = 0x19a;
+ reg2 = 0x1048aa;
+ } else {
+ reg1 = 0x9a;
+ reg2 = 0x2158aa;
+ x264 = 0x89;
+ }
+ clkgate = 0x280000;
+ x23c = 0x7b89;
+ break;
+ }
+ reg3 = 0x232;
+ reg4 = 0x2864;
+
+ if (CHANNEL_IS_POPULATED(s->dimms, 0) && CHANNEL_IS_POPULATED(s->dimms, 1)) {
+ MCHBAR32(0x14) = 0x0010461f;
+ } else {
+ MCHBAR32(0x14) = 0x0010691f;
+ }
+ MCHBAR32(0x18) = 0xdf6437f7;
+ MCHBAR32(0x1c) = 0x0;
+ MCHBAR32(0x24) = (MCHBAR32(0x24) & ~0xe0000000) | 0x30000000;
+ MCHBAR32(0x44) = (MCHBAR32(0x44) & ~0x1fef0000) | 0x6b0000;
+ MCHBAR16(0x115) = (u16) reg1;
+ MCHBAR32(0x117) = (MCHBAR32(0x117) & ~0xffffff) | reg2;
+ MCHBAR8(0x124) = 0x7;
+ MCHBAR16(0x12a) = (MCHBAR16(0x12a) & 0) | 0x80;
+ MCHBAR8(0x12c) = (MCHBAR8(0x12c) & 0) | 0xa0;
+ MCHBAR16(0x174) = MCHBAR16(0x174) & ~(1 << 15);
+ MCHBAR16(0x188) = (MCHBAR16(0x188) & ~0x1f00) | 0x1f00;
+ MCHBAR8(0x18c) = MCHBAR8(0x18c) & ~0x8;
+ MCHBAR8(0x192) = (MCHBAR8(0x192) & ~1) | 1;
+ MCHBAR8(0x193) = (MCHBAR8(0x193) & ~0xf) | 0xf;
+ MCHBAR16(0x1b4) = (MCHBAR16(0x1b4) & ~0x480) | 0x80;
+ MCHBAR16(0x210) = (MCHBAR16(0x210) & ~0x1fff) | 0x3f; // | clockgatingiii
+ MCHBAR32(0x6d1) = (MCHBAR32(0x6d1) & ~0xff03ff) | 0x100 | clkgate;
+ MCHBAR8(0x212) = (MCHBAR8(0x212) & ~0x7f) | 0x7f;
+ MCHBAR32(0x2c0) = (MCHBAR32(0x2c0) & ~0xffff0) | 0xcc5f0;
+ MCHBAR8(0x2c4) = (MCHBAR8(0x2c4) & ~0x70) | 0x70;
+ MCHBAR32(0x2d1) = (MCHBAR32(0x2d1) & ~0xffffff) | 0xff2831; // | clockgatingi
+ MCHBAR32(0x2d4) = 0x40453600;
+ MCHBAR32(0x300) = 0xc0b0a08;
+ MCHBAR32(0x304) = 0x6040201;
+ MCHBAR32(0x30c) = (MCHBAR32(0x30c) & ~0x43c0f) | 0x41405;
+ MCHBAR16(0x610) = 0x232;
+ MCHBAR16(0x612) = 0x2864;
+ MCHBAR32(0x62c) = (MCHBAR32(0x62c) & ~0xc000000) | 0x4000000;
+ MCHBAR32(0xae4) = 0;
+ MCHBAR32(0xc00) = (MCHBAR32(0xc00) & ~0xf0000) | 0x10000;
+ MCHBAR32(0xf00) = 0x393a3b3c;
+ MCHBAR32(0xf04) = 0x3d3e3f40;
+ MCHBAR32(0xf08) = 0x393a3b3c;
+ MCHBAR32(0xf0c) = 0x3d3e3f40;
+ MCHBAR32(0xf18) = MCHBAR32(0xf18) & ~0xfff00001;
+ MCHBAR32(0xf48) = 0xfff0ffe0;
+ MCHBAR32(0xf4c) = 0xffc0ff00;
+ MCHBAR32(0xf50) = 0xfc00f000;
+ MCHBAR32(0xf54) = 0xc0008000;
+ MCHBAR32(0xf6c) = (MCHBAR32(0xf6c) & ~0xffff0000) | 0xffff0000;
+ MCHBAR32(0xfac) = MCHBAR32(0xfac) & ~0x80000000;
+ MCHBAR32(0xfb8) = MCHBAR32(0xfb8) & ~0xff000000;
+ MCHBAR32(0xfbc) = (MCHBAR32(0xfbc) & ~0x7f800) | 0xf000;
+ MCHBAR32(0x1104) = 0x3003232;
+ MCHBAR32(0x1108) = 0x74;
+ if (s->selected_timings.fsb_clock == FSB_CLOCK_800MHz) {
+ MCHBAR32(0x110c) = 0xaa;
+ } else {
+ MCHBAR32(0x110c) = 0x100;
+ }
+ MCHBAR32(0x1110) = 0x10810350 & ~0x78;
+ MCHBAR32(0x1114) = 0;
+ if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
+ twl = 5;
+ } else {
+ twl = 6;
+ }
+ x592 = 0xff;
+ if (pci_read_config8(PCI_DEV(0,0,0), 0x8) < 3) {
+ x592 = ~0x4;
+ }
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, ch) {
+ MCHBAR8(0x400*ch + 0x239) = twl + 15;
+ MCHBAR16(0x400*ch + 0x23c) = x23c;
+ MCHBAR32(0x400*ch + 0x248) = (MCHBAR32(0x400*ch + 0x248) & ~0x706033) | 0x406033;
+ MCHBAR32(0x400*ch + 0x260) = (MCHBAR32(0x400*ch + 0x260) & ~(1 << 16)) | (1 << 16);
+ MCHBAR8(0x400*ch + 0x264) = x264;
+ MCHBAR8(0x400*ch + 0x592) = (MCHBAR8(0x400*ch + 0x592) & ~0x3f) | (0x3c & x592);
+ MCHBAR8(0x400*ch + 0x593) = (MCHBAR8(0x400*ch + 0x593) & ~0x1f) | 0x1e;
+ }
+
+ for (lane = 0; lane < 8; lane++) {
+ MCHBAR8(0x561 + (lane << 2)) = MCHBAR8(0x561 + (lane << 2)) & ~(1 << 3);
+ }
+}
+
+void raminit_ddr2(sysinfo_t *s)
+{
+ u8 ch;
+ u8 r, bank;
+ u32 reg32;
+
+ // Select timings based on SPD info
+ sdram_detect_smallest_params2(s);
+
+ // Reset if required
+ checkreset_ddr2(s);
+
+ // Clear self refresh
+ MCHBAR32(0xf14) = MCHBAR32(0xf14) | 0x3;
+
+ // Clear host clk gate reg
+ MCHBAR32(0x1c) = MCHBAR32(0x1c) | 0xffffffff;
+
+ // Select DDR2
+ MCHBAR8(0x1a8) = MCHBAR8(0x1a8) & ~0x4;
+
+ // Set freq
+ MCHBAR32(0xc00) = (MCHBAR32(0xc00) & ~0x70) |
+ (s->selected_timings.mem_clock << 4) | (1 << 10);
+
+ // Overwrite freq if chipset rejects it
+ s->selected_timings.mem_clock = (MCHBAR8(0xc00) & 0x70) >> 4;
+ if (s->selected_timings.mem_clock > (s->max_fsb + 3)) {
+ die("Error: DDR is faster than FSB, halt\n");
+ }
+
+ microdelay(250000);
+
+ // Program clock crossing
+ clkcross_ddr2(s);
+ PRINTK_DEBUG("Done clk crossing\n");
+
+ // DDR2 IO
+ setioclk_ddr2(s);
+ PRINTK_DEBUG("Done I/O clk\n");
+
+ // Grant to launch
+ launch_ddr2(s);
+ PRINTK_DEBUG("Done launch\n");
+
+ // Program DDR2 timings
+ timings_ddr2(s);
+ PRINTK_DEBUG("Done timings\n");
+
+ // Program DLL
+ dll_ddr2(s);
+
+ // RCOMP
+ rcomp_ddr2(s);
+ PRINTK_DEBUG("RCOMP\n");
+
+ // ODT
+ odt_ddr2(s);
+ PRINTK_DEBUG("Done ODT\n");
+
+ // RCOMP update
+ while ((MCHBAR8(0x130) & 1) != 0 );
+ PRINTK_DEBUG("Done RCOMP update\n");
+
+ // Set defaults
+ MCHBAR32(0x260) = (MCHBAR32(0x260) & ~1) | 0xf00000;
+ MCHBAR32(0x660) = (MCHBAR32(0x660) & ~1) | 0xf00000;
+ MCHBAR32(0x208) = 0x01010101;
+ MCHBAR32(0x608) = 0x01010101;
+ MCHBAR32(0x200) = 0x00040002;
+ MCHBAR32(0x204) = 0x00080006;
+ MCHBAR32(0x600) = 0x00040002;
+ MCHBAR32(0x604) = 0x00100006;
+ MCHBAR8(0x111) = MCHBAR8(0x111) | 0x2;
+ MCHBAR32(0x104) = 0;
+ MCHBAR16(0x102) = 0x400;
+ MCHBAR8(0x100) = (2 << 5) | (3 << 3);
+ MCHBAR16(0x10e) = 0;
+ MCHBAR32(0x108) = 0;
+ pci_write_config16(PCI_DEV(0,0,0), 0xb0, 0x4000);
+ pci_write_config16(PCI_DEV(0,0,0), 0xa0, 0x0010);
+ pci_write_config16(PCI_DEV(0,0,0), 0xa2, 0x0400);
+ pci_write_config32(PCI_DEV(0,0,0), 0xa4, 0x40000000);
+ pci_write_config32(PCI_DEV(0,0,0), 0xa8, 0x40000000);
+ pci_write_config32(PCI_DEV(0,0,0), 0xac, 0x40000000);
+
+ // IOBUFACT
+ if (CHANNEL_IS_POPULATED(s->dimms, 0)) {
+ MCHBAR8(0x5dd) = (MCHBAR8(0x5dd) & ~0x3f) | 0x3f;
+ MCHBAR8(0x5d8) = MCHBAR8(0x5d8) | 0x7;
+ }
+ if (CHANNEL_IS_POPULATED(s->dimms, 1)) {
+ if (pci_read_config8(PCI_DEV(0,0,0), 0x8) < 2) {
+ MCHBAR8(0x5dd) = (MCHBAR8(0x5dd) & ~0x3f) | 0x3f;
+ MCHBAR8(0x5d8) = MCHBAR8(0x5d8) | 1;
+ }
+ MCHBAR8(0x9dd) = (MCHBAR8(0x9dd) & ~0x3f) | 0x3f;
+ MCHBAR8(0x9d8) = MCHBAR8(0x9d8) | 0x7;
+ }
+
+
+ // Pre jedec
+ MCHBAR8(0x40) = MCHBAR8(0x40) | 0x2;
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, ch) {
+ MCHBAR32(0x400*ch + 0x260) = MCHBAR32(0x400*ch + 0x260) | (1 << 27);
+ }
+ MCHBAR16(0x212) = (MCHBAR16(0x212) & ~0xf000) | 0xf000;
+ MCHBAR16(0x212) = (MCHBAR16(0x212) & ~0xf00) | 0xf00;
+ PRINTK_DEBUG("Done pre-jedec\n");
+
+ // JEDEC reset
+ jedec_ddr2(s);
+
+ PRINTK_DEBUG("Done jedec steps\n");
+
+ // After JEDEC reset
+ MCHBAR8(0x40) = MCHBAR8(0x40) & ~0x2;
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, ch) {
+ if (s->selected_timings.mem_clock == MEM_CLOCK_667MHz) {
+ reg32 = (2 << 18) | (3 << 13) | (5 << 8);
+ } else {
+ reg32 = (2 << 18) | (3 << 13) | (4 << 8);
+ }
+ MCHBAR32(0x400*ch + 0x274) = (MCHBAR32(0x400*ch + 0x274) & ~0xfff00) | reg32;
+ MCHBAR8(0x400*ch + 0x274) = MCHBAR8(0x400*ch + 0x274) & ~0x80;
+ MCHBAR8(0x400*ch + 0x26c) = MCHBAR8(0x400*ch + 0x26c) | 1;
+ MCHBAR32(0x400*ch + 0x278) = 0x88141881;
+ MCHBAR16(0x400*ch + 0x27c) = 0x41;
+ MCHBAR8(0x400*ch + 0x292) = 0xf2;
+ MCHBAR8(0x400*ch + 0x271) = (MCHBAR8(0x400*ch + 0x271) & ~0xe) | 0xe;
+ }
+ MCHBAR8(0x2c4) = MCHBAR8(0x2c4) | 0x8;
+ MCHBAR8(0x2c3) = MCHBAR8(0x2c3) | 0x40;
+ MCHBAR8(0x2c4) = MCHBAR8(0x2c4) | 0x4;
+
+ PRINTK_DEBUG("Done post-jedec\n");
+
+ // Set DDR2 init complete
+ FOR_EACH_POPULATED_CHANNEL(s->dimms, ch) {
+ MCHBAR32(0x400*ch + 0x268) = (MCHBAR32(0x400*ch + 0x268) & ~0xc0000000) | 0xc0000000;
+ }
+
+ // Receive enable
+ rcven_ddr2(s);
+ PRINTK_DEBUG("Done rcven\n");
+
+ // Finish rcven
+ FOR_EACH_CHANNEL(ch) {
+ MCHBAR8(0x400*ch + 0x5d8) = MCHBAR8(0x400*ch + 0x5d8) & ~0xe;
+ MCHBAR8(0x400*ch + 0x5d8) = MCHBAR8(0x400*ch + 0x5d8) | 0x2;
+ MCHBAR8(0x400*ch + 0x5d8) = MCHBAR8(0x400*ch + 0x5d8) | 0x4;
+ MCHBAR8(0x400*ch + 0x5d8) = MCHBAR8(0x400*ch + 0x5d8) | 0x8;
+ }
+ MCHBAR8(0x5dc) = MCHBAR8(0x5dc) | 0x80;
+ MCHBAR8(0x5dc) = MCHBAR8(0x5dc) & ~0x80;
+ MCHBAR8(0x5dc) = MCHBAR8(0x5dc) | 0x80;
+
+ // Dummy writes / reads
+ volatile u32 data;
+ FOR_EACH_POPULATED_RANK(s->dimms, ch, r) {
+ for (bank = 0; bank < 4; bank++) {
+ reg32 = (ch << 29) | (r*0x8000000) | (bank << 12);
+ write32((u32 *)reg32, 0xffffffff);
+ data = read32((u32 *)reg32);
+ PRINTK_DEBUG("Wrote ones, Read: [0x%08x]=0x%08x\n", reg32, data);
+ write32((u32 *)reg32, 0x00000000);
+ data = read32((u32 *)reg32);
+ PRINTK_DEBUG("Wrote zeros, Read: [0x%08x]=0x%08x\n", reg32, data);
+ }
+ }
+ PRINTK_DEBUG("Done dummy reads\n");
+
+ // XXX tRD
+
+ // XXX Write training
+
+ // XXX Read training
+
+ // DRADRB
+ dradrb_ddr2(s);
+ PRINTK_DEBUG("Done DRADRB\n");
+
+ // Memory map
+ mmap_ddr2(s);
+ PRINTK_DEBUG("Done memory map\n");
+
+ // Enhanced mode
+ enhanced_ddr2(s);
+ PRINTK_DEBUG("Done enhanced mode\n");
+
+ // Periodic RCOMP
+ MCHBAR16(0x160) = (MCHBAR16(0x160) & ~0xfff) | 0x999;
+ MCHBAR16(0x1b4) = MCHBAR16(0x1b4) | 0x3000;
+ MCHBAR8(0x130) = MCHBAR8(0x130) | 0x82;
+ PRINTK_DEBUG("Done PRCOMP\n");
+
+/*
+ MCHBAR8(0x5d8) = MCHBAR8(0x5d8) & ~1;
+ MCHBAR8(0x9d8) = MCHBAR8(0x9d8) & ~1;
+ MCHBAR8(0x188) = MCHBAR8(0x188) & ~1;
+*/
+
+ // Power settings
+ power_ddr2(s);
+ PRINTK_DEBUG("Done power settings\n");
+
+/*
+ MCHBAR32(0x174) = MCHBAR32(0x174) & ~0x30000;
+ MCHBAR16(0x1b4) = MCHBAR16(0x1b4) | 0x3000;
+ MCHBAR8(0x130) = MCHBAR8(0x130) | 0x2;
+
+ if (s->channel_capacity[0]) {
+ MCHBAR32(0x260) = MCHBAR32(0x260) | (1 << 27);
+ MCHBAR32(0x174) = MCHBAR32(0x174) & ~0x30000;
+ MCHBAR32(0x268) = MCHBAR32(0x268) | 0x80000000;
+ MCHBAR32(0x268) = MCHBAR32(0x268) | 0x40000000;
+
+ }
+ if (s->channel_capacity[1]) {
+ MCHBAR32(0x660) = MCHBAR32(0x660) | (1 << 27);
+ MCHBAR32(0x174) = MCHBAR32(0x174) & ~0x30000;
+ MCHBAR32(0x668) = MCHBAR32(0x668) | 0x80000000;
+ MCHBAR32(0x668) = MCHBAR32(0x668) | 0x40000000;
+ }
+
+ MCHBAR8(0x5dc) = MCHBAR8(0x5dc) | 0x80;
+ MCHBAR8(0x5dc) = MCHBAR8(0x5dc) & ~0x80;
+ MCHBAR8(0x5dc) = MCHBAR8(0x5dc) | 0x80;
+
+ // ME related
+ //MCHBAR32(0xa30) = MCHBAR32(0xa30) | (1 << 26);
+*/
+ PRINTK_DEBUG("Done ddr2\n");
+}
diff --git a/src/northbridge/intel/x4x/x4x.h b/src/northbridge/intel/x4x/x4x.h
index 99347fa..91c4916 100644
--- a/src/northbridge/intel/x4x/x4x.h
+++ b/src/northbridge/intel/x4x/x4x.h
@@ -29,25 +29,11 @@
#include <stdint.h>
typedef enum {
- FSB_CLOCK_1067MHz = 0,
- FSB_CLOCK_800MHz = 1,
- FSB_CLOCK_667MHz = 2,
+ FSB_CLOCK_800MHz = 0,
+ FSB_CLOCK_1066MHz = 1,
+ FSB_CLOCK_1333MHz = 2,
} fsb_clock_t;
-typedef enum { /* Steppings below B1 were pre-production,
- conversion stepping A1 is... ?
- We'll support B1, B2, B3, and conversion stepping A1. */
- STEPPING_A0 = 0,
- STEPPING_A1 = 1,
- STEPPING_A2 = 2,
- STEPPING_A3 = 3,
- STEPPING_B0 = 4,
- STEPPING_B1 = 5,
- STEPPING_B2 = 6,
- STEPPING_B3 = 7,
- STEPPING_CONVERSION_A1 = 9,
-} stepping_t;
-
typedef enum {
GMCH_GM45 = 0,
GMCH_GM47,
@@ -62,16 +48,15 @@ typedef enum {
} gmch_gfx_t;
typedef enum {
- MEM_CLOCK_533MHz = 0,
- MEM_CLOCK_400MHz = 1,
- MEM_CLOCK_333MHz = 2,
- MEM_CLOCK_1067MT = 0,
- MEM_CLOCK_800MT = 1,
- MEM_CLOCK_667MT = 2,
+ MEM_CLOCK_400MHz = 0,
+ MEM_CLOCK_533MHz = 1,
+ MEM_CLOCK_667MHz = 2,
+ MEM_CLOCK_800MHz = 3,
+ MEM_CLOCK_1066MHz = 4,
+ MEM_CLOCK_1333MHz = 5,
} mem_clock_t;
typedef enum {
- DDR1 = 1,
DDR2 = 2,
DDR3 = 3,
} ddr_t;
@@ -107,34 +92,42 @@ typedef struct {
unsigned int tRAS;
unsigned int tRP;
unsigned int tRCD;
- unsigned int tRFC;
unsigned int tWR;
- unsigned int tRD;
+ unsigned int tRFC;
+ unsigned int tWTR;
unsigned int tRRD;
- unsigned int tFAW;
- unsigned int tWL;
+ unsigned int tRTP;
} timings_t;
typedef struct {
unsigned int card_type; /* 0x0: unpopulated,
0xa - 0xf: raw card type A - F */
- chip_width_t chip_width;
+ chip_width_t width;
chip_capacity_t chip_capacity;
unsigned int page_size; /* of whole DIMM in Bytes (4096 or 8192) */
+ unsigned int sides;
unsigned int banks;
unsigned int ranks;
+ unsigned int rows;
+ unsigned int cols;
+ unsigned int cas_latencies;
+ unsigned int tAAmin;
+ unsigned int tCKmin;
+ unsigned int tWR;
+ unsigned int tRP;
+ unsigned int tRCD;
+ unsigned int tRAS;
unsigned int rank_capacity_mb; /* per rank in Mega Bytes */
+ u8 spd_data[256];
} dimminfo_t;
-/* The setup is one DIMM per channel, so there's no need to find a
- common timing setup between multiple chips (but chip and controller
- still need to be coordinated */
+/* The setup is up to two DIMMs per channel */
typedef struct {
- stepping_t stepping;
int txt_enabled;
int cores;
gmch_gfx_t gfx_type;
- int gs45_low_power_mode; /* low power mode of GMCH_GS45 */
+ int boot_path;
+ int gs45_low_power_mode;
int max_ddr2_mhz;
int max_ddr3_mt;
fsb_clock_t max_fsb;
@@ -144,23 +137,85 @@ typedef struct {
int enable_peg;
u16 ggc;
+ int dimm_config[2];
+ int dimms_per_ch;
int spd_type;
+ int channel_capacity[2];
timings_t selected_timings;
- dimminfo_t dimms[2];
+ dimminfo_t dimms[4];
u8 spd_map[4];
} sysinfo_t;
+
+typedef enum {
+ CLKSET0 = 0,
+ CTRL0,
+ CLKSET1,
+ CMD,
+ CTRL1,
+ CTRL2,
+ CTRL3,
+ DQS1,
+ DQS2,
+ DQS3,
+ DQS4,
+ DQS5,
+ DQS6,
+ DQS7,
+ DQS8,
+ DQ1,
+ DQ2,
+ DQ3,
+ DQ4,
+ DQ5,
+ DQ6,
+ DQ7,
+ DQ8
+} DDR2_Signals;
+
+#define NOP_CMD 0x2
+#define PRECHARGE_CMD 0x4
+#define MRS_CMD 0x6
+#define EMRS_CMD 0x8
+#define EMRS1_CMD (EMRS_CMD | 0x10)
+#define EMRS2_CMD (EMRS_CMD | 0x20)
+#define EMRS3_CMD (EMRS_CMD | 0x30)
+#define ZQCAL_CMD 0xa
+#define CBR_CMD 0xc
+#define NORMALOP_CMD 0xe
+
#define TOTAL_CHANNELS 2
-#define CHANNEL_IS_POPULATED(dimms, idx) (dimms[idx].card_type != 0)
-#define CHANNEL_IS_CARDF(dimms, idx) (dimms[idx].card_type == 0xf)
-#define IF_CHANNEL_POPULATED(dimms, idx) if (dimms[idx].card_type != 0)
+#define TOTAL_DIMMS 4
+
+#define DIMM_IS_POPULATED(dimms, idx) (dimms[idx].card_type != 0)
+#define IF_DIMM_POPULATED(dimms, idx) if (dimms[idx].card_type != 0)
+#define ONLY_DIMMA_IS_POPULATED(dimms, ch) ( \
+ (DIMM_IS_POPULATED(dimms, (ch == 0) ? 0 : 2) && \
+ !DIMM_IS_POPULATED(dimms, (ch == 0) ? 1 : 3)))
+#define ONLY_DIMMB_IS_POPULATED(dimms, ch) ( \
+ (DIMM_IS_POPULATED(dimms, (ch == 0) ? 1 : 3) && \
+ !DIMM_IS_POPULATED(dimms, (ch == 0) ? 0 : 2)))
+#define BOTH_DIMMS_ARE_POPULATED(dimms, ch) ( \
+ (DIMM_IS_POPULATED(dimms, (ch == 0) ? 0 : 2) && \
+ (DIMM_IS_POPULATED(dimms, (ch == 0) ? 1 : 3))))
+#define FOR_EACH_DIMM(idx) \
+ for (idx = 0; idx < TOTAL_DIMMS; ++idx)
+#define FOR_EACH_POPULATED_DIMM(dimms, idx) \
+ FOR_EACH_DIMM(idx) IF_DIMM_POPULATED(dimms, idx)
+#define CHANNEL_IS_POPULATED(dimms, idx) ((dimms[idx<<1].card_type != 0) || (dimms[(idx<<1) + 1].card_type != 0))
+#define CHANNEL_IS_CARDF(dimms, idx) ((dimms[idx<<1].card_type == 0xf) || (dimms[(idx<<1) + 1].card_type == 0xf))
+#define IF_CHANNEL_POPULATED(dimms, idx) if ((dimms[idx<<1].card_type != 0) || (dimms[(idx<<1) + 1].card_type != 0))
#define FOR_EACH_CHANNEL(idx) \
for (idx = 0; idx < TOTAL_CHANNELS; ++idx)
#define FOR_EACH_POPULATED_CHANNEL(dimms, idx) \
FOR_EACH_CHANNEL(idx) IF_CHANNEL_POPULATED(dimms, idx)
-#define RANKS_PER_CHANNEL 4 /* Only two may be populated */
+#define RANKS_PER_CHANNEL 4
+#define RANK_IS_POPULATED(dimms, ch, r) \
+ ((dimms[ch<<1].card_type && ((r) < dimms[ch<<1].ranks)) || \
+ (dimms[(ch<<1) + 1].card_type && ((r) >= 2) && ((r) < (dimms[(ch<<1) + 1].ranks + 2))))
#define IF_RANK_POPULATED(dimms, ch, r) \
- if (dimms[ch].card_type && ((r) < dimms[ch].ranks))
+ if ((dimms[ch<<1].card_type && ((r) < dimms[ch<<1].ranks)) || \
+ (dimms[(ch<<1) + 1].card_type && ((r) >= 2) && ((r) < (dimms[(ch<<1) + 1].ranks + 2))))
#define FOR_EACH_RANK_IN_CHANNEL(r) \
for (r = 0; r < RANKS_PER_CHANNEL; ++r)
#define FOR_EACH_POPULATED_RANK_IN_CHANNEL(dimms, ch, r) \
@@ -196,7 +251,7 @@ enum {
#define DEFAULT_DMIBAR 0xfed18000
#endif
#define DEFAULT_EPBAR 0xfed19000
-#define DEFAULT_HECIBAR ((u8 *)0xfed10000)
+#define DEFAULT_HECIBAR 0xfed10000
/* 4 KB per PCIe device */
#define DEFAULT_PCIEXBAR CONFIG_MMCONF_BASE_ADDRESS
@@ -429,6 +484,8 @@ u32 decode_igd_gtt_size(u32 gsm);
void init_igd(const sysinfo_t *const);
void igd_compute_ggc(sysinfo_t *const sysinfo);
int raminit_read_vco_index(void);
+void sdram_initialize(int boot_path, const u8 *spd_map);
+void raminit_ddr2(sysinfo_t *);
#if ENV_RAMSTAGE
More information about the coreboot-gerrit
mailing list