diff options
Diffstat (limited to 'src/northbridge/intel/nehalem/raminit.c')
-rw-r--r-- | src/northbridge/intel/nehalem/raminit.c | 4774 |
1 files changed, 0 insertions, 4774 deletions
diff --git a/src/northbridge/intel/nehalem/raminit.c b/src/northbridge/intel/nehalem/raminit.c deleted file mode 100644 index de02882483..0000000000 --- a/src/northbridge/intel/nehalem/raminit.c +++ /dev/null @@ -1,4774 +0,0 @@ -/* - * This file is part of the coreboot project. - * - * Copyright (C) 2013 Vladimir Serbinenko. - * - * This program is free software; you can redistribute it and/or modify - * it under the terms of the GNU General Public License as published by - * the Free Software Foundation; either version 2 of the License, or - * (at your option) any later version. - * - * This program is distributed in the hope that it will be useful, - * but WITHOUT ANY WARRANTY; without even the implied warranty of - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - * GNU General Public License for more details. - */ - -#include <console/console.h> -#include <commonlib/helpers.h> -#include <string.h> -#include <arch/io.h> -#include <device/mmio.h> -#include <device/pci_ops.h> -#include <cpu/x86/msr.h> -#include <cpu/x86/cache.h> -#include <cbmem.h> -#include <cf9_reset.h> -#include <ip_checksum.h> -#include <option.h> -#include <device/pci_def.h> -#include <device/device.h> -#include <halt.h> -#include <spd.h> -#include <timestamp.h> -#include <cpu/x86/mtrr.h> -#include <cpu/intel/speedstep.h> -#include <cpu/intel/turbo.h> -#include <mrc_cache.h> -#include <southbridge/intel/ibexpeak/me.h> -#include <southbridge/intel/common/pmbase.h> -#include <delay.h> -#include <types.h> - -#include "chip.h" -#include "nehalem.h" -#include "raminit.h" -#include "raminit_tables.h" - -#define NORTHBRIDGE PCI_DEV(0, 0, 0) -#define SOUTHBRIDGE PCI_DEV(0, 0x1f, 0) -#define GMA PCI_DEV (0, 0x2, 0x0) -#define HECIDEV PCI_DEV(0, 0x16, 0) -#define HECIBAR 0x10 - -#define FOR_ALL_RANKS \ - for (channel = 0; channel < NUM_CHANNELS; channel++) \ - for (slot = 0; slot < NUM_SLOTS; slot++) \ - for (rank = 0; rank < NUM_RANKS; rank++) - -#define FOR_POPULATED_RANKS \ - for (channel = 0; channel < NUM_CHANNELS; channel++) \ - for (slot = 0; slot < NUM_SLOTS; slot++) \ - for (rank = 0; rank < NUM_RANKS; rank++) \ - if (info->populated_ranks[channel][slot][rank]) - -#define FOR_POPULATED_RANKS_BACKWARDS \ - for (channel = NUM_CHANNELS - 1; channel >= 0; channel--) \ - for (slot = 0; slot < NUM_SLOTS; slot++) \ - for (rank = 0; rank < NUM_RANKS; rank++) \ - if (info->populated_ranks[channel][slot][rank]) - -/* [REG_178][CHANNEL][2 * SLOT + RANK][LANE] */ -typedef struct { - u8 smallest; - u8 largest; -} timing_bounds_t[2][2][2][9]; - -#define MRC_CACHE_VERSION 1 - -struct ram_training { - /* [TM][CHANNEL][SLOT][RANK][LANE] */ - u16 lane_timings[4][2][2][2][9]; - u16 reg_178; - u16 reg_10b; - - u8 reg178_center; - u8 reg178_smallest; - u8 reg178_largest; - timing_bounds_t timing_bounds[2]; - u16 timing_offset[2][2][2][9]; - u16 timing2_offset[2][2][2][9]; - u16 timing2_bounds[2][2][2][9][2]; - u8 reg274265[2][3]; /* [CHANNEL][REGISTER] */ - u8 reg2ca9_bit0; - u32 reg_6dc; - u32 reg_6e8; -}; - -#include <lib.h> /* Prototypes */ - -typedef struct _u128 { - u64 lo; - u64 hi; -} u128; - -static void read128(u32 addr, u64 * out) -{ - u128 ret; - u128 stor; - asm volatile ("movdqu %%xmm0, %0\n" - "movdqa (%2), %%xmm0\n" - "movdqu %%xmm0, %1\n" - "movdqu %0, %%xmm0":"+m" (stor), "=m"(ret):"r"(addr)); - out[0] = ret.lo; - out[1] = ret.hi; -} - -/* OK */ -static void write_1d0(u32 val, u16 addr, int bits, int flag) -{ - MCHBAR32(0x1d0) = 0; - while (MCHBAR32(0x1d0) & 0x800000) - ; - MCHBAR32(0x1d4) = - (val & ((1 << bits) - 1)) | (2 << bits) | (flag << bits); - MCHBAR32(0x1d0) = 0x40000000 | addr; - while (MCHBAR32(0x1d0) & 0x800000) - ; -} - -/* OK */ -static u16 read_1d0(u16 addr, int split) -{ - u32 val; - MCHBAR32(0x1d0) = 0; - while (MCHBAR32(0x1d0) & 0x800000) - ; - MCHBAR32(0x1d0) = - 0x80000000 | (((MCHBAR8(0x246) >> 2) & 3) + 0x361 - addr); - while (MCHBAR32(0x1d0) & 0x800000) - ; - val = MCHBAR32(0x1d8); - write_1d0(0, 0x33d, 0, 0); - write_1d0(0, 0x33d, 0, 0); - val &= ((1 << split) - 1); - // printk (BIOS_ERR, "R1D0C [%x] => %x\n", addr, val); - return val; -} - -static void write32p(uintptr_t addr, uint32_t val) -{ - write32((void *)addr, val); -} - -static uint32_t read32p(uintptr_t addr) -{ - return read32((void *)addr); -} - -static void sfence(void) -{ - asm volatile ("sfence"); -} - -static inline u16 get_lane_offset(int slot, int rank, int lane) -{ - return 0x124 * lane + ((lane & 4) ? 0x23e : 0) + 11 * rank + 22 * slot - - 0x452 * (lane == 8); -} - -static inline u16 get_timing_register_addr(int lane, int tm, int slot, int rank) -{ - const u16 offs[] = { 0x1d, 0xa8, 0xe6, 0x5c }; - return get_lane_offset(slot, rank, lane) + offs[(tm + 3) % 4]; -} - -static u32 gav_real(int line, u32 in) -{ - // printk (BIOS_DEBUG, "%d: GAV: %x\n", line, in); - return in; -} - -#define gav(x) gav_real (__LINE__, (x)) - -struct raminfo { - u16 clock_speed_index; /* clock_speed (REAL, not DDR) / 133.(3) - 3 */ - u16 fsb_frequency; /* in 1.(1)/2 MHz. */ - u8 is_x16_module[2][2]; /* [CHANNEL][SLOT] */ - u8 density[2][2]; /* [CHANNEL][SLOT] */ - u8 populated_ranks[2][2][2]; /* [CHANNEL][SLOT][RANK] */ - int rank_start[2][2][2]; - u8 cas_latency; - u8 board_lane_delay[9]; - u8 use_ecc; - u8 revision; - u8 max_supported_clock_speed_index; - u8 uma_enabled; - u8 spd[2][2][151]; /* [CHANNEL][SLOT][BYTE] */ - u8 silicon_revision; - u8 populated_ranks_mask[2]; - u8 max_slots_used_in_channel; - u8 mode4030[2]; - u16 avg4044[2]; - u16 max4048[2]; - unsigned int total_memory_mb; - unsigned int interleaved_part_mb; - unsigned int non_interleaved_part_mb; - - u32 heci_bar; - u64 heci_uma_addr; - unsigned int memory_reserved_for_heci_mb; - - struct ram_training training; - u32 last_500_command[2]; - - u32 delay46_ps[2]; - u32 delay54_ps[2]; - u8 revision_flag_1; - u8 some_delay_1_cycle_floor; - u8 some_delay_2_halfcycles_ceil; - u8 some_delay_3_ps_rounded; - - const struct ram_training *cached_training; -}; - -/* Global allocation of timings_car */ -timing_bounds_t timings_car[64]; - -static void -write_500(struct raminfo *info, int channel, u32 val, u16 addr, int bits, - int flag); - -/* OK */ -static u16 -read_500(struct raminfo *info, int channel, u16 addr, int split) -{ - u32 val; - info->last_500_command[channel] = 0x80000000; - MCHBAR32(0x500 + (channel << 10)) = 0; - while (MCHBAR32(0x500 + (channel << 10)) & 0x800000) - ; - MCHBAR32(0x500 + (channel << 10)) = - 0x80000000 | (((MCHBAR8(0x246 + (channel << 10)) >> 2) & 3) - + 0xb88 - addr); - while (MCHBAR32(0x500 + (channel << 10)) & 0x800000) - ; - val = MCHBAR32(0x508 + (channel << 10)); - return val & ((1 << split) - 1); -} - -/* OK */ -static void -write_500(struct raminfo *info, int channel, u32 val, u16 addr, int bits, - int flag) -{ - if (info->last_500_command[channel] == 0x80000000) { - info->last_500_command[channel] = 0x40000000; - write_500(info, channel, 0, 0xb61, 0, 0); - } - MCHBAR32(0x500 + (channel << 10)) = 0; - while (MCHBAR32(0x500 + (channel << 10)) & 0x800000) - ; - MCHBAR32(0x504 + (channel << 10)) = - (val & ((1 << bits) - 1)) | (2 << bits) | (flag << bits); - MCHBAR32(0x500 + (channel << 10)) = 0x40000000 | addr; - while (MCHBAR32(0x500 + (channel << 10)) & 0x800000) - ; -} - -static int rw_test(int rank) -{ - const u32 mask = 0xf00fc33c; - int ok = 0xff; - int i; - for (i = 0; i < 64; i++) - write32p((rank << 28) | (i << 2), 0); - sfence(); - for (i = 0; i < 64; i++) - gav(read32p((rank << 28) | (i << 2))); - sfence(); - for (i = 0; i < 32; i++) { - u32 pat = (((mask >> i) & 1) ? 0xffffffff : 0); - write32p((rank << 28) | (i << 3), pat); - write32p((rank << 28) | (i << 3) | 4, pat); - } - sfence(); - for (i = 0; i < 32; i++) { - u8 pat = (((mask >> i) & 1) ? 0xff : 0); - int j; - u32 val; - gav(val = read32p((rank << 28) | (i << 3))); - for (j = 0; j < 4; j++) - if (((val >> (j * 8)) & 0xff) != pat) - ok &= ~(1 << j); - gav(val = read32p((rank << 28) | (i << 3) | 4)); - for (j = 0; j < 4; j++) - if (((val >> (j * 8)) & 0xff) != pat) - ok &= ~(16 << j); - } - sfence(); - for (i = 0; i < 64; i++) - write32p((rank << 28) | (i << 2), 0); - sfence(); - for (i = 0; i < 64; i++) - gav(read32p((rank << 28) | (i << 2))); - - return ok; -} - -static void -program_timings(struct raminfo *info, u16 base, int channel, int slot, int rank) -{ - int lane; - for (lane = 0; lane < 8; lane++) { - write_500(info, channel, - base + - info->training. - lane_timings[2][channel][slot][rank][lane], - get_timing_register_addr(lane, 2, slot, rank), 9, 0); - write_500(info, channel, - base + - info->training. - lane_timings[3][channel][slot][rank][lane], - get_timing_register_addr(lane, 3, slot, rank), 9, 0); - } -} - -static void write_26c(int channel, u16 si) -{ - MCHBAR32(0x26c + (channel << 10)) = 0x03243f35; - MCHBAR32(0x268 + (channel << 10)) = 0xcfc00000 | (si << 9); - MCHBAR16(0x2b9 + (channel << 10)) = si; -} - -static u32 get_580(int channel, u8 addr) -{ - u32 ret; - gav(read_1d0(0x142, 3)); - MCHBAR8(0x5ff) = 0x0; - MCHBAR8(0x5ff) = 0x80; - MCHBAR32(0x580 + (channel << 10)) = 0x8493c012 | addr; - MCHBAR8_OR(0x580 + (channel << 10), 1); - while (!((ret = MCHBAR32(0x580 + (channel << 10))) & 0x10000)) - ; - MCHBAR8_AND(0x580 + (channel << 10), ~1); - return ret; -} - -const int cached_config = 0; - -#define NUM_CHANNELS 2 -#define NUM_SLOTS 2 -#define NUM_RANKS 2 -#define RANK_SHIFT 28 -#define CHANNEL_SHIFT 10 - -static void seq9(struct raminfo *info, int channel, int slot, int rank) -{ - int i, lane; - - for (i = 0; i < 2; i++) - for (lane = 0; lane < 8; lane++) - write_500(info, channel, - info->training.lane_timings[i + - 1][channel][slot] - [rank][lane], get_timing_register_addr(lane, - i + 1, - slot, - rank), - 9, 0); - - write_1d0(1, 0x103, 6, 1); - for (lane = 0; lane < 8; lane++) - write_500(info, channel, - info->training. - lane_timings[0][channel][slot][rank][lane], - get_timing_register_addr(lane, 0, slot, rank), 9, 0); - - for (i = 0; i < 2; i++) { - for (lane = 0; lane < 8; lane++) - write_500(info, channel, - info->training.lane_timings[i + - 1][channel][slot] - [rank][lane], get_timing_register_addr(lane, - i + 1, - slot, - rank), - 9, 0); - gav(get_580(channel, ((i + 1) << 2) | (rank << 5))); - } - - gav(read_1d0(0x142, 3)); // = 0x10408118 - MCHBAR8(0x5ff) = 0x0; - MCHBAR8(0x5ff) = 0x80; - write_1d0(0x2, 0x142, 3, 1); - for (lane = 0; lane < 8; lane++) { - // printk (BIOS_ERR, "before: %x\n", info->training.lane_timings[2][channel][slot][rank][lane]); - info->training.lane_timings[2][channel][slot][rank][lane] = - read_500(info, channel, - get_timing_register_addr(lane, 2, slot, rank), 9); - //printk (BIOS_ERR, "after: %x\n", info->training.lane_timings[2][channel][slot][rank][lane]); - info->training.lane_timings[3][channel][slot][rank][lane] = - info->training.lane_timings[2][channel][slot][rank][lane] + - 0x20; - } -} - -static int count_ranks_in_channel(struct raminfo *info, int channel) -{ - int slot, rank; - int res = 0; - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_SLOTS; rank++) - res += info->populated_ranks[channel][slot][rank]; - return res; -} - -static void -config_rank(struct raminfo *info, int s3resume, int channel, int slot, int rank) -{ - int add; - - write_1d0(0, 0x178, 7, 1); - seq9(info, channel, slot, rank); - program_timings(info, 0x80, channel, slot, rank); - - if (channel == 0) - add = count_ranks_in_channel(info, 1); - else - add = 0; - if (!s3resume) - gav(rw_test(rank + add)); - program_timings(info, 0x00, channel, slot, rank); - if (!s3resume) - gav(rw_test(rank + add)); - if (!s3resume) - gav(rw_test(rank + add)); - write_1d0(0, 0x142, 3, 1); - write_1d0(0, 0x103, 6, 1); - - gav(get_580(channel, 0xc | (rank << 5))); - gav(read_1d0(0x142, 3)); - - MCHBAR8(0x5ff) = 0x0; - MCHBAR8(0x5ff) = 0x80; -} - -static void set_4cf(struct raminfo *info, int channel, u8 val) -{ - gav(read_500(info, channel, 0x4cf, 4)); // = 0xc2300cf9 - write_500(info, channel, val, 0x4cf, 4, 1); - gav(read_500(info, channel, 0x659, 4)); // = 0x80300839 - write_500(info, channel, val, 0x659, 4, 1); - gav(read_500(info, channel, 0x697, 4)); // = 0x80300839 - write_500(info, channel, val, 0x697, 4, 1); -} - -static void set_334(int zero) -{ - int j, k, channel; - const u32 val3[] = { 0x2a2b2a2b, 0x26272627, 0x2e2f2e2f, 0x2a2b }; - u32 vd8[2][16]; - - for (channel = 0; channel < NUM_CHANNELS; channel++) { - for (j = 0; j < 4; j++) { - u32 a = (j == 1) ? 0x29292929 : 0x31313131; - u32 lmask = (j == 3) ? 0xffff : 0xffffffff; - u16 c; - if ((j == 0 || j == 3) && zero) - c = 0; - else if (j == 3) - c = 0x5f; - else - c = 0x5f5f; - - for (k = 0; k < 2; k++) { - MCHBAR32(0x138 + 8 * k) = - (channel << 26) | (j << 24); - gav(vd8[1][(channel << 3) | (j << 1) | k] = - MCHBAR32(0x138 + 8 * k)); - gav(vd8[0][(channel << 3) | (j << 1) | k] = - MCHBAR32(0x13c + 8 * k)); - } - - MCHBAR32(0x334 + (channel << 10) + (j * 0x44)) = - zero ? 0 : val3[j]; - MCHBAR32(0x32c + (channel << 10) + (j * 0x44)) = - zero ? 0 : (0x18191819 & lmask); - MCHBAR16(0x34a + (channel << 10) + (j * 0x44)) = c; - MCHBAR32(0x33c + (channel << 10) + (j * 0x44)) = - zero ? 0 : (a & lmask); - MCHBAR32(0x344 + (channel << 10) + (j * 0x44)) = - zero ? 0 : (a & lmask); - } - } - - MCHBAR32_OR(0x130, 1); - while (MCHBAR8(0x130) & 1) - ; -} - -static void rmw_1d0(u16 addr, u32 and, u32 or, int split, int flag) -{ - u32 v; - v = read_1d0(addr, split); - write_1d0((v & and) | or, addr, split, flag); -} - -static int find_highest_bit_set(u16 val) -{ - int i; - for (i = 15; i >= 0; i--) - if (val & (1 << i)) - return i; - return -1; -} - -static int find_lowest_bit_set32(u32 val) -{ - int i; - for (i = 0; i < 32; i++) - if (val & (1 << i)) - return i; - return -1; -} - -enum { - DEVICE_TYPE = 2, - MODULE_TYPE = 3, - DENSITY = 4, - RANKS_AND_DQ = 7, - MEMORY_BUS_WIDTH = 8, - TIMEBASE_DIVIDEND = 10, - TIMEBASE_DIVISOR = 11, - CYCLETIME = 12, - - CAS_LATENCIES_LSB = 14, - CAS_LATENCIES_MSB = 15, - CAS_LATENCY_TIME = 16, - THERMAL_AND_REFRESH = 31, - REFERENCE_RAW_CARD_USED = 62, - RANK1_ADDRESS_MAPPING = 63 -}; - -static void calculate_timings(struct raminfo *info) -{ - unsigned int cycletime; - unsigned int cas_latency_time; - unsigned int supported_cas_latencies; - unsigned int channel, slot; - unsigned int clock_speed_index; - unsigned int min_cas_latency; - unsigned int cas_latency; - unsigned int max_clock_index; - - /* Find common CAS latency */ - supported_cas_latencies = 0x3fe; - for (channel = 0; channel < NUM_CHANNELS; channel++) - for (slot = 0; slot < NUM_SLOTS; slot++) - if (info->populated_ranks[channel][slot][0]) - supported_cas_latencies &= - 2 * - (info-> - spd[channel][slot][CAS_LATENCIES_LSB] | - (info-> - spd[channel][slot][CAS_LATENCIES_MSB] << - 8)); - - max_clock_index = MIN(3, info->max_supported_clock_speed_index); - - cycletime = min_cycletime[max_clock_index]; - cas_latency_time = min_cas_latency_time[max_clock_index]; - - for (channel = 0; channel < NUM_CHANNELS; channel++) - for (slot = 0; slot < NUM_SLOTS; slot++) - if (info->populated_ranks[channel][slot][0]) { - unsigned int timebase; - timebase = - 1000 * - info-> - spd[channel][slot][TIMEBASE_DIVIDEND] / - info->spd[channel][slot][TIMEBASE_DIVISOR]; - cycletime = - MAX(cycletime, - timebase * - info->spd[channel][slot][CYCLETIME]); - cas_latency_time = - MAX(cas_latency_time, - timebase * - info-> - spd[channel][slot][CAS_LATENCY_TIME]); - } - if (cycletime > min_cycletime[0]) - die("RAM init: Decoded SPD DRAM freq is slower than the controller minimum!"); - for (clock_speed_index = 0; clock_speed_index < 3; clock_speed_index++) { - if (cycletime == min_cycletime[clock_speed_index]) - break; - if (cycletime > min_cycletime[clock_speed_index]) { - clock_speed_index--; - cycletime = min_cycletime[clock_speed_index]; - break; - } - } - min_cas_latency = DIV_ROUND_UP(cas_latency_time, cycletime); - cas_latency = 0; - while (supported_cas_latencies) { - cas_latency = find_highest_bit_set(supported_cas_latencies) + 3; - if (cas_latency <= min_cas_latency) - break; - supported_cas_latencies &= - ~(1 << find_highest_bit_set(supported_cas_latencies)); - } - - if (cas_latency != min_cas_latency && clock_speed_index) - clock_speed_index--; - - if (cas_latency * min_cycletime[clock_speed_index] > 20000) - die("Couldn't configure DRAM"); - info->clock_speed_index = clock_speed_index; - info->cas_latency = cas_latency; -} - -static void program_base_timings(struct raminfo *info) -{ - unsigned int channel; - unsigned int slot, rank, lane; - unsigned int extended_silicon_revision; - int i; - - extended_silicon_revision = info->silicon_revision; - if (info->silicon_revision == 0) - for (channel = 0; channel < NUM_CHANNELS; channel++) - for (slot = 0; slot < NUM_SLOTS; slot++) - if ((info-> - spd[channel][slot][MODULE_TYPE] & 0xF) == - 3) - extended_silicon_revision = 4; - - for (channel = 0; channel < NUM_CHANNELS; channel++) { - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_SLOTS; rank++) { - int card_timing_2; - if (!info->populated_ranks[channel][slot][rank]) - continue; - - for (lane = 0; lane < 9; lane++) { - int tm_reg; - int card_timing; - - card_timing = 0; - if ((info-> - spd[channel][slot][MODULE_TYPE] & - 0xF) == 3) { - int reference_card; - reference_card = - info-> - spd[channel][slot] - [REFERENCE_RAW_CARD_USED] & - 0x1f; - if (reference_card == 3) - card_timing = - u16_ffd1188[0][lane] - [info-> - clock_speed_index]; - if (reference_card == 5) - card_timing = - u16_ffd1188[1][lane] - [info-> - clock_speed_index]; - } - - info->training. - lane_timings[0][channel][slot][rank] - [lane] = - u8_FFFD1218[info-> - clock_speed_index]; - info->training. - lane_timings[1][channel][slot][rank] - [lane] = 256; - - for (tm_reg = 2; tm_reg < 4; tm_reg++) - info->training. - lane_timings[tm_reg] - [channel][slot][rank][lane] - = - u8_FFFD1240[channel] - [extended_silicon_revision] - [lane][2 * slot + - rank][info-> - clock_speed_index] - + info->max4048[channel] - + - u8_FFFD0C78[channel] - [extended_silicon_revision] - [info-> - mode4030[channel]][slot] - [rank][info-> - clock_speed_index] - + card_timing; - for (tm_reg = 0; tm_reg < 4; tm_reg++) - write_500(info, channel, - info->training. - lane_timings[tm_reg] - [channel][slot][rank] - [lane], - get_timing_register_addr - (lane, tm_reg, slot, - rank), 9, 0); - } - - card_timing_2 = 0; - if (!(extended_silicon_revision != 4 - || (info-> - populated_ranks_mask[channel] & 5) == - 5)) { - if ((info-> - spd[channel][slot] - [REFERENCE_RAW_CARD_USED] & 0x1F) - == 3) - card_timing_2 = - u16_FFFE0EB8[0][info-> - clock_speed_index]; - if ((info-> - spd[channel][slot] - [REFERENCE_RAW_CARD_USED] & 0x1F) - == 5) - card_timing_2 = - u16_FFFE0EB8[1][info-> - clock_speed_index]; - } - - for (i = 0; i < 3; i++) - write_500(info, channel, - (card_timing_2 + - info->max4048[channel] - + - u8_FFFD0EF8[channel] - [extended_silicon_revision] - [info-> - mode4030[channel]][info-> - clock_speed_index]), - u16_fffd0c50[i][slot][rank], - 8, 1); - write_500(info, channel, - (info->max4048[channel] + - u8_FFFD0C78[channel] - [extended_silicon_revision][info-> - mode4030 - [channel]] - [slot][rank][info-> - clock_speed_index]), - u16_fffd0c70[slot][rank], 7, 1); - } - if (!info->populated_ranks_mask[channel]) - continue; - for (i = 0; i < 3; i++) - write_500(info, channel, - (info->max4048[channel] + - info->avg4044[channel] - + - u8_FFFD17E0[channel] - [extended_silicon_revision][info-> - mode4030 - [channel]][info-> - clock_speed_index]), - u16_fffd0c68[i], 8, 1); - } -} - -static unsigned int fsbcycle_ps(struct raminfo *info) -{ - return 900000 / info->fsb_frequency; -} - -/* The time of DDR transfer in ps. */ -static unsigned int halfcycle_ps(struct raminfo *info) -{ - return 3750 / (info->clock_speed_index + 3); -} - -/* The time of clock cycle in ps. */ -static unsigned int cycle_ps(struct raminfo *info) -{ - return 2 * halfcycle_ps(info); -} - -/* Frequency in 1.(1)=10/9 MHz units. */ -static unsigned int frequency_11(struct raminfo *info) -{ - return (info->clock_speed_index + 3) * 120; -} - -/* Frequency in 0.1 MHz units. */ -static unsigned int frequency_01(struct raminfo *info) -{ - return 100 * frequency_11(info) / 9; -} - -static unsigned int ps_to_halfcycles(struct raminfo *info, unsigned int ps) -{ - return (frequency_11(info) * 2) * ps / 900000; -} - -static unsigned int ns_to_cycles(struct raminfo *info, unsigned int ns) -{ - return (frequency_11(info)) * ns / 900; -} - -static void compute_derived_timings(struct raminfo *info) -{ - unsigned int channel, slot, rank; - int extended_silicon_revision; - int some_delay_1_ps; - int some_delay_2_ps; - int some_delay_2_halfcycles_ceil; - int some_delay_2_halfcycles_floor; - int some_delay_3_ps; - int some_delay_3_ps_rounded; - int some_delay_1_cycle_ceil; - int some_delay_1_cycle_floor; - - some_delay_3_ps_rounded = 0; - extended_silicon_revision = info->silicon_revision; - if (!info->silicon_revision) - for (channel = 0; channel < NUM_CHANNELS; channel++) - for (slot = 0; slot < NUM_SLOTS; slot++) - if ((info-> - spd[channel][slot][MODULE_TYPE] & 0xF) == - 3) - extended_silicon_revision = 4; - if (info->board_lane_delay[7] < 5) - info->board_lane_delay[7] = 5; - info->revision_flag_1 = 2; - if (info->silicon_revision == 2 || info->silicon_revision == 3) - info->revision_flag_1 = 0; - if (info->revision < 16) - info->revision_flag_1 = 0; - - if (info->revision < 8) - info->revision_flag_1 = 0; - if (info->revision >= 8 && (info->silicon_revision == 0 - || info->silicon_revision == 1)) - some_delay_2_ps = 735; - else - some_delay_2_ps = 750; - - if (info->revision >= 0x10 && (info->silicon_revision == 0 - || info->silicon_revision == 1)) - some_delay_1_ps = 3929; - else - some_delay_1_ps = 3490; - - some_delay_1_cycle_floor = some_delay_1_ps / cycle_ps(info); - some_delay_1_cycle_ceil = some_delay_1_ps / cycle_ps(info); - if (some_delay_1_ps % cycle_ps(info)) - some_delay_1_cycle_ceil++; - else - some_delay_1_cycle_floor--; - info->some_delay_1_cycle_floor = some_delay_1_cycle_floor; - if (info->revision_flag_1) - some_delay_2_ps = halfcycle_ps(info) >> 6; - some_delay_2_ps += - MAX(some_delay_1_ps - 30, - 2 * halfcycle_ps(info) * (some_delay_1_cycle_ceil - 1) + 1000) + - 375; - some_delay_3_ps = - halfcycle_ps(info) - some_delay_2_ps % halfcycle_ps(info); - if (info->revision_flag_1) { - if (some_delay_3_ps >= 150) { - const int some_delay_3_halfcycles = - (some_delay_3_ps << 6) / halfcycle_ps(info); - some_delay_3_ps_rounded = - halfcycle_ps(info) * some_delay_3_halfcycles >> 6; - } - } - some_delay_2_halfcycles_ceil = - (some_delay_2_ps + halfcycle_ps(info) - 1) / halfcycle_ps(info) - - 2 * (some_delay_1_cycle_ceil - 1); - if (info->revision_flag_1 && some_delay_3_ps < 150) - some_delay_2_halfcycles_ceil++; - some_delay_2_halfcycles_floor = some_delay_2_halfcycles_ceil; - if (info->revision < 0x10) - some_delay_2_halfcycles_floor = - some_delay_2_halfcycles_ceil - 1; - if (!info->revision_flag_1) - some_delay_2_halfcycles_floor++; - info->some_delay_2_halfcycles_ceil = some_delay_2_halfcycles_ceil; - info->some_delay_3_ps_rounded = some_delay_3_ps_rounded; - if ((info->populated_ranks[0][0][0] && info->populated_ranks[0][1][0]) - || (info->populated_ranks[1][0][0] - && info->populated_ranks[1][1][0])) - info->max_slots_used_in_channel = 2; - else - info->max_slots_used_in_channel = 1; - for (channel = 0; channel < 2; channel++) - MCHBAR32(0x244 + (channel << 10)) = - ((info->revision < 8) ? 1 : 0x200) | - ((2 - info->max_slots_used_in_channel) << 17) | - (channel << 21) | - (info->some_delay_1_cycle_floor << 18) | 0x9510; - if (info->max_slots_used_in_channel == 1) { - info->mode4030[0] = (count_ranks_in_channel(info, 0) == 2); - info->mode4030[1] = (count_ranks_in_channel(info, 1) == 2); - } else { - info->mode4030[0] = ((count_ranks_in_channel(info, 0) == 1) || (count_ranks_in_channel(info, 0) == 2)) ? 2 : 3; /* 2 if 1 or 2 ranks */ - info->mode4030[1] = ((count_ranks_in_channel(info, 1) == 1) - || (count_ranks_in_channel(info, 1) == - 2)) ? 2 : 3; - } - for (channel = 0; channel < NUM_CHANNELS; channel++) { - int max_of_unk; - int min_of_unk_2; - - int i, count; - int sum; - - if (!info->populated_ranks_mask[channel]) - continue; - - max_of_unk = 0; - min_of_unk_2 = 32767; - - sum = 0; - count = 0; - for (i = 0; i < 3; i++) { - int unk1; - if (info->revision < 8) - unk1 = - u8_FFFD1891[0][channel][info-> - clock_speed_index] - [i]; - else if (! - (info->revision >= 0x10 - || info->revision_flag_1)) - unk1 = - u8_FFFD1891[1][channel][info-> - clock_speed_index] - [i]; - else - unk1 = 0; - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_RANKS; rank++) { - int a = 0; - int b = 0; - - if (!info-> - populated_ranks[channel][slot] - [rank]) - continue; - if (extended_silicon_revision == 4 - && (info-> - populated_ranks_mask[channel] & - 5) != 5) { - if ((info-> - spd[channel][slot] - [REFERENCE_RAW_CARD_USED] & - 0x1F) == 3) { - a = u16_ffd1178[0] - [info-> - clock_speed_index]; - b = u16_fe0eb8[0][info-> - clock_speed_index]; - } else - if ((info-> - spd[channel][slot] - [REFERENCE_RAW_CARD_USED] - & 0x1F) == 5) { - a = u16_ffd1178[1] - [info-> - clock_speed_index]; - b = u16_fe0eb8[1][info-> - clock_speed_index]; - } - } - min_of_unk_2 = MIN(min_of_unk_2, a); - min_of_unk_2 = MIN(min_of_unk_2, b); - if (rank == 0) { - sum += a; - count++; - } - { - int t; - t = b + - u8_FFFD0EF8[channel] - [extended_silicon_revision] - [info-> - mode4030[channel]][info-> - clock_speed_index]; - if (unk1 >= t) - max_of_unk = - MAX(max_of_unk, - unk1 - t); - } - } - { - int t = - u8_FFFD17E0[channel] - [extended_silicon_revision][info-> - mode4030 - [channel]] - [info->clock_speed_index] + min_of_unk_2; - if (unk1 >= t) - max_of_unk = MAX(max_of_unk, unk1 - t); - } - } - - if (count == 0) - die("No memory ranks found for channel %u\n", channel); - - info->avg4044[channel] = sum / count; - info->max4048[channel] = max_of_unk; - } -} - -static void jedec_read(struct raminfo *info, - int channel, int slot, int rank, - int total_rank, u8 addr3, unsigned int value) -{ - /* Handle mirrored mapping. */ - if ((rank & 1) && (info->spd[channel][slot][RANK1_ADDRESS_MAPPING] & 1)) - addr3 = (addr3 & 0xCF) | ((addr3 & 0x10) << 1) | - ((addr3 >> 1) & 0x10); - MCHBAR8(0x271) = addr3 | (MCHBAR8(0x271) & 0xC1); - MCHBAR8(0x671) = addr3 | (MCHBAR8(0x671) & 0xC1); - - /* Handle mirrored mapping. */ - if ((rank & 1) && (info->spd[channel][slot][RANK1_ADDRESS_MAPPING] & 1)) - value = - (value & ~0x1f8) | ((value >> 1) & 0xa8) | ((value & 0xa8) - << 1); - - read32p((value << 3) | (total_rank << 28)); - - MCHBAR8(0x271) = (MCHBAR8(0x271) & 0xC3) | 2; - MCHBAR8(0x671) = (MCHBAR8(0x671) & 0xC3) | 2; - - read32p(total_rank << 28); -} - -enum { - MR1_RZQ12 = 512, - MR1_RZQ2 = 64, - MR1_RZQ4 = 4, - MR1_ODS34OHM = 2 -}; - -enum { - MR0_BT_INTERLEAVED = 8, - MR0_DLL_RESET_ON = 256 -}; - -enum { - MR2_RTT_WR_DISABLED = 0, - MR2_RZQ2 = 1 << 10 -}; - -static void jedec_init(struct raminfo *info) -{ - int write_recovery; - int channel, slot, rank; - int total_rank; - int dll_on; - int self_refresh_temperature; - int auto_self_refresh; - - auto_self_refresh = 1; - self_refresh_temperature = 1; - if (info->board_lane_delay[3] <= 10) { - if (info->board_lane_delay[3] <= 8) - write_recovery = info->board_lane_delay[3] - 4; - else - write_recovery = 5; - } else { - write_recovery = 6; - } - FOR_POPULATED_RANKS { - auto_self_refresh &= - (info->spd[channel][slot][THERMAL_AND_REFRESH] >> 2) & 1; - self_refresh_temperature &= - info->spd[channel][slot][THERMAL_AND_REFRESH] & 1; - } - if (auto_self_refresh == 1) - self_refresh_temperature = 0; - - dll_on = ((info->silicon_revision != 2 && info->silicon_revision != 3) - || (info->populated_ranks[0][0][0] - && info->populated_ranks[0][1][0]) - || (info->populated_ranks[1][0][0] - && info->populated_ranks[1][1][0])); - - total_rank = 0; - - for (channel = NUM_CHANNELS - 1; channel >= 0; channel--) { - int rtt, rtt_wr = MR2_RTT_WR_DISABLED; - int rzq_reg58e; - - if (info->silicon_revision == 2 || info->silicon_revision == 3) { - rzq_reg58e = 64; - rtt = MR1_RZQ2; - if (info->clock_speed_index != 0) { - rzq_reg58e = 4; - if (info->populated_ranks_mask[channel] == 3) - rtt = MR1_RZQ4; - } - } else { - if ((info->populated_ranks_mask[channel] & 5) == 5) { - rtt = MR1_RZQ12; - rzq_reg58e = 64; - rtt_wr = MR2_RZQ2; - } else { - rzq_reg58e = 4; - rtt = MR1_RZQ4; - } - } - - MCHBAR16(0x588 + (channel << 10)) = 0x0; - MCHBAR16(0x58a + (channel << 10)) = 0x4; - MCHBAR16(0x58c + (channel << 10)) = rtt | MR1_ODS34OHM; - MCHBAR16(0x58e + (channel << 10)) = rzq_reg58e | 0x82; - MCHBAR16(0x590 + (channel << 10)) = 0x1282; - - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_RANKS; rank++) - if (info->populated_ranks[channel][slot][rank]) { - jedec_read(info, channel, slot, rank, - total_rank, 0x28, - rtt_wr | (info-> - clock_speed_index - << 3) - | (auto_self_refresh << 6) | - (self_refresh_temperature << - 7)); - jedec_read(info, channel, slot, rank, - total_rank, 0x38, 0); - jedec_read(info, channel, slot, rank, - total_rank, 0x18, - rtt | MR1_ODS34OHM); - jedec_read(info, channel, slot, rank, - total_rank, 6, - (dll_on << 12) | - (write_recovery << 9) - | ((info->cas_latency - 4) << - 4) | MR0_BT_INTERLEAVED | - MR0_DLL_RESET_ON); - total_rank++; - } - } -} - -static void program_modules_memory_map(struct raminfo *info, int pre_jedec) -{ - unsigned int channel, slot, rank; - unsigned int total_mb[2] = { 0, 0 }; /* total memory per channel in MB */ - unsigned int channel_0_non_interleaved; - - FOR_ALL_RANKS { - if (info->populated_ranks[channel][slot][rank]) { - total_mb[channel] += - pre_jedec ? 256 : (256 << info-> - density[channel][slot] >> info-> - is_x16_module[channel][slot]); - MCHBAR8(0x208 + rank + 2 * slot + (channel << 10)) = - (pre_jedec ? (1 | ((1 + 1) << 1)) : - (info->is_x16_module[channel][slot] | - ((info->density[channel][slot] + 1) << 1))) | - 0x80; - } - MCHBAR16(0x200 + (channel << 10) + 4 * slot + 2 * rank) = - total_mb[channel] >> 6; - } - - info->total_memory_mb = total_mb[0] + total_mb[1]; - - info->interleaved_part_mb = - pre_jedec ? 0 : 2 * MIN(total_mb[0], total_mb[1]); - info->non_interleaved_part_mb = - total_mb[0] + total_mb[1] - info->interleaved_part_mb; - channel_0_non_interleaved = total_mb[0] - info->interleaved_part_mb / 2; - MCHBAR32(0x100) = channel_0_non_interleaved | - (info->non_interleaved_part_mb << 16); - if (!pre_jedec) - MCHBAR16(0x104) = info->interleaved_part_mb; -} - -static void program_board_delay(struct raminfo *info) -{ - int cas_latency_shift; - int some_delay_ns; - int some_delay_3_half_cycles; - - unsigned int channel, i; - int high_multiplier; - int lane_3_delay; - int cas_latency_derived; - - high_multiplier = 0; - some_delay_ns = 200; - some_delay_3_half_cycles = 4; - cas_latency_shift = info->silicon_revision == 0 - || info->silicon_revision == 1 ? 1 : 0; - if (info->revision < 8) { - some_delay_ns = 600; - cas_latency_shift = 0; - } - { - int speed_bit; - speed_bit = - ((info->clock_speed_index > 1 - || (info->silicon_revision != 2 - && info->silicon_revision != 3))) ^ (info->revision >= - 0x10); - write_500(info, 0, speed_bit | ((!info->use_ecc) << 1), 0x60e, - 3, 1); - write_500(info, 1, speed_bit | ((!info->use_ecc) << 1), 0x60e, - 3, 1); - if (info->revision >= 0x10 && info->clock_speed_index <= 1 - && (info->silicon_revision == 2 - || info->silicon_revision == 3)) - rmw_1d0(0x116, 5, 2, 4, 1); - } - MCHBAR32(0x120) = (1 << (info->max_slots_used_in_channel + 28)) | - 0x188e7f9f; - - MCHBAR8(0x124) = info->board_lane_delay[4] + - ((frequency_01(info) + 999) / 1000); - MCHBAR16(0x125) = 0x1360; - MCHBAR8(0x127) = 0x40; - if (info->fsb_frequency < frequency_11(info) / 2) { - unsigned int some_delay_2_half_cycles; - high_multiplier = 1; - some_delay_2_half_cycles = ps_to_halfcycles(info, - ((3 * - fsbcycle_ps(info)) - >> 1) + - (halfcycle_ps(info) - * - reg178_min[info-> - clock_speed_index] - >> 6) - + - 4 * - halfcycle_ps(info) - + 2230); - some_delay_3_half_cycles = - MIN((some_delay_2_half_cycles + - (frequency_11(info) * 2) * (28 - - some_delay_2_half_cycles) / - (frequency_11(info) * 2 - - 4 * (info->fsb_frequency))) >> 3, 7); - } - if (MCHBAR8(0x2ca9) & 1) - some_delay_3_half_cycles = 3; - for (channel = 0; channel < NUM_CHANNELS; channel++) { - MCHBAR32_OR(0x220 + (channel << 10), 0x18001117); - MCHBAR32(0x224 + (channel << 10)) = - (info->max_slots_used_in_channel - 1) | - ((info->cas_latency - 5 - info->clock_speed_index) - << 21) | ((info->max_slots_used_in_channel + - info->cas_latency - cas_latency_shift - 4) << 16) | - ((info->cas_latency - cas_latency_shift - 4) << 26) | - ((info->cas_latency - info->clock_speed_index + - info->max_slots_used_in_channel - 6) << 8); - MCHBAR32(0x228 + (channel << 10)) = - info->max_slots_used_in_channel; - MCHBAR8(0x239 + (channel << 10)) = 32; - MCHBAR32(0x248 + (channel << 10)) = (high_multiplier << 24) | - (some_delay_3_half_cycles << 25) | 0x840000; - MCHBAR32(0x278 + (channel << 10)) = 0xc362042; - MCHBAR32(0x27c + (channel << 10)) = 0x8b000062; - MCHBAR32(0x24c + (channel << 10)) = - ((!!info->clock_speed_index) << 17) | - (((2 + info->clock_speed_index - - (!!info->clock_speed_index))) << 12) | 0x10200; - - MCHBAR8(0x267 + (channel << 10)) = 0x4; - MCHBAR16(0x272 + (channel << 10)) = 0x155; - MCHBAR32_AND_OR(0x2bc + (channel << 10), 0xFF000000, 0x707070); - - write_500(info, channel, - ((!info->populated_ranks[channel][1][1]) - | (!info->populated_ranks[channel][1][0] << 1) - | (!info->populated_ranks[channel][0][1] << 2) - | (!info->populated_ranks[channel][0][0] << 3)), - 0x4c9, 4, 1); - } - - MCHBAR8(0x2c4) = ((1 + (info->clock_speed_index != 0)) << 6) | 0xC; - { - u8 freq_divisor = 2; - if (info->fsb_frequency == frequency_11(info)) - freq_divisor = 3; - else if (2 * info->fsb_frequency < 3 * (frequency_11(info) / 2)) - freq_divisor = 1; - else - freq_divisor = 2; - MCHBAR32(0x2c0) = (freq_divisor << 11) | 0x6009c400; - } - - if (info->board_lane_delay[3] <= 10) { - if (info->board_lane_delay[3] <= 8) - lane_3_delay = info->board_lane_delay[3]; - else - lane_3_delay = 10; - } else { - lane_3_delay = 12; - } - cas_latency_derived = info->cas_latency - info->clock_speed_index + 2; - if (info->clock_speed_index > 1) - cas_latency_derived++; - for (channel = 0; channel < NUM_CHANNELS; channel++) { - MCHBAR32(0x240 + (channel << 10)) = - ((info->clock_speed_index == 0) * 0x11000) | - 0x1002100 | ((2 + info->clock_speed_index) << 4) | - (info->cas_latency - 3); - write_500(info, channel, (info->clock_speed_index << 1) | 1, - 0x609, 6, 1); - write_500(info, channel, - info->clock_speed_index + 2 * info->cas_latency - 7, - 0x601, 6, 1); - - MCHBAR32(0x250 + (channel << 10)) = - ((lane_3_delay + info->clock_speed_index + 9) << 6) | - (info->board_lane_delay[7] << 2) | - (info->board_lane_delay[4] << 16) | - (info->board_lane_delay[1] << 25) | - (info->board_lane_delay[1] << 29) | 1; - MCHBAR32(0x254 + (channel << 10)) = - (info->board_lane_delay[1] >> 3) | - ((info->board_lane_delay[8] + 4 * info->use_ecc) << 6) | - 0x80 | (info->board_lane_delay[6] << 1) | - (info->board_lane_delay[2] << 28) | - (cas_latency_derived << 16) | 0x4700000; - MCHBAR32(0x258 + (channel << 10)) = - ((info->board_lane_delay[5] + info->clock_speed_index + - 9) << 12) | ((info->clock_speed_index - - info->cas_latency + 12) << 8) | - (info->board_lane_delay[2] << 17) | - (info->board_lane_delay[4] << 24) | 0x47; - MCHBAR32(0x25c + (channel << 10)) = - (info->board_lane_delay[1] << 1) | - (info->board_lane_delay[0] << 8) | 0x1da50000; - MCHBAR8(0x264 + (channel << 10)) = 0xff; - MCHBAR8(0x5f8 + (channel << 10)) = - (cas_latency_shift << 3) | info->use_ecc; - } - - program_modules_memory_map(info, 1); - - MCHBAR16(0x610) = (MIN(ns_to_cycles(info, some_delay_ns) / 2, 127) << 9) - | (MCHBAR16(0x610) & 0x1C3) | 0x3C; - MCHBAR16_OR(0x612, 0x100); - MCHBAR16_OR(0x214, 0x3E00); - for (i = 0; i < 8; i++) { - pci_write_config32(PCI_DEV (QUICKPATH_BUS, 0, 1), 0x80 + 4 * i, - (info->total_memory_mb - 64) | !i | 2); - pci_write_config32(PCI_DEV (QUICKPATH_BUS, 0, 1), 0xc0 + 4 * i, 0); - } -} - -#define DEFAULT_PCI_MMIO_SIZE 2048 -#define HOST_BRIDGE PCI_DEVFN(0, 0) - -static unsigned int get_mmio_size(void) -{ - const struct device *dev; - const struct northbridge_intel_nehalem_config *cfg = NULL; - - dev = pcidev_path_on_root(HOST_BRIDGE); - if (dev) - cfg = dev->chip_info; - - /* If this is zero, it just means devicetree.cb didn't set it */ - if (!cfg || cfg->pci_mmio_size == 0) - return DEFAULT_PCI_MMIO_SIZE; - else - return cfg->pci_mmio_size; -} - -#define BETTER_MEMORY_MAP 0 - -static void program_total_memory_map(struct raminfo *info) -{ - unsigned int TOM, TOLUD, TOUUD; - unsigned int quickpath_reserved; - unsigned int REMAPbase; - unsigned int uma_base_igd; - unsigned int uma_base_gtt; - unsigned int mmio_size; - int memory_remap; - unsigned int memory_map[8]; - int i; - unsigned int current_limit; - unsigned int tseg_base; - int uma_size_igd = 0, uma_size_gtt = 0; - - memset(memory_map, 0, sizeof(memory_map)); - - if (info->uma_enabled) { - u16 t = pci_read_config16(NORTHBRIDGE, D0F0_GGC); - gav(t); - const int uma_sizes_gtt[16] = - { 0, 1, 0, 2, 0, 0, 0, 0, 0, 2, 3, 4, 42, 42, 42, 42 }; - /* Igd memory */ - const int uma_sizes_igd[16] = { - 0, 0, 0, 0, 0, 32, 48, 64, 128, 256, 96, 160, 224, 352, - 256, 512 - }; - - uma_size_igd = uma_sizes_igd[(t >> 4) & 0xF]; - uma_size_gtt = uma_sizes_gtt[(t >> 8) & 0xF]; - } - - mmio_size = get_mmio_size(); - - TOM = info->total_memory_mb; - if (TOM == 4096) - TOM = 4032; - TOUUD = ALIGN_DOWN(TOM - info->memory_reserved_for_heci_mb, 64); - TOLUD = ALIGN_DOWN(MIN(4096 - mmio_size + ALIGN_UP(uma_size_igd + uma_size_gtt, 64) - , TOUUD), 64); - memory_remap = 0; - if (TOUUD - TOLUD > 64) { - memory_remap = 1; - REMAPbase = MAX(4096, TOUUD); - TOUUD = TOUUD - TOLUD + 4096; - } - if (TOUUD > 4096) - memory_map[2] = TOUUD | 1; - quickpath_reserved = 0; - - u32 t = pci_read_config32(PCI_DEV(QUICKPATH_BUS, 0, 1), 0x68); - - gav(t); - - if (t & 0x800) { - u32 shift = t >> 20; - if (shift == 0) - die("Quickpath value is 0\n"); - quickpath_reserved = (u32)1 << find_lowest_bit_set32(shift); - } - - if (memory_remap) - TOUUD -= quickpath_reserved; - - uma_base_igd = TOLUD - uma_size_igd; - uma_base_gtt = uma_base_igd - uma_size_gtt; - tseg_base = ALIGN_DOWN(uma_base_gtt, 64) - (CONFIG_SMM_TSEG_SIZE >> 20); - if (!memory_remap) - tseg_base -= quickpath_reserved; - tseg_base = ALIGN_DOWN(tseg_base, 8); - - pci_write_config16(NORTHBRIDGE, D0F0_TOLUD, TOLUD << 4); - pci_write_config16(NORTHBRIDGE, D0F0_TOM, TOM >> 6); - if (memory_remap) { - pci_write_config16(NORTHBRIDGE, D0F0_REMAPBASE, REMAPbase >> 6); - pci_write_config16(NORTHBRIDGE, D0F0_REMAPLIMIT, (TOUUD - 64) >> 6); - } - pci_write_config16(NORTHBRIDGE, D0F0_TOUUD, TOUUD); - - if (info->uma_enabled) { - pci_write_config32(NORTHBRIDGE, D0F0_IGD_BASE, uma_base_igd << 20); - pci_write_config32(NORTHBRIDGE, D0F0_GTT_BASE, uma_base_gtt << 20); - } - pci_write_config32(NORTHBRIDGE, TSEG, tseg_base << 20); - - current_limit = 0; - memory_map[0] = ALIGN_DOWN(uma_base_gtt, 64) | 1; - memory_map[1] = 4096; - for (i = 0; i < ARRAY_SIZE(memory_map); i++) { - current_limit = MAX(current_limit, memory_map[i] & ~1); - pci_write_config32(PCI_DEV(QUICKPATH_BUS, 0, 1), 4 * i + 0x80, - (memory_map[i] & 1) | ALIGN_DOWN(current_limit - - 1, 64) | 2); - pci_write_config32(PCI_DEV(QUICKPATH_BUS, 0, 1), 4 * i + 0xc0, 0); - } -} - -static void collect_system_info(struct raminfo *info) -{ - u32 capid0[3]; - int i; - unsigned int channel; - - /* Wait for some bit, maybe TXT clear. */ - while (!(read8((u8 *)0xfed40000) & (1 << 7))) - ; - - if (!info->heci_bar) - gav(info->heci_bar = - pci_read_config32(HECIDEV, HECIBAR) & 0xFFFFFFF8); - if (!info->memory_reserved_for_heci_mb) { - /* Wait for ME to be ready */ - intel_early_me_init(); - info->memory_reserved_for_heci_mb = intel_early_me_uma_size(); - } - - for (i = 0; i < 3; i++) - gav(capid0[i] = - pci_read_config32(NORTHBRIDGE, D0F0_CAPID0 | (i << 2))); - gav(info->revision = pci_read_config8(NORTHBRIDGE, PCI_REVISION_ID)); - info->max_supported_clock_speed_index = (~capid0[1] & 7); - - if ((capid0[1] >> 11) & 1) - info->uma_enabled = 0; - else - gav(info->uma_enabled = - pci_read_config8(NORTHBRIDGE, D0F0_DEVEN) & 8); - /* Unrecognised: [0000:fffd3d2d] 37f81.37f82 ! CPUID: eax: 00000001; ecx: 00000e00 => 00020655.00010800.029ae3ff.bfebfbff */ - info->silicon_revision = 0; - - if (capid0[2] & 2) { - info->silicon_revision = 0; - info->max_supported_clock_speed_index = 2; - for (channel = 0; channel < NUM_CHANNELS; channel++) - if (info->populated_ranks[channel][0][0] - && (info->spd[channel][0][MODULE_TYPE] & 0xf) == - 3) { - info->silicon_revision = 2; - info->max_supported_clock_speed_index = 1; - } - } else { - switch (((capid0[2] >> 18) & 1) + 2 * ((capid0[1] >> 3) & 1)) { - case 1: - case 2: - info->silicon_revision = 3; - break; - case 3: - info->silicon_revision = 0; - break; - case 0: - info->silicon_revision = 2; - break; - } - switch (pci_read_config16(NORTHBRIDGE, PCI_DEVICE_ID)) { - case 0x40: - info->silicon_revision = 0; - break; - case 0x48: - info->silicon_revision = 1; - break; - } - } -} - -static void write_training_data(struct raminfo *info) -{ - int tm, channel, slot, rank, lane; - if (info->revision < 8) - return; - - for (tm = 0; tm < 4; tm++) - for (channel = 0; channel < NUM_CHANNELS; channel++) - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_RANKS; rank++) - for (lane = 0; lane < 9; lane++) - write_500(info, channel, - info-> - cached_training-> - lane_timings[tm] - [channel][slot][rank] - [lane], - get_timing_register_addr - (lane, tm, slot, - rank), 9, 0); - write_1d0(info->cached_training->reg_178, 0x178, 7, 1); - write_1d0(info->cached_training->reg_10b, 0x10b, 6, 1); -} - -static void dump_timings(struct raminfo *info) -{ - int channel, slot, rank, lane, i; - printk(RAM_SPEW, "Timings:\n"); - FOR_POPULATED_RANKS { - printk(RAM_SPEW, "channel %d, slot %d, rank %d\n", channel, - slot, rank); - for (lane = 0; lane < 9; lane++) { - printk(RAM_SPEW, "lane %d: ", lane); - for (i = 0; i < 4; i++) { - printk(RAM_SPEW, "%x (%x) ", - read_500(info, channel, - get_timing_register_addr - (lane, i, slot, rank), - 9), - info->training. - lane_timings[i][channel][slot][rank] - [lane]); - } - printk(RAM_SPEW, "\n"); - } - } - printk(RAM_SPEW, "[178] = %x (%x)\n", read_1d0(0x178, 7), - info->training.reg_178); - printk(RAM_SPEW, "[10b] = %x (%x)\n", read_1d0(0x10b, 6), - info->training.reg_10b); -} - -/* Read timings and other registers that need to be restored verbatim and - put them to CBMEM. - */ -static void save_timings(struct raminfo *info) -{ - struct ram_training train; - int channel, slot, rank, lane, i; - - train = info->training; - FOR_POPULATED_RANKS for (lane = 0; lane < 9; lane++) - for (i = 0; i < 4; i++) - train.lane_timings[i][channel][slot][rank][lane] = - read_500(info, channel, - get_timing_register_addr(lane, i, slot, - rank), 9); - train.reg_178 = read_1d0(0x178, 7); - train.reg_10b = read_1d0(0x10b, 6); - - for (channel = 0; channel < NUM_CHANNELS; channel++) { - u32 reg32; - reg32 = MCHBAR32((channel << 10) + 0x274); - train.reg274265[channel][0] = reg32 >> 16; - train.reg274265[channel][1] = reg32 & 0xffff; - train.reg274265[channel][2] = - MCHBAR16((channel << 10) + 0x265) >> 8; - } - train.reg2ca9_bit0 = MCHBAR8(0x2ca9) & 1; - train.reg_6dc = MCHBAR32(0x6dc); - train.reg_6e8 = MCHBAR32(0x6e8); - - printk(RAM_SPEW, "[6dc] = %x\n", train.reg_6dc); - printk(RAM_SPEW, "[6e8] = %x\n", train.reg_6e8); - - /* Save the MRC S3 restore data to cbmem */ - mrc_cache_stash_data(MRC_TRAINING_DATA, MRC_CACHE_VERSION, - &train, sizeof(train)); -} - -static const struct ram_training *get_cached_training(void) -{ - struct region_device rdev; - if (mrc_cache_get_current(MRC_TRAINING_DATA, MRC_CACHE_VERSION, - &rdev)) - return 0; - return (void *)rdev_mmap_full(&rdev); -} - -/* FIXME: add timeout. */ -static void wait_heci_ready(void) -{ - while (!(read32(DEFAULT_HECIBAR + 0xc) & 8)) // = 0x8000000c - ; - write32((DEFAULT_HECIBAR + 0x4), - (read32(DEFAULT_HECIBAR + 0x4) & ~0x10) | 0xc); -} - -/* FIXME: add timeout. */ -static void wait_heci_cb_avail(int len) -{ - union { - struct mei_csr csr; - u32 raw; - } csr; - - while (!(read32(DEFAULT_HECIBAR + 0xc) & 8)) - ; - - do - csr.raw = read32(DEFAULT_HECIBAR + 0x4); - while (len > - csr.csr.buffer_depth - (csr.csr.buffer_write_ptr - - csr.csr.buffer_read_ptr)) - ; -} - -static void send_heci_packet(struct mei_header *head, u32 *payload) -{ - int len = (head->length + 3) / 4; - int i; - - wait_heci_cb_avail(len + 1); - - /* FIXME: handle leftovers correctly. */ - write32(DEFAULT_HECIBAR + 0, *(u32 *) head); - for (i = 0; i < len - 1; i++) - write32(DEFAULT_HECIBAR + 0, payload[i]); - - write32(DEFAULT_HECIBAR + 0, payload[i] & ((1 << (8 * len)) - 1)); - write32(DEFAULT_HECIBAR + 0x4, read32(DEFAULT_HECIBAR + 0x4) | 0x4); -} - -static void -send_heci_message(u8 *msg, int len, u8 hostaddress, u8 clientaddress) -{ - struct mei_header head; - int maxlen; - - wait_heci_ready(); - maxlen = (read32(DEFAULT_HECIBAR + 0x4) >> 24) * 4 - 4; - - while (len) { - int cur = len; - if (cur > maxlen) { - cur = maxlen; - head.is_complete = 0; - } else - head.is_complete = 1; - head.length = cur; - head.reserved = 0; - head.client_address = clientaddress; - head.host_address = hostaddress; - send_heci_packet(&head, (u32 *) msg); - len -= cur; - msg += cur; - } -} - -/* FIXME: Add timeout. */ -static int -recv_heci_packet(struct raminfo *info, struct mei_header *head, u32 *packet, - u32 *packet_size) -{ - union { - struct mei_csr csr; - u32 raw; - } csr; - int i = 0; - - write32(DEFAULT_HECIBAR + 0x4, read32(DEFAULT_HECIBAR + 0x4) | 2); - do { - csr.raw = read32(DEFAULT_HECIBAR + 0xc); - } - while (csr.csr.buffer_write_ptr == csr.csr.buffer_read_ptr) - ; - *(u32 *) head = read32(DEFAULT_HECIBAR + 0x8); - if (!head->length) { - write32(DEFAULT_HECIBAR + 0x4, - read32(DEFAULT_HECIBAR + 0x4) | 2); - *packet_size = 0; - return 0; - } - if (head->length + 4 > 4 * csr.csr.buffer_depth - || head->length > *packet_size) { - *packet_size = 0; - return -1; - } - - do - csr.raw = read32(DEFAULT_HECIBAR + 0xc); - while (((head->length + 3) >> 2) > - (csr.csr.buffer_write_ptr - csr.csr.buffer_read_ptr)) - ; - - for (i = 0; i < (head->length + 3) >> 2; i++) - packet[i++] = read32(DEFAULT_HECIBAR + 0x8); - *packet_size = head->length; - if (!csr.csr.ready) - *packet_size = 0; - write32(DEFAULT_HECIBAR + 0x4, read32(DEFAULT_HECIBAR + 0x4) | 4); - return 0; -} - -/* FIXME: Add timeout. */ -static int -recv_heci_message(struct raminfo *info, u32 *message, u32 *message_size) -{ - struct mei_header head; - int current_position; - - current_position = 0; - while (1) { - u32 current_size; - current_size = *message_size - current_position; - if (recv_heci_packet - (info, &head, message + (current_position >> 2), - ¤t_size) == -1) - break; - if (!current_size) - break; - current_position += current_size; - if (head.is_complete) { - *message_size = current_position; - return 0; - } - - if (current_position >= *message_size) - break; - } - *message_size = 0; - return -1; -} - -static void send_heci_uma_message(struct raminfo *info) -{ - struct uma_reply { - u8 group_id; - u8 command; - u8 reserved; - u8 result; - u8 field2; - u8 unk3[0x48 - 4 - 1]; - } __packed reply; - struct uma_message { - u8 group_id; - u8 cmd; - u8 reserved; - u8 result; - u32 c2; - u64 heci_uma_addr; - u32 memory_reserved_for_heci_mb; - u16 c3; - } __packed msg = { - 0, MKHI_SET_UMA, 0, 0, - 0x82, - info->heci_uma_addr, info->memory_reserved_for_heci_mb, 0}; - u32 reply_size; - - send_heci_message((u8 *) & msg, sizeof(msg), 0, 7); - - reply_size = sizeof(reply); - if (recv_heci_message(info, (u32 *) & reply, &reply_size) == -1) - return; - - if (reply.command != (MKHI_SET_UMA | (1 << 7))) - die("HECI init failed\n"); -} - -static void setup_heci_uma(struct raminfo *info) -{ - u32 reg44; - - reg44 = pci_read_config32(HECIDEV, 0x44); // = 0x80010020 - info->memory_reserved_for_heci_mb = 0; - info->heci_uma_addr = 0; - if (!((reg44 & 0x10000) && !(pci_read_config32(HECIDEV, 0x40) & 0x20))) - return; - - info->heci_bar = pci_read_config32(HECIDEV, 0x10) & 0xFFFFFFF0; - info->memory_reserved_for_heci_mb = reg44 & 0x3f; - info->heci_uma_addr = - ((u64) - ((((u64) pci_read_config16(NORTHBRIDGE, D0F0_TOM)) << 6) - - info->memory_reserved_for_heci_mb)) << 20; - - pci_read_config32(NORTHBRIDGE, DMIBAR); - if (info->memory_reserved_for_heci_mb) { - write32(DEFAULT_DMIBAR + 0x14, - read32(DEFAULT_DMIBAR + 0x14) & ~0x80); - write32(DEFAULT_RCBA + 0x14, - read32(DEFAULT_RCBA + 0x14) & ~0x80); - write32(DEFAULT_DMIBAR + 0x20, - read32(DEFAULT_DMIBAR + 0x20) & ~0x80); - write32(DEFAULT_RCBA + 0x20, - read32(DEFAULT_RCBA + 0x20) & ~0x80); - write32(DEFAULT_DMIBAR + 0x2c, - read32(DEFAULT_DMIBAR + 0x2c) & ~0x80); - write32(DEFAULT_RCBA + 0x30, - read32(DEFAULT_RCBA + 0x30) & ~0x80); - write32(DEFAULT_DMIBAR + 0x38, - read32(DEFAULT_DMIBAR + 0x38) & ~0x80); - write32(DEFAULT_RCBA + 0x40, - read32(DEFAULT_RCBA + 0x40) & ~0x80); - - write32(DEFAULT_RCBA + 0x40, 0x87000080); // OK - write32(DEFAULT_DMIBAR + 0x38, 0x87000080); // OK - while ((read16(DEFAULT_RCBA + 0x46) & 2) && - read16(DEFAULT_DMIBAR + 0x3e) & 2) - ; - } - - MCHBAR32(0x24) = 0x10000 + info->memory_reserved_for_heci_mb; - - send_heci_uma_message(info); - - pci_write_config32(HECIDEV, 0x10, 0x0); - pci_write_config8(HECIDEV, 0x4, 0x0); - -} - -static int have_match_ranks(struct raminfo *info, int channel, int ranks) -{ - int ranks_in_channel; - ranks_in_channel = info->populated_ranks[channel][0][0] - + info->populated_ranks[channel][0][1] - + info->populated_ranks[channel][1][0] - + info->populated_ranks[channel][1][1]; - - /* empty channel */ - if (ranks_in_channel == 0) - return 1; - - if (ranks_in_channel != ranks) - return 0; - /* single slot */ - if (info->populated_ranks[channel][0][0] != - info->populated_ranks[channel][1][0]) - return 1; - if (info->populated_ranks[channel][0][1] != - info->populated_ranks[channel][1][1]) - return 1; - if (info->is_x16_module[channel][0] != info->is_x16_module[channel][1]) - return 0; - if (info->density[channel][0] != info->density[channel][1]) - return 0; - return 1; -} - -static void read_4090(struct raminfo *info) -{ - int i, channel, slot, rank, lane; - for (i = 0; i < 2; i++) - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_RANKS; rank++) - for (lane = 0; lane < 9; lane++) - info->training. - lane_timings[0][i][slot][rank][lane] - = 32; - - for (i = 1; i < 4; i++) - for (channel = 0; channel < NUM_CHANNELS; channel++) - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_RANKS; rank++) - for (lane = 0; lane < 9; lane++) { - info->training. - lane_timings[i][channel] - [slot][rank][lane] = - read_500(info, channel, - get_timing_register_addr - (lane, i, slot, - rank), 9) - + (i == 1) * 11; // !!!! - } - -} - -static u32 get_etalon2(int flip, u32 addr) -{ - const u16 invmask[] = { - 0xaaaa, 0x6db6, 0x4924, 0xeeee, 0xcccc, 0x8888, 0x7bde, 0x739c, - 0x6318, 0x4210, 0xefbe, 0xcf3c, 0x8e38, 0x0c30, 0x0820 - }; - u32 ret; - u32 comp4 = addr / 480; - addr %= 480; - u32 comp1 = addr & 0xf; - u32 comp2 = (addr >> 4) & 1; - u32 comp3 = addr >> 5; - - if (comp4) - ret = 0x1010101 << (comp4 - 1); - else - ret = 0; - if (flip ^ (((invmask[comp3] >> comp1) ^ comp2) & 1)) - ret = ~ret; - - return ret; -} - -static void disable_cache_region(void) -{ - msr_t msr = {.lo = 0, .hi = 0 }; - - wrmsr(MTRR_PHYS_BASE(3), msr); - wrmsr(MTRR_PHYS_MASK(3), msr); -} - -static void enable_cache_region(unsigned int base, unsigned int size) -{ - msr_t msr; - msr.lo = base | MTRR_TYPE_WRPROT; - msr.hi = 0; - wrmsr(MTRR_PHYS_BASE(3), msr); - msr.lo = ((~(ALIGN_DOWN(size + 4096, 4096) - 1) | MTRR_DEF_TYPE_EN) - & 0xffffffff); - msr.hi = 0x0000000f; - wrmsr(MTRR_PHYS_MASK(3), msr); -} - -static void flush_cache(u32 start, u32 size) -{ - u32 end; - u32 addr; - - end = start + (ALIGN_DOWN(size + 4096, 4096)); - for (addr = start; addr < end; addr += 64) - clflush((void *)addr); -} - -static void clear_errors(void) -{ - pci_write_config8(NORTHBRIDGE, 0xc0, 0x01); -} - -static void write_testing(struct raminfo *info, int totalrank, int flip) -{ - int nwrites = 0; - /* in 8-byte units. */ - u32 offset; - u8 *base; - - base = (u8 *)(totalrank << 28); - for (offset = 0; offset < 9 * 480; offset += 2) { - write32(base + offset * 8, get_etalon2(flip, offset)); - write32(base + offset * 8 + 4, get_etalon2(flip, offset)); - write32(base + offset * 8 + 8, get_etalon2(flip, offset + 1)); - write32(base + offset * 8 + 12, get_etalon2(flip, offset + 1)); - nwrites += 4; - if (nwrites >= 320) { - clear_errors(); - nwrites = 0; - } - } -} - -static u8 check_testing(struct raminfo *info, u8 total_rank, int flip) -{ - u8 failmask = 0; - int i; - int comp1, comp2, comp3; - u32 failxor[2] = { 0, 0 }; - - enable_cache_region((total_rank << 28), 1728 * 5 * 4); - - for (comp3 = 0; comp3 < 9 && failmask != 0xff; comp3++) { - for (comp1 = 0; comp1 < 4; comp1++) - for (comp2 = 0; comp2 < 60; comp2++) { - u32 re[4]; - u32 curroffset = - comp3 * 8 * 60 + 2 * comp1 + 8 * comp2; - read128((total_rank << 28) | (curroffset << 3), - (u64 *) re); - failxor[0] |= - get_etalon2(flip, curroffset) ^ re[0]; - failxor[1] |= - get_etalon2(flip, curroffset) ^ re[1]; - failxor[0] |= - get_etalon2(flip, curroffset | 1) ^ re[2]; - failxor[1] |= - get_etalon2(flip, curroffset | 1) ^ re[3]; - } - for (i = 0; i < 8; i++) - if ((0xff << (8 * (i % 4))) & failxor[i / 4]) - failmask |= 1 << i; - } - disable_cache_region(); - flush_cache((total_rank << 28), 1728 * 5 * 4); - return failmask; -} - -const u32 seed1[0x18] = { - 0x3a9d5ab5, 0x576cb65b, 0x555773b6, 0x2ab772ee, - 0x555556ee, 0x3a9d5ab5, 0x576cb65b, 0x555773b6, - 0x2ab772ee, 0x555556ee, 0x5155a555, 0x5155a555, - 0x5155a555, 0x5155a555, 0x3a9d5ab5, 0x576cb65b, - 0x555773b6, 0x2ab772ee, 0x555556ee, 0x55d6b4a5, - 0x366d6b3a, 0x2ae5ddbb, 0x3b9ddbb7, 0x55d6b4a5, -}; - -static u32 get_seed2(int a, int b) -{ - const u32 seed2[5] = { - 0x55555555, 0x33333333, 0x2e555a55, 0x55555555, - 0x5b6db6db, - }; - u32 r; - r = seed2[(a + (a >= 10)) / 5]; - return b ? ~r : r; -} - -static int make_shift(int comp2, int comp5, int x) -{ - const u8 seed3[32] = { - 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, - 0x00, 0x00, 0x38, 0x1c, 0x3c, 0x18, 0x38, 0x38, - 0x38, 0x38, 0x38, 0x38, 0x0f, 0x0f, 0x0f, 0x0f, - 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, - }; - - return (comp2 - ((seed3[comp5] >> (x & 7)) & 1)) & 0x1f; -} - -static u32 get_etalon(int flip, u32 addr) -{ - u32 mask_byte = 0; - int comp1 = (addr >> 1) & 1; - int comp2 = (addr >> 3) & 0x1f; - int comp3 = (addr >> 8) & 0xf; - int comp4 = (addr >> 12) & 0xf; - int comp5 = (addr >> 16) & 0x1f; - u32 mask_bit = ~(0x10001 << comp3); - u32 part1; - u32 part2; - int byte; - - part2 = - ((seed1[comp5] >> - make_shift(comp2, comp5, - (comp3 >> 3) | (comp1 << 2) | 2)) & 1) ^ flip; - part1 = - ((seed1[comp5] >> - make_shift(comp2, comp5, - (comp3 >> 3) | (comp1 << 2) | 0)) & 1) ^ flip; - - for (byte = 0; byte < 4; byte++) - if ((get_seed2(comp5, comp4) >> - make_shift(comp2, comp5, (byte | (comp1 << 2)))) & 1) - mask_byte |= 0xff << (8 * byte); - - return (mask_bit & mask_byte) | (part1 << comp3) | (part2 << - (comp3 + 16)); -} - -static void -write_testing_type2(struct raminfo *info, u8 totalrank, u8 region, u8 block, - char flip) -{ - int i; - for (i = 0; i < 2048; i++) - write32p((totalrank << 28) | (region << 25) | (block << 16) | - (i << 2), get_etalon(flip, (block << 16) | (i << 2))); -} - -static u8 -check_testing_type2(struct raminfo *info, u8 totalrank, u8 region, u8 block, - char flip) -{ - u8 failmask = 0; - u32 failxor[2]; - int i; - int comp1, comp2, comp3; - - failxor[0] = 0; - failxor[1] = 0; - - enable_cache_region(totalrank << 28, 134217728); - for (comp3 = 0; comp3 < 2 && failmask != 0xff; comp3++) { - for (comp1 = 0; comp1 < 16; comp1++) - for (comp2 = 0; comp2 < 64; comp2++) { - u32 addr = - (totalrank << 28) | (region << 25) | (block - << 16) - | (comp3 << 12) | (comp2 << 6) | (comp1 << - 2); - failxor[comp1 & 1] |= - read32p(addr) ^ get_etalon(flip, addr); - } - for (i = 0; i < 8; i++) - if ((0xff << (8 * (i % 4))) & failxor[i / 4]) - failmask |= 1 << i; - } - disable_cache_region(); - flush_cache((totalrank << 28) | (region << 25) | (block << 16), 16384); - return failmask; -} - -static int check_bounded(unsigned short *vals, u16 bound) -{ - int i; - - for (i = 0; i < 8; i++) - if (vals[i] < bound) - return 0; - return 1; -} - -enum state { - BEFORE_USABLE = 0, AT_USABLE = 1, AT_MARGIN = 2, COMPLETE = 3 -}; - -static int validate_state(enum state *in) -{ - int i; - for (i = 0; i < 8; i++) - if (in[i] != COMPLETE) - return 0; - return 1; -} - -static void -do_fsm(enum state *state, u16 *counter, - u8 fail_mask, int margin, int uplimit, - u8 *res_low, u8 *res_high, u8 val) -{ - int lane; - - for (lane = 0; lane < 8; lane++) { - int is_fail = (fail_mask >> lane) & 1; - switch (state[lane]) { - case BEFORE_USABLE: - if (!is_fail) { - counter[lane] = 1; - state[lane] = AT_USABLE; - break; - } - counter[lane] = 0; - state[lane] = BEFORE_USABLE; - break; - case AT_USABLE: - if (!is_fail) { - ++counter[lane]; - if (counter[lane] >= margin) { - state[lane] = AT_MARGIN; - res_low[lane] = val - margin + 1; - break; - } - state[lane] = 1; - break; - } - counter[lane] = 0; - state[lane] = BEFORE_USABLE; - break; - case AT_MARGIN: - if (is_fail) { - state[lane] = COMPLETE; - res_high[lane] = val - 1; - } else { - counter[lane]++; - state[lane] = AT_MARGIN; - if (val == uplimit) { - state[lane] = COMPLETE; - res_high[lane] = uplimit; - } - } - break; - case COMPLETE: - break; - } - } -} - -static void -train_ram_at_178(struct raminfo *info, u8 channel, int slot, int rank, - u8 total_rank, u8 reg_178, int first_run, int niter, - timing_bounds_t * timings) -{ - int lane; - enum state state[8]; - u16 count[8]; - u8 lower_usable[8]; - u8 upper_usable[8]; - unsigned short num_successfully_checked[8]; - u8 reg1b3; - int i; - - for (i = 0; i < 8; i++) - state[i] = BEFORE_USABLE; - - if (!first_run) { - int is_all_ok = 1; - for (lane = 0; lane < 8; lane++) - if (timings[reg_178][channel][slot][rank][lane]. - smallest == - timings[reg_178][channel][slot][rank][lane]. - largest) { - timings[reg_178][channel][slot][rank][lane]. - smallest = 0; - timings[reg_178][channel][slot][rank][lane]. - largest = 0; - is_all_ok = 0; - } - if (is_all_ok) { - for (i = 0; i < 8; i++) - state[i] = COMPLETE; - } - } - - for (reg1b3 = 0; reg1b3 < 0x30 && !validate_state(state); reg1b3++) { - u8 failmask = 0; - write_1d0(reg1b3 ^ 32, 0x1b3, 6, 1); - write_1d0(reg1b3 ^ 32, 0x1a3, 6, 1); - failmask = check_testing(info, total_rank, 0); - MCHBAR32_OR(0xfb0, 0x00030000); - do_fsm(state, count, failmask, 5, 47, lower_usable, - upper_usable, reg1b3); - } - - if (reg1b3) { - write_1d0(0, 0x1b3, 6, 1); - write_1d0(0, 0x1a3, 6, 1); - for (lane = 0; lane < 8; lane++) { - if (state[lane] == COMPLETE) { - timings[reg_178][channel][slot][rank][lane]. - smallest = - lower_usable[lane] + - (info->training. - lane_timings[0][channel][slot][rank][lane] - & 0x3F) - 32; - timings[reg_178][channel][slot][rank][lane]. - largest = - upper_usable[lane] + - (info->training. - lane_timings[0][channel][slot][rank][lane] - & 0x3F) - 32; - } - } - } - - if (!first_run) { - for (lane = 0; lane < 8; lane++) - if (state[lane] == COMPLETE) { - write_500(info, channel, - timings[reg_178][channel][slot][rank] - [lane].smallest, - get_timing_register_addr(lane, 0, - slot, rank), - 9, 1); - write_500(info, channel, - timings[reg_178][channel][slot][rank] - [lane].smallest + - info->training. - lane_timings[1][channel][slot][rank] - [lane] - - - info->training. - lane_timings[0][channel][slot][rank] - [lane], get_timing_register_addr(lane, - 1, - slot, - rank), - 9, 1); - num_successfully_checked[lane] = 0; - } else - num_successfully_checked[lane] = -1; - - do { - u8 failmask = 0; - for (i = 0; i < niter; i++) { - if (failmask == 0xFF) - break; - failmask |= - check_testing_type2(info, total_rank, 2, i, - 0); - failmask |= - check_testing_type2(info, total_rank, 3, i, - 1); - } - MCHBAR32_OR(0xfb0, 0x00030000); - for (lane = 0; lane < 8; lane++) - if (num_successfully_checked[lane] != 0xffff) { - if ((1 << lane) & failmask) { - if (timings[reg_178][channel] - [slot][rank][lane]. - largest <= - timings[reg_178][channel] - [slot][rank][lane].smallest) - num_successfully_checked - [lane] = -1; - else { - num_successfully_checked - [lane] = 0; - timings[reg_178] - [channel][slot] - [rank][lane]. - smallest++; - write_500(info, channel, - timings - [reg_178] - [channel] - [slot][rank] - [lane]. - smallest, - get_timing_register_addr - (lane, 0, - slot, rank), - 9, 1); - write_500(info, channel, - timings - [reg_178] - [channel] - [slot][rank] - [lane]. - smallest + - info-> - training. - lane_timings - [1][channel] - [slot][rank] - [lane] - - - info-> - training. - lane_timings - [0][channel] - [slot][rank] - [lane], - get_timing_register_addr - (lane, 1, - slot, rank), - 9, 1); - } - } else - num_successfully_checked[lane] - ++; - } - } - while (!check_bounded(num_successfully_checked, 2)) - ; - - for (lane = 0; lane < 8; lane++) - if (state[lane] == COMPLETE) { - write_500(info, channel, - timings[reg_178][channel][slot][rank] - [lane].largest, - get_timing_register_addr(lane, 0, - slot, rank), - 9, 1); - write_500(info, channel, - timings[reg_178][channel][slot][rank] - [lane].largest + - info->training. - lane_timings[1][channel][slot][rank] - [lane] - - - info->training. - lane_timings[0][channel][slot][rank] - [lane], get_timing_register_addr(lane, - 1, - slot, - rank), - 9, 1); - num_successfully_checked[lane] = 0; - } else - num_successfully_checked[lane] = -1; - - do { - int failmask = 0; - for (i = 0; i < niter; i++) { - if (failmask == 0xFF) - break; - failmask |= - check_testing_type2(info, total_rank, 2, i, - 0); - failmask |= - check_testing_type2(info, total_rank, 3, i, - 1); - } - - MCHBAR32_OR(0xfb0, 0x00030000); - for (lane = 0; lane < 8; lane++) { - if (num_successfully_checked[lane] != 0xffff) { - if ((1 << lane) & failmask) { - if (timings[reg_178][channel] - [slot][rank][lane]. - largest <= - timings[reg_178][channel] - [slot][rank][lane]. - smallest) { - num_successfully_checked - [lane] = -1; - } else { - num_successfully_checked - [lane] = 0; - timings[reg_178] - [channel][slot] - [rank][lane]. - largest--; - write_500(info, channel, - timings - [reg_178] - [channel] - [slot][rank] - [lane]. - largest, - get_timing_register_addr - (lane, 0, - slot, rank), - 9, 1); - write_500(info, channel, - timings - [reg_178] - [channel] - [slot][rank] - [lane]. - largest + - info-> - training. - lane_timings - [1][channel] - [slot][rank] - [lane] - - - info-> - training. - lane_timings - [0][channel] - [slot][rank] - [lane], - get_timing_register_addr - (lane, 1, - slot, rank), - 9, 1); - } - } else - num_successfully_checked[lane] - ++; - } - } - } - while (!check_bounded(num_successfully_checked, 3)) - ; - - for (lane = 0; lane < 8; lane++) { - write_500(info, channel, - info->training. - lane_timings[0][channel][slot][rank][lane], - get_timing_register_addr(lane, 0, slot, rank), - 9, 1); - write_500(info, channel, - info->training. - lane_timings[1][channel][slot][rank][lane], - get_timing_register_addr(lane, 1, slot, rank), - 9, 1); - if (timings[reg_178][channel][slot][rank][lane]. - largest <= - timings[reg_178][channel][slot][rank][lane]. - smallest) { - timings[reg_178][channel][slot][rank][lane]. - largest = 0; - timings[reg_178][channel][slot][rank][lane]. - smallest = 0; - } - } - } -} - -static void set_10b(struct raminfo *info, u8 val) -{ - int channel; - int slot, rank; - int lane; - - if (read_1d0(0x10b, 6) == val) - return; - - write_1d0(val, 0x10b, 6, 1); - - FOR_POPULATED_RANKS_BACKWARDS for (lane = 0; lane < 9; lane++) { - u16 reg_500; - reg_500 = read_500(info, channel, - get_timing_register_addr(lane, 0, slot, - rank), 9); - if (val == 1) { - if (lut16[info->clock_speed_index] <= reg_500) - reg_500 -= lut16[info->clock_speed_index]; - else - reg_500 = 0; - } else { - reg_500 += lut16[info->clock_speed_index]; - } - write_500(info, channel, reg_500, - get_timing_register_addr(lane, 0, slot, rank), 9, 1); - } -} - -static void set_ecc(int onoff) -{ - int channel; - for (channel = 0; channel < NUM_CHANNELS; channel++) { - u8 t; - t = MCHBAR8((channel << 10) + 0x5f8); - if (onoff) - t |= 1; - else - t &= ~1; - MCHBAR8((channel << 10) + 0x5f8) = t; - } -} - -static void set_178(u8 val) -{ - if (val >= 31) - val = val - 31; - else - val = 63 - val; - - write_1d0(2 * val, 0x178, 7, 1); -} - -static void -write_500_timings_type(struct raminfo *info, int channel, int slot, int rank, - int type) -{ - int lane; - - for (lane = 0; lane < 8; lane++) - write_500(info, channel, - info->training. - lane_timings[type][channel][slot][rank][lane], - get_timing_register_addr(lane, type, slot, rank), 9, - 0); -} - -static void -try_timing_offsets(struct raminfo *info, int channel, - int slot, int rank, int totalrank) -{ - u16 count[8]; - enum state state[8]; - u8 lower_usable[8], upper_usable[8]; - int lane; - int i; - int flip = 1; - int timing_offset; - - for (i = 0; i < 8; i++) - state[i] = BEFORE_USABLE; - - memset(count, 0, sizeof(count)); - - for (lane = 0; lane < 8; lane++) - write_500(info, channel, - info->training. - lane_timings[2][channel][slot][rank][lane] + 32, - get_timing_register_addr(lane, 3, slot, rank), 9, 1); - - for (timing_offset = 0; !validate_state(state) && timing_offset < 64; - timing_offset++) { - u8 failmask; - write_1d0(timing_offset ^ 32, 0x1bb, 6, 1); - failmask = 0; - for (i = 0; i < 2 && failmask != 0xff; i++) { - flip = !flip; - write_testing(info, totalrank, flip); - failmask |= check_testing(info, totalrank, flip); - } - do_fsm(state, count, failmask, 10, 63, lower_usable, - upper_usable, timing_offset); - } - write_1d0(0, 0x1bb, 6, 1); - dump_timings(info); - if (!validate_state(state)) - die("Couldn't discover DRAM timings (1)\n"); - - for (lane = 0; lane < 8; lane++) { - u8 bias = 0; - - if (info->silicon_revision) { - int usable_length; - - usable_length = upper_usable[lane] - lower_usable[lane]; - if (usable_length >= 20) { - bias = usable_length / 2 - 10; - if (bias >= 2) - bias = 2; - } - } - write_500(info, channel, - info->training. - lane_timings[2][channel][slot][rank][lane] + - (upper_usable[lane] + lower_usable[lane]) / 2 - bias, - get_timing_register_addr(lane, 3, slot, rank), 9, 1); - info->training.timing2_bounds[channel][slot][rank][lane][0] = - info->training.lane_timings[2][channel][slot][rank][lane] + - lower_usable[lane]; - info->training.timing2_bounds[channel][slot][rank][lane][1] = - info->training.lane_timings[2][channel][slot][rank][lane] + - upper_usable[lane]; - info->training.timing2_offset[channel][slot][rank][lane] = - info->training.lane_timings[2][channel][slot][rank][lane]; - } -} - -static u8 -choose_training(struct raminfo *info, int channel, int slot, int rank, - int lane, timing_bounds_t * timings, u8 center_178) -{ - u16 central_weight; - u16 side_weight; - unsigned int sum = 0, count = 0; - u8 span; - u8 lower_margin, upper_margin; - u8 reg_178; - u8 result; - - span = 12; - central_weight = 20; - side_weight = 20; - if (info->silicon_revision == 1 && channel == 1) { - central_weight = 5; - side_weight = 20; - if ((info-> - populated_ranks_mask[1] ^ (info-> - populated_ranks_mask[1] >> 2)) & - 1) - span = 18; - } - if ((info->populated_ranks_mask[0] & 5) == 5) { - central_weight = 20; - side_weight = 20; - } - if (info->clock_speed_index >= 2 - && (info->populated_ranks_mask[0] & 5) == 5 && slot == 1) { - if (info->silicon_revision == 1) { - switch (channel) { - case 0: - if (lane == 1) { - central_weight = 10; - side_weight = 20; - } - break; - case 1: - if (lane == 6) { - side_weight = 5; - central_weight = 20; - } - break; - } - } - if (info->silicon_revision == 0 && channel == 0 && lane == 0) { - side_weight = 5; - central_weight = 20; - } - } - for (reg_178 = center_178 - span; reg_178 <= center_178 + span; - reg_178 += span) { - u8 smallest; - u8 largest; - largest = timings[reg_178][channel][slot][rank][lane].largest; - smallest = timings[reg_178][channel][slot][rank][lane].smallest; - if (largest - smallest + 1 >= 5) { - unsigned int weight; - if (reg_178 == center_178) - weight = central_weight; - else - weight = side_weight; - sum += weight * (largest + smallest); - count += weight; - } - } - dump_timings(info); - if (count == 0) - die("Couldn't discover DRAM timings (2)\n"); - result = sum / (2 * count); - lower_margin = - result - timings[center_178][channel][slot][rank][lane].smallest; - upper_margin = - timings[center_178][channel][slot][rank][lane].largest - result; - if (upper_margin < 10 && lower_margin > 10) - result -= MIN(lower_margin - 10, 10 - upper_margin); - if (upper_margin > 10 && lower_margin < 10) - result += MIN(upper_margin - 10, 10 - lower_margin); - return result; -} - -#define STANDARD_MIN_MARGIN 5 - -static u8 choose_reg178(struct raminfo *info, timing_bounds_t * timings) -{ - u16 margin[64]; - int lane, rank, slot, channel; - u8 reg178; - int count = 0, sum = 0; - - for (reg178 = reg178_min[info->clock_speed_index]; - reg178 < reg178_max[info->clock_speed_index]; - reg178 += reg178_step[info->clock_speed_index]) { - margin[reg178] = -1; - FOR_POPULATED_RANKS_BACKWARDS for (lane = 0; lane < 8; lane++) { - int curmargin = - timings[reg178][channel][slot][rank][lane].largest - - timings[reg178][channel][slot][rank][lane]. - smallest + 1; - if (curmargin < margin[reg178]) - margin[reg178] = curmargin; - } - if (margin[reg178] >= STANDARD_MIN_MARGIN) { - u16 weight; - weight = margin[reg178] - STANDARD_MIN_MARGIN; - sum += weight * reg178; - count += weight; - } - } - dump_timings(info); - if (count == 0) - die("Couldn't discover DRAM timings (3)\n"); - - u8 threshold; - - for (threshold = 30; threshold >= 5; threshold--) { - int usable_length = 0; - int smallest_fount = 0; - for (reg178 = reg178_min[info->clock_speed_index]; - reg178 < reg178_max[info->clock_speed_index]; - reg178 += reg178_step[info->clock_speed_index]) - if (margin[reg178] >= threshold) { - usable_length += - reg178_step[info->clock_speed_index]; - info->training.reg178_largest = - reg178 - - 2 * reg178_step[info->clock_speed_index]; - - if (!smallest_fount) { - smallest_fount = 1; - info->training.reg178_smallest = - reg178 + - reg178_step[info-> - clock_speed_index]; - } - } - if (usable_length >= 0x21) - break; - } - - return sum / count; -} - -static int check_cached_sanity(struct raminfo *info) -{ - int lane; - int slot, rank; - int channel; - - if (!info->cached_training) - return 0; - - for (channel = 0; channel < NUM_CHANNELS; channel++) - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_RANKS; rank++) - for (lane = 0; lane < 8 + info->use_ecc; lane++) { - u16 cached_value, estimation_value; - cached_value = - info->cached_training-> - lane_timings[1][channel][slot][rank] - [lane]; - if (cached_value >= 0x18 - && cached_value <= 0x1E7) { - estimation_value = - info->training. - lane_timings[1][channel] - [slot][rank][lane]; - if (estimation_value < - cached_value - 24) - return 0; - if (estimation_value > - cached_value + 24) - return 0; - } - } - return 1; -} - -static int try_cached_training(struct raminfo *info) -{ - u8 saved_243[2]; - u8 tm; - - int channel, slot, rank, lane; - int flip = 1; - int i, j; - - if (!check_cached_sanity(info)) - return 0; - - info->training.reg178_center = info->cached_training->reg178_center; - info->training.reg178_smallest = info->cached_training->reg178_smallest; - info->training.reg178_largest = info->cached_training->reg178_largest; - memcpy(&info->training.timing_bounds, - &info->cached_training->timing_bounds, - sizeof(info->training.timing_bounds)); - memcpy(&info->training.timing_offset, - &info->cached_training->timing_offset, - sizeof(info->training.timing_offset)); - - write_1d0(2, 0x142, 3, 1); - saved_243[0] = MCHBAR8(0x243); - saved_243[1] = MCHBAR8(0x643); - MCHBAR8(0x243) = saved_243[0] | 2; - MCHBAR8(0x643) = saved_243[1] | 2; - set_ecc(0); - pci_write_config16(NORTHBRIDGE, 0xc8, 3); - if (read_1d0(0x10b, 6) & 1) - set_10b(info, 0); - for (tm = 0; tm < 2; tm++) { - int totalrank; - - set_178(tm ? info->cached_training->reg178_largest : info-> - cached_training->reg178_smallest); - - totalrank = 0; - /* Check timing ranges. With i == 0 we check smallest one and with - i == 1 the largest bound. With j == 0 we check that on the bound - it still works whereas with j == 1 we check that just outside of - bound we fail. - */ - FOR_POPULATED_RANKS_BACKWARDS { - for (i = 0; i < 2; i++) { - for (lane = 0; lane < 8; lane++) { - write_500(info, channel, - info->cached_training-> - timing2_bounds[channel][slot] - [rank][lane][i], - get_timing_register_addr(lane, - 3, - slot, - rank), - 9, 1); - - if (!i) - write_500(info, channel, - info-> - cached_training-> - timing2_offset - [channel][slot][rank] - [lane], - get_timing_register_addr - (lane, 2, slot, rank), - 9, 1); - write_500(info, channel, - i ? info->cached_training-> - timing_bounds[tm][channel] - [slot][rank][lane]. - largest : info-> - cached_training-> - timing_bounds[tm][channel] - [slot][rank][lane].smallest, - get_timing_register_addr(lane, - 0, - slot, - rank), - 9, 1); - write_500(info, channel, - info->cached_training-> - timing_offset[channel][slot] - [rank][lane] + - (i ? info->cached_training-> - timing_bounds[tm][channel] - [slot][rank][lane]. - largest : info-> - cached_training-> - timing_bounds[tm][channel] - [slot][rank][lane]. - smallest) - 64, - get_timing_register_addr(lane, - 1, - slot, - rank), - 9, 1); - } - for (j = 0; j < 2; j++) { - u8 failmask; - u8 expected_failmask; - char reg1b3; - - reg1b3 = (j == 1) + 4; - reg1b3 = - j == i ? reg1b3 : (-reg1b3) & 0x3f; - write_1d0(reg1b3, 0x1bb, 6, 1); - write_1d0(reg1b3, 0x1b3, 6, 1); - write_1d0(reg1b3, 0x1a3, 6, 1); - - flip = !flip; - write_testing(info, totalrank, flip); - failmask = - check_testing(info, totalrank, - flip); - expected_failmask = - j == 0 ? 0x00 : 0xff; - if (failmask != expected_failmask) - goto fail; - } - } - totalrank++; - } - } - - set_178(info->cached_training->reg178_center); - if (info->use_ecc) - set_ecc(1); - write_training_data(info); - write_1d0(0, 322, 3, 1); - info->training = *info->cached_training; - - write_1d0(0, 0x1bb, 6, 1); - write_1d0(0, 0x1b3, 6, 1); - write_1d0(0, 0x1a3, 6, 1); - MCHBAR8(0x243) = saved_243[0]; - MCHBAR8(0x643) = saved_243[1]; - - return 1; - -fail: - FOR_POPULATED_RANKS { - write_500_timings_type(info, channel, slot, rank, 1); - write_500_timings_type(info, channel, slot, rank, 2); - write_500_timings_type(info, channel, slot, rank, 3); - } - - write_1d0(0, 0x1bb, 6, 1); - write_1d0(0, 0x1b3, 6, 1); - write_1d0(0, 0x1a3, 6, 1); - MCHBAR8(0x243) = saved_243[0]; - MCHBAR8(0x643) = saved_243[1]; - - return 0; -} - -static void do_ram_training(struct raminfo *info) -{ - u8 saved_243[2]; - int totalrank = 0; - u8 reg_178; - int niter; - - timing_bounds_t *timings = timings_car; - int lane, rank, slot, channel; - u8 reg178_center; - - write_1d0(2, 0x142, 3, 1); - saved_243[0] = MCHBAR8(0x243); - saved_243[1] = MCHBAR8(0x643); - MCHBAR8(0x243) = saved_243[0] | 2; - MCHBAR8(0x643) = saved_243[1] | 2; - switch (info->clock_speed_index) { - case 0: - niter = 5; - break; - case 1: - niter = 10; - break; - default: - niter = 19; - break; - } - set_ecc(0); - - FOR_POPULATED_RANKS_BACKWARDS { - int i; - - write_500_timings_type(info, channel, slot, rank, 0); - - write_testing(info, totalrank, 0); - for (i = 0; i < niter; i++) { - write_testing_type2(info, totalrank, 2, i, 0); - write_testing_type2(info, totalrank, 3, i, 1); - } - pci_write_config8(NORTHBRIDGE, 0xc0, 0x01); - totalrank++; - } - - if (reg178_min[info->clock_speed_index] < - reg178_max[info->clock_speed_index]) - memset(timings[reg178_min[info->clock_speed_index]], 0, - sizeof(timings[0]) * - (reg178_max[info->clock_speed_index] - - reg178_min[info->clock_speed_index])); - for (reg_178 = reg178_min[info->clock_speed_index]; - reg_178 < reg178_max[info->clock_speed_index]; - reg_178 += reg178_step[info->clock_speed_index]) { - totalrank = 0; - set_178(reg_178); - for (channel = NUM_CHANNELS - 1; channel >= 0; channel--) - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_RANKS; rank++) { - memset(&timings[reg_178][channel][slot] - [rank][0].smallest, 0, 16); - if (info-> - populated_ranks[channel][slot] - [rank]) { - train_ram_at_178(info, channel, - slot, rank, - totalrank, - reg_178, 1, - niter, - timings); - totalrank++; - } - } - } - - reg178_center = choose_reg178(info, timings); - - FOR_POPULATED_RANKS_BACKWARDS for (lane = 0; lane < 8; lane++) { - info->training.timing_bounds[0][channel][slot][rank][lane]. - smallest = - timings[info->training. - reg178_smallest][channel][slot][rank][lane]. - smallest; - info->training.timing_bounds[0][channel][slot][rank][lane]. - largest = - timings[info->training. - reg178_smallest][channel][slot][rank][lane].largest; - info->training.timing_bounds[1][channel][slot][rank][lane]. - smallest = - timings[info->training. - reg178_largest][channel][slot][rank][lane].smallest; - info->training.timing_bounds[1][channel][slot][rank][lane]. - largest = - timings[info->training. - reg178_largest][channel][slot][rank][lane].largest; - info->training.timing_offset[channel][slot][rank][lane] = - info->training.lane_timings[1][channel][slot][rank][lane] - - - info->training.lane_timings[0][channel][slot][rank][lane] + - 64; - } - - if (info->silicon_revision == 1 - && (info-> - populated_ranks_mask[1] ^ (info-> - populated_ranks_mask[1] >> 2)) & 1) { - int ranks_after_channel1; - - totalrank = 0; - for (reg_178 = reg178_center - 18; - reg_178 <= reg178_center + 18; reg_178 += 18) { - totalrank = 0; - set_178(reg_178); - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_RANKS; rank++) { - if (info-> - populated_ranks[1][slot][rank]) { - train_ram_at_178(info, 1, slot, - rank, - totalrank, - reg_178, 0, - niter, - timings); - totalrank++; - } - } - } - ranks_after_channel1 = totalrank; - - for (reg_178 = reg178_center - 12; - reg_178 <= reg178_center + 12; reg_178 += 12) { - totalrank = ranks_after_channel1; - set_178(reg_178); - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_RANKS; rank++) - if (info-> - populated_ranks[0][slot][rank]) { - train_ram_at_178(info, 0, slot, - rank, - totalrank, - reg_178, 0, - niter, - timings); - totalrank++; - } - - } - } else { - for (reg_178 = reg178_center - 12; - reg_178 <= reg178_center + 12; reg_178 += 12) { - totalrank = 0; - set_178(reg_178); - FOR_POPULATED_RANKS_BACKWARDS { - train_ram_at_178(info, channel, slot, rank, - totalrank, reg_178, 0, niter, - timings); - totalrank++; - } - } - } - - set_178(reg178_center); - FOR_POPULATED_RANKS_BACKWARDS for (lane = 0; lane < 8; lane++) { - u16 tm0; - - tm0 = - choose_training(info, channel, slot, rank, lane, timings, - reg178_center); - write_500(info, channel, tm0, - get_timing_register_addr(lane, 0, slot, rank), 9, 1); - write_500(info, channel, - tm0 + - info->training. - lane_timings[1][channel][slot][rank][lane] - - info->training. - lane_timings[0][channel][slot][rank][lane], - get_timing_register_addr(lane, 1, slot, rank), 9, 1); - } - - totalrank = 0; - FOR_POPULATED_RANKS_BACKWARDS { - try_timing_offsets(info, channel, slot, rank, totalrank); - totalrank++; - } - MCHBAR8(0x243) = saved_243[0]; - MCHBAR8(0x643) = saved_243[1]; - write_1d0(0, 0x142, 3, 1); - info->training.reg178_center = reg178_center; -} - -static void ram_training(struct raminfo *info) -{ - u16 saved_fc4; - - saved_fc4 = MCHBAR16(0xfc4); - MCHBAR16(0xfc4) = 0xffff; - - if (info->revision >= 8) - read_4090(info); - - if (!try_cached_training(info)) - do_ram_training(info); - if ((info->silicon_revision == 2 || info->silicon_revision == 3) - && info->clock_speed_index < 2) - set_10b(info, 1); - MCHBAR16(0xfc4) = saved_fc4; -} - -static unsigned int gcd(unsigned int a, unsigned int b) -{ - unsigned int t; - if (a > b) { - t = a; - a = b; - b = t; - } - /* invariant a < b. */ - while (a) { - t = b % a; - b = a; - a = t; - } - return b; -} - -static inline int div_roundup(int a, int b) -{ - return DIV_ROUND_UP(a, b); -} - -static unsigned int lcm(unsigned int a, unsigned int b) -{ - return (a * b) / gcd(a, b); -} - -struct stru1 { - u8 freqs_reversed; - u8 freq_diff_reduced; - u8 freq_min_reduced; - u8 divisor_f4_to_fmax; - u8 divisor_f3_to_fmax; - u8 freq4_to_max_remainder; - u8 freq3_to_2_remainder; - u8 freq3_to_2_remaindera; - u8 freq4_to_2_remainder; - int divisor_f3_to_f1, divisor_f4_to_f2; - int common_time_unit_ps; - int freq_max_reduced; -}; - -static void -compute_frequence_ratios(struct raminfo *info, u16 freq1, u16 freq2, - int num_cycles_2, int num_cycles_1, int round_it, - int add_freqs, struct stru1 *result) -{ - int g; - int common_time_unit_ps; - int freq1_reduced, freq2_reduced; - int freq_min_reduced; - int freq_max_reduced; - int freq3, freq4; - - g = gcd(freq1, freq2); - freq1_reduced = freq1 / g; - freq2_reduced = freq2 / g; - freq_min_reduced = MIN(freq1_reduced, freq2_reduced); - freq_max_reduced = MAX(freq1_reduced, freq2_reduced); - - common_time_unit_ps = div_roundup(900000, lcm(freq1, freq2)); - freq3 = div_roundup(num_cycles_2, common_time_unit_ps) - 1; - freq4 = div_roundup(num_cycles_1, common_time_unit_ps) - 1; - if (add_freqs) { - freq3 += freq2_reduced; - freq4 += freq1_reduced; - } - - if (round_it) { - result->freq3_to_2_remainder = 0; - result->freq3_to_2_remaindera = 0; - result->freq4_to_max_remainder = 0; - result->divisor_f4_to_f2 = 0; - result->divisor_f3_to_f1 = 0; - } else { - if (freq2_reduced < freq1_reduced) { - result->freq3_to_2_remainder = - result->freq3_to_2_remaindera = - freq3 % freq1_reduced - freq1_reduced + 1; - result->freq4_to_max_remainder = - -(freq4 % freq1_reduced); - result->divisor_f3_to_f1 = freq3 / freq1_reduced; - result->divisor_f4_to_f2 = - (freq4 - - (freq1_reduced - freq2_reduced)) / freq2_reduced; - result->freq4_to_2_remainder = - -(char)((freq1_reduced - freq2_reduced) + - ((u8) freq4 - - (freq1_reduced - - freq2_reduced)) % (u8) freq2_reduced); - } else { - if (freq2_reduced > freq1_reduced) { - result->freq4_to_max_remainder = - (freq4 % freq2_reduced) - freq2_reduced + 1; - result->freq4_to_2_remainder = - freq4 % freq_max_reduced - - freq_max_reduced + 1; - } else { - result->freq4_to_max_remainder = - -(freq4 % freq2_reduced); - result->freq4_to_2_remainder = - -(char)(freq4 % freq_max_reduced); - } - result->divisor_f4_to_f2 = freq4 / freq2_reduced; - result->divisor_f3_to_f1 = - (freq3 - - (freq2_reduced - freq1_reduced)) / freq1_reduced; - result->freq3_to_2_remainder = -(freq3 % freq2_reduced); - result->freq3_to_2_remaindera = - -(char)((freq_max_reduced - freq_min_reduced) + - (freq3 - - (freq_max_reduced - - freq_min_reduced)) % freq1_reduced); - } - } - result->divisor_f3_to_fmax = freq3 / freq_max_reduced; - result->divisor_f4_to_fmax = freq4 / freq_max_reduced; - if (round_it) { - if (freq2_reduced > freq1_reduced) { - if (freq3 % freq_max_reduced) - result->divisor_f3_to_fmax++; - } - if (freq2_reduced < freq1_reduced) { - if (freq4 % freq_max_reduced) - result->divisor_f4_to_fmax++; - } - } - result->freqs_reversed = (freq2_reduced < freq1_reduced); - result->freq_diff_reduced = freq_max_reduced - freq_min_reduced; - result->freq_min_reduced = freq_min_reduced; - result->common_time_unit_ps = common_time_unit_ps; - result->freq_max_reduced = freq_max_reduced; -} - -static void -set_2d5x_reg(struct raminfo *info, u16 reg, u16 freq1, u16 freq2, - int num_cycles_2, int num_cycles_1, int num_cycles_3, - int num_cycles_4, int reverse) -{ - struct stru1 vv; - char multiplier; - - compute_frequence_ratios(info, freq1, freq2, num_cycles_2, num_cycles_1, - 0, 1, &vv); - - multiplier = - div_roundup(MAX - (div_roundup(num_cycles_2, vv.common_time_unit_ps) + - div_roundup(num_cycles_3, vv.common_time_unit_ps), - div_roundup(num_cycles_1, - vv.common_time_unit_ps) + - div_roundup(num_cycles_4, vv.common_time_unit_ps)) - + vv.freq_min_reduced - 1, vv.freq_max_reduced) - 1; - - u32 y = - (u8) ((vv.freq_max_reduced - vv.freq_min_reduced) + - vv.freq_max_reduced * multiplier) - | (vv. - freqs_reversed << 8) | ((u8) (vv.freq_min_reduced * - multiplier) << 16) | ((u8) (vv. - freq_min_reduced - * - multiplier) - << 24); - u32 x = - vv.freq3_to_2_remaindera | (vv.freq4_to_2_remainder << 8) | (vv. - divisor_f3_to_f1 - << 16) - | (vv.divisor_f4_to_f2 << 20) | (vv.freq_min_reduced << 24); - if (reverse) { - MCHBAR32(reg) = y; - MCHBAR32(reg + 4) = x; - } else { - MCHBAR32(reg + 4) = y; - MCHBAR32(reg) = x; - } -} - -static void -set_6d_reg(struct raminfo *info, u16 reg, u16 freq1, u16 freq2, - int num_cycles_1, int num_cycles_2, int num_cycles_3, - int num_cycles_4) -{ - struct stru1 ratios1; - struct stru1 ratios2; - - compute_frequence_ratios(info, freq1, freq2, num_cycles_1, num_cycles_2, - 0, 1, &ratios2); - compute_frequence_ratios(info, freq1, freq2, num_cycles_3, num_cycles_4, - 0, 1, &ratios1); - printk(RAM_SPEW, "[%x] <= %x\n", reg, - ratios1.freq4_to_max_remainder | (ratios2. - freq4_to_max_remainder - << 8) - | (ratios1.divisor_f4_to_fmax << 16) | (ratios2. - divisor_f4_to_fmax - << 20)); - MCHBAR32(reg) = ratios1.freq4_to_max_remainder | - (ratios2.freq4_to_max_remainder << 8) | - (ratios1.divisor_f4_to_fmax << 16) | - (ratios2.divisor_f4_to_fmax << 20); -} - -static void -set_2dx8_reg(struct raminfo *info, u16 reg, u8 mode, u16 freq1, u16 freq2, - int num_cycles_2, int num_cycles_1, int round_it, int add_freqs) -{ - struct stru1 ratios; - - compute_frequence_ratios(info, freq1, freq2, num_cycles_2, num_cycles_1, - round_it, add_freqs, &ratios); - switch (mode) { - case 0: - MCHBAR32(reg + 4) = ratios.freq_diff_reduced | - (ratios.freqs_reversed << 8); - MCHBAR32(reg) = ratios.freq3_to_2_remainder | - (ratios.freq4_to_max_remainder << 8) | - (ratios.divisor_f3_to_fmax << 16) | - (ratios.divisor_f4_to_fmax << 20) | - (ratios.freq_min_reduced << 24); - break; - - case 1: - MCHBAR32(reg) = ratios.freq3_to_2_remainder | - (ratios.divisor_f3_to_fmax << 16); - break; - - case 2: - MCHBAR32(reg) = ratios.freq3_to_2_remainder | - (ratios.freq4_to_max_remainder << 8) | - (ratios.divisor_f3_to_fmax << 16) | - (ratios.divisor_f4_to_fmax << 20); - break; - - case 4: - MCHBAR32(reg) = (ratios.divisor_f3_to_fmax << 4) | - (ratios.divisor_f4_to_fmax << 8) | - (ratios.freqs_reversed << 12) | - (ratios.freq_min_reduced << 16) | - (ratios.freq_diff_reduced << 24); - break; - } -} - -static void set_2dxx_series(struct raminfo *info, int s3resume) -{ - set_2dx8_reg(info, 0x2d00, 0, 0x78, frequency_11(info) / 2, 1359, 1005, - 0, 1); - set_2dx8_reg(info, 0x2d08, 0, 0x78, 0x78, 3273, 5033, 1, 1); - set_2dx8_reg(info, 0x2d10, 0, 0x78, info->fsb_frequency, 1475, 1131, 0, - 1); - set_2dx8_reg(info, 0x2d18, 0, 2 * info->fsb_frequency, - frequency_11(info), 1231, 1524, 0, 1); - set_2dx8_reg(info, 0x2d20, 0, 2 * info->fsb_frequency, - frequency_11(info) / 2, 1278, 2008, 0, 1); - set_2dx8_reg(info, 0x2d28, 0, info->fsb_frequency, frequency_11(info), - 1167, 1539, 0, 1); - set_2dx8_reg(info, 0x2d30, 0, info->fsb_frequency, - frequency_11(info) / 2, 1403, 1318, 0, 1); - set_2dx8_reg(info, 0x2d38, 0, info->fsb_frequency, 0x78, 3460, 5363, 1, - 1); - set_2dx8_reg(info, 0x2d40, 0, info->fsb_frequency, 0x3c, 2792, 5178, 1, - 1); - set_2dx8_reg(info, 0x2d48, 0, 2 * info->fsb_frequency, 0x78, 2738, 4610, - 1, 1); - set_2dx8_reg(info, 0x2d50, 0, info->fsb_frequency, 0x78, 2819, 5932, 1, - 1); - set_2dx8_reg(info, 0x6d4, 1, info->fsb_frequency, - frequency_11(info) / 2, 4000, 0, 0, 0); - set_2dx8_reg(info, 0x6d8, 2, info->fsb_frequency, - frequency_11(info) / 2, 4000, 4000, 0, 0); - - if (s3resume) { - printk(RAM_SPEW, "[6dc] <= %x\n", - info->cached_training->reg_6dc); - MCHBAR32(0x6dc) = info->cached_training->reg_6dc; - } else - set_6d_reg(info, 0x6dc, 2 * info->fsb_frequency, frequency_11(info), 0, - info->delay46_ps[0], 0, - info->delay54_ps[0]); - set_2dx8_reg(info, 0x6e0, 1, 2 * info->fsb_frequency, - frequency_11(info), 2500, 0, 0, 0); - set_2dx8_reg(info, 0x6e4, 1, 2 * info->fsb_frequency, - frequency_11(info) / 2, 3500, 0, 0, 0); - if (s3resume) { - printk(RAM_SPEW, "[6e8] <= %x\n", - info->cached_training->reg_6e8); - MCHBAR32(0x6e8) = info->cached_training->reg_6e8; - } else - set_6d_reg(info, 0x6e8, 2 * info->fsb_frequency, frequency_11(info), 0, - info->delay46_ps[1], 0, - info->delay54_ps[1]); - set_2d5x_reg(info, 0x2d58, 0x78, 0x78, 864, 1195, 762, 786, 0); - set_2d5x_reg(info, 0x2d60, 0x195, info->fsb_frequency, 1352, 725, 455, - 470, 0); - set_2d5x_reg(info, 0x2d68, 0x195, 0x3c, 2707, 5632, 3277, 2207, 0); - set_2d5x_reg(info, 0x2d70, 0x195, frequency_11(info) / 2, 1276, 758, - 454, 459, 0); - set_2d5x_reg(info, 0x2d78, 0x195, 0x78, 1021, 799, 510, 513, 0); - set_2d5x_reg(info, 0x2d80, info->fsb_frequency, 0xe1, 0, 2862, 2579, - 2588, 0); - set_2d5x_reg(info, 0x2d88, info->fsb_frequency, 0xe1, 0, 2690, 2405, - 2405, 0); - set_2d5x_reg(info, 0x2da0, 0x78, 0xe1, 0, 2560, 2264, 2251, 0); - set_2d5x_reg(info, 0x2da8, 0x195, frequency_11(info), 1060, 775, 484, - 480, 0); - set_2d5x_reg(info, 0x2db0, 0x195, 0x78, 4183, 6023, 2217, 2048, 0); - MCHBAR32(0x2dbc) = ((frequency_11(info) / 2) - 1) | 0xe00000; - MCHBAR32(0x2db8) = ((info->fsb_frequency - 1) << 16) | 0x77; -} - -static u16 get_max_timing(struct raminfo *info, int channel) -{ - int slot, rank, lane; - u16 ret = 0; - - if ((MCHBAR8(0x2ca8) >> 2) < 1) - return 384; - - if (info->revision < 8) - return 256; - - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_RANKS; rank++) - if (info->populated_ranks[channel][slot][rank]) - for (lane = 0; lane < 8 + info->use_ecc; lane++) - ret = MAX(ret, read_500(info, channel, - get_timing_register_addr - (lane, 0, slot, - rank), 9)); - return ret; -} - -static void set_274265(struct raminfo *info) -{ - int delay_a_ps, delay_b_ps, delay_c_ps, delay_d_ps; - int delay_e_ps, delay_e_cycles, delay_f_cycles; - int delay_e_over_cycle_ps; - int cycletime_ps; - int channel; - - delay_a_ps = 4 * halfcycle_ps(info) + 6 * fsbcycle_ps(info); - info->training.reg2ca9_bit0 = 0; - for (channel = 0; channel < NUM_CHANNELS; channel++) { - cycletime_ps = - 900000 / lcm(2 * info->fsb_frequency, frequency_11(info)); - delay_d_ps = - (halfcycle_ps(info) * get_max_timing(info, channel) >> 6) - - info->some_delay_3_ps_rounded + 200; - if (! - ((info->silicon_revision == 0 - || info->silicon_revision == 1) - && (info->revision >= 8))) - delay_d_ps += halfcycle_ps(info) * 2; - delay_d_ps += - halfcycle_ps(info) * (!info->revision_flag_1 + - info->some_delay_2_halfcycles_ceil + - 2 * info->some_delay_1_cycle_floor + - info->clock_speed_index + - 2 * info->cas_latency - 7 + 11); - delay_d_ps += info->revision >= 8 ? 2758 : 4428; - - MCHBAR32_AND_OR(0x140, 0xfaffffff, 0x2000000); - MCHBAR32_AND_OR(0x138, 0xfaffffff, 0x2000000); - if ((MCHBAR8(0x144) & 0x1f) > 0x13) - delay_d_ps += 650; - delay_c_ps = delay_d_ps + 1800; - if (delay_c_ps <= delay_a_ps) - delay_e_ps = 0; - else - delay_e_ps = - cycletime_ps * div_roundup(delay_c_ps - delay_a_ps, - cycletime_ps); - - delay_e_over_cycle_ps = delay_e_ps % (2 * halfcycle_ps(info)); - delay_e_cycles = delay_e_ps / (2 * halfcycle_ps(info)); - delay_f_cycles = - div_roundup(2500 - delay_e_over_cycle_ps, - 2 * halfcycle_ps(info)); - if (delay_f_cycles > delay_e_cycles) { - info->delay46_ps[channel] = delay_e_ps; - delay_e_cycles = 0; - } else { - info->delay46_ps[channel] = - delay_e_over_cycle_ps + - 2 * halfcycle_ps(info) * delay_f_cycles; - delay_e_cycles -= delay_f_cycles; - } - - if (info->delay46_ps[channel] < 2500) { - info->delay46_ps[channel] = 2500; - info->training.reg2ca9_bit0 = 1; - } - delay_b_ps = halfcycle_ps(info) + delay_c_ps; - if (delay_b_ps <= delay_a_ps) - delay_b_ps = 0; - else - delay_b_ps -= delay_a_ps; - info->delay54_ps[channel] = - cycletime_ps * div_roundup(delay_b_ps, - cycletime_ps) - - 2 * halfcycle_ps(info) * delay_e_cycles; - if (info->delay54_ps[channel] < 2500) - info->delay54_ps[channel] = 2500; - info->training.reg274265[channel][0] = delay_e_cycles; - if (delay_d_ps + 7 * halfcycle_ps(info) <= - 24 * halfcycle_ps(info)) - info->training.reg274265[channel][1] = 0; - else - info->training.reg274265[channel][1] = - div_roundup(delay_d_ps + 7 * halfcycle_ps(info), - 4 * halfcycle_ps(info)) - 6; - MCHBAR32((channel << 10) + 0x274) = - info->training.reg274265[channel][1] | - (info->training.reg274265[channel][0] << 16); - info->training.reg274265[channel][2] = - div_roundup(delay_c_ps + 3 * fsbcycle_ps(info), - 4 * halfcycle_ps(info)) + 1; - MCHBAR16((channel << 10) + 0x265) = - info->training.reg274265[channel][2] << 8; - } - if (info->training.reg2ca9_bit0) - MCHBAR8_OR(0x2ca9, 1); - else - MCHBAR8_AND(0x2ca9, ~1); -} - -static void restore_274265(struct raminfo *info) -{ - int channel; - - for (channel = 0; channel < NUM_CHANNELS; channel++) { - MCHBAR32((channel << 10) + 0x274) = - (info->cached_training->reg274265[channel][0] << 16) | - info->cached_training->reg274265[channel][1]; - MCHBAR16((channel << 10) + 0x265) = - info->cached_training->reg274265[channel][2] << 8; - } - if (info->cached_training->reg2ca9_bit0) - MCHBAR8_OR(0x2ca9, 1); - else - MCHBAR8_AND(0x2ca9, ~1); -} - -static void dmi_setup(void) -{ - gav(read8(DEFAULT_DMIBAR + 0x254)); - write8(DEFAULT_DMIBAR + 0x254, 0x1); - write16(DEFAULT_DMIBAR + 0x1b8, 0x18f2); - MCHBAR16_AND_OR(0x48, 0, 0x2); - - write32(DEFAULT_DMIBAR + 0xd68, read32(DEFAULT_DMIBAR + 0xd68) | 0x08000000); - - outl((gav(inl(DEFAULT_GPIOBASE | 0x38)) & ~0x140000) | 0x400000, - DEFAULT_GPIOBASE | 0x38); - gav(inb(DEFAULT_GPIOBASE | 0xe)); // = 0xfdcaff6e -} - -void chipset_init(const int s3resume) -{ - u8 x2ca8; - u16 ggc; - u8 gfxsize; - - x2ca8 = MCHBAR8(0x2ca8); - if ((x2ca8 & 1) || (x2ca8 == 8 && !s3resume)) { - printk(BIOS_DEBUG, "soft reset detected, rebooting properly\n"); - MCHBAR8(0x2ca8) = 0; - system_reset(); - } -#if 0 - if (!s3resume) { - pre_raminit_3(x2ca8); - } - pre_raminit_4a(x2ca8); -#endif - - dmi_setup(); - - MCHBAR16(0x1170) = 0xa880; - MCHBAR8(0x11c1) = 0x1; - MCHBAR16(0x1170) = 0xb880; - MCHBAR8_AND_OR(0x1210, 0, 0x84); - - if (get_option(&gfxsize, "gfx_uma_size") != CB_SUCCESS) { - /* 0 for 32MB */ - gfxsize = 0; - } - - ggc = 0xb00 | ((gfxsize + 5) << 4); - - pci_write_config16(NORTHBRIDGE, D0F0_GGC, ggc | 2); - - u16 deven; - deven = pci_read_config16(NORTHBRIDGE, D0F0_DEVEN); // = 0x3 - - if (deven & 8) { - MCHBAR8(0x2c30) = 0x20; - pci_read_config8(NORTHBRIDGE, 0x8); // = 0x18 - MCHBAR16_OR(0x2c30, 0x200); - MCHBAR16(0x2c32) = 0x434; - MCHBAR32_AND_OR(0x2c44, 0, 0x1053687); - pci_read_config8(GMA, 0x62); // = 0x2 - pci_write_config8(GMA, 0x62, 0x2); - read8(DEFAULT_RCBA + 0x2318); - write8(DEFAULT_RCBA + 0x2318, 0x47); - read8(DEFAULT_RCBA + 0x2320); - write8(DEFAULT_RCBA + 0x2320, 0xfc); - } - - MCHBAR32_AND_OR(0x30, 0, 0x40); - - pci_write_config16(NORTHBRIDGE, D0F0_GGC, ggc); - gav(read32(DEFAULT_RCBA + 0x3428)); - write32(DEFAULT_RCBA + 0x3428, 0x1d); -} - -void raminit(const int s3resume, const u8 *spd_addrmap) -{ - unsigned int channel, slot, lane, rank; - int i; - struct raminfo info; - u8 x2ca8; - u16 deven; - int cbmem_wasnot_inited; - - x2ca8 = MCHBAR8(0x2ca8); - - printk(RAM_DEBUG, "Scratchpad MCHBAR8(0x2ca8): 0x%04x\n", x2ca8); - - deven = pci_read_config16(NORTHBRIDGE, D0F0_DEVEN); - - memset(&info, 0x5a, sizeof(info)); - - info.last_500_command[0] = 0; - info.last_500_command[1] = 0; - - info.fsb_frequency = 135 * 2; - info.board_lane_delay[0] = 0x14; - info.board_lane_delay[1] = 0x07; - info.board_lane_delay[2] = 0x07; - info.board_lane_delay[3] = 0x08; - info.board_lane_delay[4] = 0x56; - info.board_lane_delay[5] = 0x04; - info.board_lane_delay[6] = 0x04; - info.board_lane_delay[7] = 0x05; - info.board_lane_delay[8] = 0x10; - - info.training.reg_178 = 0; - info.training.reg_10b = 0; - - info.heci_bar = 0; - info.memory_reserved_for_heci_mb = 0; - - /* before SPD */ - timestamp_add_now(101); - - if (!s3resume || 1) { // possible error - pci_read_config8(SOUTHBRIDGE, GEN_PMCON_2); // = 0x80 - - collect_system_info(&info); - - memset(&info.populated_ranks, 0, sizeof(info.populated_ranks)); - - info.use_ecc = 1; - for (channel = 0; channel < NUM_CHANNELS; channel++) - for (slot = 0; slot < NUM_SLOTS; slot++) { - int v; - int try; - int addr; - const u8 useful_addresses[] = { - DEVICE_TYPE, - MODULE_TYPE, - DENSITY, - RANKS_AND_DQ, - MEMORY_BUS_WIDTH, - TIMEBASE_DIVIDEND, - TIMEBASE_DIVISOR, - CYCLETIME, - CAS_LATENCIES_LSB, - CAS_LATENCIES_MSB, - CAS_LATENCY_TIME, - 0x11, 0x12, 0x13, 0x14, 0x15, - 0x16, 0x17, 0x18, 0x19, 0x1a, 0x1b, - 0x1c, 0x1d, - THERMAL_AND_REFRESH, - 0x20, - REFERENCE_RAW_CARD_USED, - RANK1_ADDRESS_MAPPING, - 0x75, 0x76, 0x77, 0x78, - 0x79, 0x7a, 0x7b, 0x7c, 0x7d, 0x7e, - 0x7f, 0x80, 0x81, 0x82, 0x83, 0x84, - 0x85, 0x86, 0x87, 0x88, - 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, - 0x8f, 0x90, 0x91, 0x92, 0x93, 0x94, - 0x95 - }; - if (!spd_addrmap[2 * channel + slot]) - continue; - for (try = 0; try < 5; try++) { - v = smbus_read_byte(spd_addrmap[2 * channel + slot], - DEVICE_TYPE); - if (v >= 0) - break; - } - if (v < 0) - continue; - for (addr = 0; - addr < - sizeof(useful_addresses) / - sizeof(useful_addresses[0]); addr++) - gav(info. - spd[channel][0][useful_addresses - [addr]] = - smbus_read_byte(spd_addrmap[2 * channel + slot], - useful_addresses - [addr])); - if (info.spd[channel][0][DEVICE_TYPE] != 11) - die("Only DDR3 is supported"); - - v = info.spd[channel][0][RANKS_AND_DQ]; - info.populated_ranks[channel][0][0] = 1; - info.populated_ranks[channel][0][1] = - ((v >> 3) & 7); - if (((v >> 3) & 7) > 1) - die("At most 2 ranks are supported"); - if ((v & 7) == 0 || (v & 7) > 2) - die("Only x8 and x16 modules are supported"); - if ((info. - spd[channel][slot][MODULE_TYPE] & 0xF) != 2 - && (info. - spd[channel][slot][MODULE_TYPE] & 0xF) - != 3) - die("Registered memory is not supported"); - info.is_x16_module[channel][0] = (v & 7) - 1; - info.density[channel][slot] = - info.spd[channel][slot][DENSITY] & 0xF; - if (! - (info. - spd[channel][slot][MEMORY_BUS_WIDTH] & - 0x18)) - info.use_ecc = 0; - } - - gav(0x55); - - for (channel = 0; channel < NUM_CHANNELS; channel++) { - int v = 0; - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_RANKS; rank++) - v |= info. - populated_ranks[channel][slot][rank] - << (2 * slot + rank); - info.populated_ranks_mask[channel] = v; - } - - gav(0x55); - - gav(pci_read_config32(NORTHBRIDGE, D0F0_CAPID0 + 4)); - } - - /* after SPD */ - timestamp_add_now(102); - - MCHBAR8_AND(0x2ca8, 0xfc); - - collect_system_info(&info); - calculate_timings(&info); - -#if 0 - pci_write_config8(NORTHBRIDGE, 0xdf, 0x82); -#endif - - if (!s3resume) { - u8 reg8 = pci_read_config8(SOUTHBRIDGE, GEN_PMCON_2); - if (x2ca8 == 0 && (reg8 & 0x80)) { - /* Don't enable S4-assertion stretch. Makes trouble on roda/rk9. - reg8 = pci_read_config8(PCI_DEV(0, 0x1f, 0), 0xa4); - pci_write_config8(PCI_DEV(0, 0x1f, 0), 0xa4, reg8 | 0x08); - */ - - /* Clear bit7. */ - - pci_write_config8(SOUTHBRIDGE, GEN_PMCON_2, - (reg8 & ~(1 << 7))); - - printk(BIOS_INFO, - "Interrupted RAM init, reset required.\n"); - system_reset(); - } - } - - if (!s3resume && x2ca8 == 0) - pci_write_config8(SOUTHBRIDGE, GEN_PMCON_2, - pci_read_config8(SOUTHBRIDGE, GEN_PMCON_2) | 0x80); - - compute_derived_timings(&info); - - if (x2ca8 == 0) { - gav(MCHBAR8(0x164)); - MCHBAR8(0x164) = 0x26; - MCHBAR16(0x2c20) = 0x10; - } - - MCHBAR32_OR(0x18b4, 0x210000); - MCHBAR32_OR(0x1890, 0x2000000); - MCHBAR32_OR(0x18b4, 0x8000); - - gav(pci_read_config32(PCI_DEV(0xff, 2, 1), 0x50)); // !!!! - pci_write_config8(PCI_DEV(0xff, 2, 1), 0x54, 0x12); - - gav(MCHBAR16(0x2c10)); - MCHBAR16(0x2c10) = 0x412; - gav(MCHBAR16(0x2c10)); - MCHBAR16_OR(0x2c12, 0x100); - - gav(MCHBAR8(0x2ca8)); // !!!! - MCHBAR32_AND_OR(0x1804, 0xfffffffc, 0x8400080); - - pci_read_config32(PCI_DEV(0xff, 2, 1), 0x6c); // !!!! - pci_write_config32(PCI_DEV(0xff, 2, 1), 0x6c, 0x40a0a0); - gav(MCHBAR32(0x1c04)); // !!!! - gav(MCHBAR32(0x1804)); // !!!! - - if (x2ca8 == 0) { - MCHBAR8_OR(0x2ca8, 1); - } - - MCHBAR32(0x18d8) = 0x120000; - MCHBAR32(0x18dc) = 0x30a484a; - pci_write_config32(PCI_DEV(0xff, 2, 1), 0xe0, 0x0); - pci_write_config32(PCI_DEV(0xff, 2, 1), 0xf4, 0x9444a); - MCHBAR32(0x18d8) = 0x40000; - MCHBAR32(0x18dc) = 0xb000000; - pci_write_config32(PCI_DEV(0xff, 2, 1), 0xe0, 0x60000); - pci_write_config32(PCI_DEV(0xff, 2, 1), 0xf4, 0x0); - MCHBAR32(0x18d8) = 0x180000; - MCHBAR32(0x18dc) = 0xc0000142; - pci_write_config32(PCI_DEV(0xff, 2, 1), 0xe0, 0x20000); - pci_write_config32(PCI_DEV(0xff, 2, 1), 0xf4, 0x142); - MCHBAR32(0x18d8) = 0x1e0000; - - gav(MCHBAR32(0x18dc)); // !!!! - MCHBAR32(0x18dc) = 0x3; - gav(MCHBAR32(0x18dc)); // !!!! - - if (x2ca8 == 0) { - MCHBAR8_OR(0x2ca8, 1); // guess - } - - MCHBAR32(0x188c) = 0x20bc09; - pci_write_config32(PCI_DEV(0xff, 2, 1), 0xd0, 0x40b0c09); - MCHBAR32(0x1a10) = 0x4200010e; - MCHBAR32_OR(0x18b8, 0x200); - gav(MCHBAR32(0x1918)); // !!!! - MCHBAR32(0x1918) = 0x332; - - gav(MCHBAR32(0x18b8)); // !!!! - MCHBAR32(0x18b8) = 0xe00; - gav(MCHBAR32(0x182c)); // !!!! - MCHBAR32(0x182c) = 0x10202; - gav(pci_read_config32(PCI_DEV(0xff, 2, 1), 0x94)); // !!!! - pci_write_config32(PCI_DEV(0xff, 2, 1), 0x94, 0x10202); - MCHBAR32_AND(0x1a1c, 0x8fffffff); - MCHBAR32_OR(0x1a70, 0x100000); - - MCHBAR32_AND(0x18b4, 0xffff7fff); - gav(MCHBAR32(0x1a68)); // !!!! - MCHBAR32(0x1a68) = 0x343800; - gav(MCHBAR32(0x1e68)); // !!!! - gav(MCHBAR32(0x1a68)); // !!!! - - if (x2ca8 == 0) { - MCHBAR8_OR(0x2ca8, 1); // guess - } - - pci_read_config32(PCI_DEV(0xff, 2, 0), 0x048); // !!!! - pci_write_config32(PCI_DEV(0xff, 2, 0), 0x048, 0x140000); - pci_read_config32(PCI_DEV(0xff, 2, 0), 0x058); // !!!! - pci_write_config32(PCI_DEV(0xff, 2, 0), 0x058, 0x64555); - pci_read_config32(PCI_DEV(0xff, 2, 0), 0x058); // !!!! - pci_read_config32(PCI_DEV (0xff, 0, 0), 0xd0); // !!!! - pci_write_config32(PCI_DEV (0xff, 0, 0), 0xd0, 0x180); - gav(MCHBAR32(0x1af0)); // !!!! - gav(MCHBAR32(0x1af0)); // !!!! - MCHBAR32(0x1af0) = 0x1f020003; - gav(MCHBAR32(0x1af0)); // !!!! - - if (x2ca8 == 0) { - MCHBAR8_OR(0x2ca8, 1); // guess - } - - gav(MCHBAR32(0x1890)); // !!!! - MCHBAR32(0x1890) = 0x80102; - gav(MCHBAR32(0x18b4)); // !!!! - MCHBAR32(0x18b4) = 0x216000; - MCHBAR32(0x18a4) = 0x22222222; - MCHBAR32(0x18a8) = 0x22222222; - MCHBAR32(0x18ac) = 0x22222; - - udelay(1000); - - info.cached_training = get_cached_training(); - - if (x2ca8 == 0) { - int j; - if (s3resume && info.cached_training) { - restore_274265(&info); - printk(RAM_SPEW, "reg2ca9_bit0 = %x\n", - info.cached_training->reg2ca9_bit0); - for (i = 0; i < 2; i++) - for (j = 0; j < 3; j++) - printk(RAM_SPEW, "reg274265[%d][%d] = %x\n", - i, j, info.cached_training->reg274265[i][j]); - } else { - set_274265(&info); - printk(RAM_SPEW, "reg2ca9_bit0 = %x\n", - info.training.reg2ca9_bit0); - for (i = 0; i < 2; i++) - for (j = 0; j < 3; j++) - printk(RAM_SPEW, "reg274265[%d][%d] = %x\n", - i, j, info.training.reg274265[i][j]); - } - - set_2dxx_series(&info, s3resume); - - if (!(deven & 8)) { - MCHBAR32_AND_OR(0x2cb0, 0, 0x40); - } - - udelay(1000); - - if (deven & 8) { - MCHBAR32_OR(0xff8, 0x1800); - MCHBAR32_AND(0x2cb0, 0x00); - pci_read_config8(PCI_DEV (0, 0x2, 0x0), 0x4c); - pci_read_config8(PCI_DEV (0, 0x2, 0x0), 0x4c); - pci_read_config8(PCI_DEV (0, 0x2, 0x0), 0x4e); - - MCHBAR8(0x1150); - MCHBAR8(0x1151); - MCHBAR8(0x1022); - MCHBAR8(0x16d0); - MCHBAR32(0x1300) = 0x60606060; - MCHBAR32(0x1304) = 0x60606060; - MCHBAR32(0x1308) = 0x78797a7b; - MCHBAR32(0x130c) = 0x7c7d7e7f; - MCHBAR32(0x1310) = 0x60606060; - MCHBAR32(0x1314) = 0x60606060; - MCHBAR32(0x1318) = 0x60606060; - MCHBAR32(0x131c) = 0x60606060; - MCHBAR32(0x1320) = 0x50515253; - MCHBAR32(0x1324) = 0x54555657; - MCHBAR32(0x1328) = 0x58595a5b; - MCHBAR32(0x132c) = 0x5c5d5e5f; - MCHBAR32(0x1330) = 0x40414243; - MCHBAR32(0x1334) = 0x44454647; - MCHBAR32(0x1338) = 0x48494a4b; - MCHBAR32(0x133c) = 0x4c4d4e4f; - MCHBAR32(0x1340) = 0x30313233; - MCHBAR32(0x1344) = 0x34353637; - MCHBAR32(0x1348) = 0x38393a3b; - MCHBAR32(0x134c) = 0x3c3d3e3f; - MCHBAR32(0x1350) = 0x20212223; - MCHBAR32(0x1354) = 0x24252627; - MCHBAR32(0x1358) = 0x28292a2b; - MCHBAR32(0x135c) = 0x2c2d2e2f; - MCHBAR32(0x1360) = 0x10111213; - MCHBAR32(0x1364) = 0x14151617; - MCHBAR32(0x1368) = 0x18191a1b; - MCHBAR32(0x136c) = 0x1c1d1e1f; - MCHBAR32(0x1370) = 0x10203; - MCHBAR32(0x1374) = 0x4050607; - MCHBAR32(0x1378) = 0x8090a0b; - MCHBAR32(0x137c) = 0xc0d0e0f; - MCHBAR8(0x11cc) = 0x4e; - MCHBAR32(0x1110) = 0x73970404; - MCHBAR32(0x1114) = 0x72960404; - MCHBAR32(0x1118) = 0x6f950404; - MCHBAR32(0x111c) = 0x6d940404; - MCHBAR32(0x1120) = 0x6a930404; - MCHBAR32(0x1124) = 0x68a41404; - MCHBAR32(0x1128) = 0x66a21404; - MCHBAR32(0x112c) = 0x63a01404; - MCHBAR32(0x1130) = 0x609e1404; - MCHBAR32(0x1134) = 0x5f9c1404; - MCHBAR32(0x1138) = 0x5c961404; - MCHBAR32(0x113c) = 0x58a02404; - MCHBAR32(0x1140) = 0x54942404; - MCHBAR32(0x1190) = 0x900080a; - MCHBAR16(0x11c0) = 0xc40b; - MCHBAR16(0x11c2) = 0x303; - MCHBAR16(0x11c4) = 0x301; - MCHBAR32_AND_OR(0x1190, 0, 0x8900080a); - MCHBAR32(0x11b8) = 0x70c3000; - MCHBAR8(0x11ec) = 0xa; - MCHBAR16(0x1100) = 0x800; - MCHBAR32_AND_OR(0x11bc, 0, 0x1e84800); - MCHBAR16(0x11ca) = 0xfa; - MCHBAR32(0x11e4) = 0x4e20; - MCHBAR8(0x11bc) = 0xf; - MCHBAR16(0x11da) = 0x19; - MCHBAR16(0x11ba) = 0x470c; - MCHBAR32(0x1680) = 0xe6ffe4ff; - MCHBAR32(0x1684) = 0xdeffdaff; - MCHBAR32(0x1688) = 0xd4ffd0ff; - MCHBAR32(0x168c) = 0xccffc6ff; - MCHBAR32(0x1690) = 0xc0ffbeff; - MCHBAR32(0x1694) = 0xb8ffb0ff; - MCHBAR32(0x1698) = 0xa8ff0000; - MCHBAR32(0x169c) = 0xc00; - MCHBAR32(0x1290) = 0x5000000; - } - - MCHBAR32(0x124c) = 0x15040d00; - MCHBAR32(0x1250) = 0x7f0000; - MCHBAR32(0x1254) = 0x1e220004; - MCHBAR32(0x1258) = 0x4000004; - MCHBAR32(0x1278) = 0x0; - MCHBAR32(0x125c) = 0x0; - MCHBAR32(0x1260) = 0x0; - MCHBAR32(0x1264) = 0x0; - MCHBAR32(0x1268) = 0x0; - MCHBAR32(0x126c) = 0x0; - MCHBAR32(0x1270) = 0x0; - MCHBAR32(0x1274) = 0x0; - } - - if ((deven & 8) && x2ca8 == 0) { - MCHBAR16(0x1214) = 0x320; - MCHBAR32(0x1600) = 0x40000000; - MCHBAR32_AND_OR(0x11f4, 0, 0x10000000); - MCHBAR16_AND_OR(0x1230, 0, 0x8000); - MCHBAR32(0x1400) = 0x13040020; - MCHBAR32(0x1404) = 0xe090120; - MCHBAR32(0x1408) = 0x5120220; - MCHBAR32(0x140c) = 0x5120330; - MCHBAR32(0x1410) = 0xe090220; - MCHBAR32(0x1414) = 0x1010001; - MCHBAR32(0x1418) = 0x1110000; - MCHBAR32(0x141c) = 0x9020020; - MCHBAR32(0x1420) = 0xd090220; - MCHBAR32(0x1424) = 0x2090220; - MCHBAR32(0x1428) = 0x2090330; - MCHBAR32(0x142c) = 0xd090220; - MCHBAR32(0x1430) = 0x1010001; - MCHBAR32(0x1434) = 0x1110000; - MCHBAR32(0x1438) = 0x11040020; - MCHBAR32(0x143c) = 0x4030220; - MCHBAR32(0x1440) = 0x1060220; - MCHBAR32(0x1444) = 0x1060330; - MCHBAR32(0x1448) = 0x4030220; - MCHBAR32(0x144c) = 0x1010001; - MCHBAR32(0x1450) = 0x1110000; - MCHBAR32(0x1454) = 0x4010020; - MCHBAR32(0x1458) = 0xb090220; - MCHBAR32(0x145c) = 0x1090220; - MCHBAR32(0x1460) = 0x1090330; - MCHBAR32(0x1464) = 0xb090220; - MCHBAR32(0x1468) = 0x1010001; - MCHBAR32(0x146c) = 0x1110000; - MCHBAR32(0x1470) = 0xf040020; - MCHBAR32(0x1474) = 0xa090220; - MCHBAR32(0x1478) = 0x1120220; - MCHBAR32(0x147c) = 0x1120330; - MCHBAR32(0x1480) = 0xa090220; - MCHBAR32(0x1484) = 0x1010001; - MCHBAR32(0x1488) = 0x1110000; - MCHBAR32(0x148c) = 0x7020020; - MCHBAR32(0x1490) = 0x1010220; - MCHBAR32(0x1494) = 0x10210; - MCHBAR32(0x1498) = 0x10320; - MCHBAR32(0x149c) = 0x1010220; - MCHBAR32(0x14a0) = 0x1010001; - MCHBAR32(0x14a4) = 0x1110000; - MCHBAR32(0x14a8) = 0xd040020; - MCHBAR32(0x14ac) = 0x8090220; - MCHBAR32(0x14b0) = 0x1111310; - MCHBAR32(0x14b4) = 0x1111420; - MCHBAR32(0x14b8) = 0x8090220; - MCHBAR32(0x14bc) = 0x1010001; - MCHBAR32(0x14c0) = 0x1110000; - MCHBAR32(0x14c4) = 0x3010020; - MCHBAR32(0x14c8) = 0x7090220; - MCHBAR32(0x14cc) = 0x1081310; - MCHBAR32(0x14d0) = 0x1081420; - MCHBAR32(0x14d4) = 0x7090220; - MCHBAR32(0x14d8) = 0x1010001; - MCHBAR32(0x14dc) = 0x1110000; - MCHBAR32(0x14e0) = 0xb040020; - MCHBAR32(0x14e4) = 0x2030220; - MCHBAR32(0x14e8) = 0x1051310; - MCHBAR32(0x14ec) = 0x1051420; - MCHBAR32(0x14f0) = 0x2030220; - MCHBAR32(0x14f4) = 0x1010001; - MCHBAR32(0x14f8) = 0x1110000; - MCHBAR32(0x14fc) = 0x5020020; - MCHBAR32(0x1500) = 0x5090220; - MCHBAR32(0x1504) = 0x2071310; - MCHBAR32(0x1508) = 0x2071420; - MCHBAR32(0x150c) = 0x5090220; - MCHBAR32(0x1510) = 0x1010001; - MCHBAR32(0x1514) = 0x1110000; - MCHBAR32(0x1518) = 0x7040120; - MCHBAR32(0x151c) = 0x2090220; - MCHBAR32(0x1520) = 0x70b1210; - MCHBAR32(0x1524) = 0x70b1310; - MCHBAR32(0x1528) = 0x2090220; - MCHBAR32(0x152c) = 0x1010001; - MCHBAR32(0x1530) = 0x1110000; - MCHBAR32(0x1534) = 0x1010110; - MCHBAR32(0x1538) = 0x1081310; - MCHBAR32(0x153c) = 0x5041200; - MCHBAR32(0x1540) = 0x5041310; - MCHBAR32(0x1544) = 0x1081310; - MCHBAR32(0x1548) = 0x1010001; - MCHBAR32(0x154c) = 0x1110000; - MCHBAR32(0x1550) = 0x1040120; - MCHBAR32(0x1554) = 0x4051210; - MCHBAR32(0x1558) = 0xd051200; - MCHBAR32(0x155c) = 0xd051200; - MCHBAR32(0x1560) = 0x4051210; - MCHBAR32(0x1564) = 0x1010001; - MCHBAR32(0x1568) = 0x1110000; - MCHBAR16(0x1222) = 0x220a; - MCHBAR16(0x123c) = 0x1fc0; - MCHBAR16(0x1220) = 0x1388; - } - - MCHBAR32_AND_OR(0x2c80, 0, 0x1053688); // !!!! - MCHBAR32(0x1c04); // !!!! - MCHBAR32(0x1804) = 0x406080; - - MCHBAR8(0x2ca8); - - if (x2ca8 == 0) { - MCHBAR8_AND(0x2ca8, ~3); - MCHBAR8(0x2ca8) = MCHBAR8(0x2ca8) + 4; // "+" or "|"? - /* This issues a CPU reset without resetting the platform */ - printk(BIOS_DEBUG, "Issuing a CPU reset\n"); - /* Write back the S3 state to PM1_CNT to let the reset CPU - know it also needs to take the s3 path. */ - if (s3resume) - write_pmbase32(PM1_CNT, read_pmbase32(PM1_CNT) - | (SLP_TYP_S3 << 10)); - MCHBAR32_OR(0x1af0, 0x10); - halt(); - } - - MCHBAR8(0x2ca8) = MCHBAR8(0x2ca8); - MCHBAR32_AND_OR(0x2c80, 0, 0x53688); // !!!! - pci_write_config32(PCI_DEV (0xff, 0, 0), 0x60, 0x20220); - MCHBAR16(0x2c20); // !!!! - MCHBAR16(0x2c10); // !!!! - MCHBAR16(0x2c00); // !!!! - MCHBAR16(0x2c00) = 0x8c0; - udelay(1000); - write_1d0(0, 0x33d, 0, 0); - write_500(&info, 0, 0, 0xb61, 0, 0); - write_500(&info, 1, 0, 0xb61, 0, 0); - MCHBAR32(0x1a30) = 0x0; - MCHBAR32(0x1a34) = 0x0; - MCHBAR16(0x614) = 0xb5b | (info.populated_ranks[1][0][0] * 0x404) | - (info.populated_ranks[0][0][0] * 0xa0); - MCHBAR16(0x616) = 0x26a; - MCHBAR32(0x134) = 0x856000; - MCHBAR32(0x160) = 0x5ffffff; - MCHBAR32_AND_OR(0x114, 0, 0xc2024440); // !!!! - MCHBAR32_AND_OR(0x118, 0, 0x4); // !!!! - for (channel = 0; channel < NUM_CHANNELS; channel++) - MCHBAR32(0x260 + (channel << 10)) = 0x30809ff | - ((info.populated_ranks_mask[channel] & 3) << 20); - for (channel = 0; channel < NUM_CHANNELS; channel++) { - MCHBAR16(0x31c + (channel << 10)) = 0x101; - MCHBAR16(0x360 + (channel << 10)) = 0x909; - MCHBAR16(0x3a4 + (channel << 10)) = 0x101; - MCHBAR16(0x3e8 + (channel << 10)) = 0x101; - MCHBAR32(0x320 + (channel << 10)) = 0x29002900; - MCHBAR32(0x324 + (channel << 10)) = 0x0; - MCHBAR32(0x368 + (channel << 10)) = 0x32003200; - MCHBAR16(0x352 + (channel << 10)) = 0x505; - MCHBAR16(0x354 + (channel << 10)) = 0x3c3c; - MCHBAR16(0x356 + (channel << 10)) = 0x1040; - MCHBAR16(0x39a + (channel << 10)) = 0x73e4; - MCHBAR16(0x3de + (channel << 10)) = 0x77ed; - MCHBAR16(0x422 + (channel << 10)) = 0x1040; - } - - write_1d0(0x4, 0x151, 4, 1); - write_1d0(0, 0x142, 3, 1); - rdmsr(0x1ac); // !!!! - write_500(&info, 1, 1, 0x6b3, 4, 1); - write_500(&info, 1, 1, 0x6cf, 4, 1); - - rmw_1d0(0x21c, 0x38, 0, 6, 1); - - write_1d0(((!info.populated_ranks[1][0][0]) << 1) | ((!info. - populated_ranks[0] - [0][0]) << 0), - 0x1d1, 3, 1); - for (channel = 0; channel < NUM_CHANNELS; channel++) { - MCHBAR16(0x38e + (channel << 10)) = 0x5f5f; - MCHBAR16(0x3d2 + (channel << 10)) = 0x5f5f; - } - - set_334(0); - - program_base_timings(&info); - - MCHBAR8_OR(0x5ff, 0x80); - - write_1d0(0x2, 0x1d5, 2, 1); - write_1d0(0x20, 0x166, 7, 1); - write_1d0(0x0, 0xeb, 3, 1); - write_1d0(0x0, 0xf3, 6, 1); - - for (channel = 0; channel < NUM_CHANNELS; channel++) - for (lane = 0; lane < 9; lane++) { - u16 addr = 0x125 + get_lane_offset(0, 0, lane); - u8 a; - a = read_500(&info, channel, addr, 6); // = 0x20040080 //!!!! - write_500(&info, channel, a, addr, 6, 1); - } - - udelay(1000); - - if (s3resume) { - if (info.cached_training == NULL) { - u32 reg32; - printk(BIOS_ERR, - "Couldn't find training data. Rebooting\n"); - reg32 = inl(DEFAULT_PMBASE + 0x04); - outl(reg32 & ~(7 << 10), DEFAULT_PMBASE + 0x04); - full_reset(); - } - int tm; - info.training = *info.cached_training; - for (tm = 0; tm < 4; tm++) - for (channel = 0; channel < NUM_CHANNELS; channel++) - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_RANKS; rank++) - for (lane = 0; lane < 9; lane++) - write_500(&info, - channel, - info.training. - lane_timings - [tm][channel] - [slot][rank] - [lane], - get_timing_register_addr - (lane, tm, - slot, rank), - 9, 0); - write_1d0(info.cached_training->reg_178, 0x178, 7, 1); - write_1d0(info.cached_training->reg_10b, 0x10b, 6, 1); - } - - MCHBAR32_AND_OR(0x1f4, 0, 0x20000); // !!!! - MCHBAR32(0x1f0) = 0x1d000200; - MCHBAR8_AND_OR(0x1f0, 0, 0x1); // !!!! - MCHBAR8(0x1f0); // !!!! - - program_board_delay(&info); - - MCHBAR8(0x5ff) = 0x0; - MCHBAR8(0x5ff) = 0x80; - MCHBAR8(0x5f4) = 0x1; - - MCHBAR32_AND(0x130, 0xfffffffd); // | 2 when ? - while (MCHBAR32(0x130) & 1) - ; - gav(read_1d0(0x14b, 7)); // = 0x81023100 - write_1d0(0x30, 0x14b, 7, 1); - read_1d0(0xd6, 6); // = 0xfa008080 // !!!! - write_1d0(7, 0xd6, 6, 1); - read_1d0(0x328, 6); // = 0xfa018080 // !!!! - write_1d0(7, 0x328, 6, 1); - - for (channel = 0; channel < NUM_CHANNELS; channel++) - set_4cf(&info, channel, - info.populated_ranks[channel][0][0] ? 8 : 0); - - read_1d0(0x116, 4); // = 0x4040432 // !!!! - write_1d0(2, 0x116, 4, 1); - read_1d0(0xae, 6); // = 0xe8088080 // !!!! - write_1d0(0, 0xae, 6, 1); - read_1d0(0x300, 4); // = 0x48088080 // !!!! - write_1d0(0, 0x300, 6, 1); - MCHBAR16_AND_OR(0x356, 0, 0x1040); // !!!! - MCHBAR16_AND_OR(0x756, 0, 0x1040); // !!!! - MCHBAR32_AND(0x140, ~0x07000000); - MCHBAR32_AND(0x138, ~0x07000000); - MCHBAR32(0x130) = 0x31111301; - /* Wait until REG130b0 is 1. */ - while (MCHBAR32(0x130) & 1) - ; - - { - u32 t; - u8 val_a1; - val_a1 = read_1d0(0xa1, 6); // = 0x1cf4040 // !!!! - t = read_1d0(0x2f3, 6); // = 0x10a4040 // !!!! - rmw_1d0(0x320, 0x07, - (t & 4) | ((t & 8) >> 2) | ((t & 0x10) >> 4), 6, 1); - rmw_1d0(0x14b, 0x78, - ((((val_a1 >> 2) & 4) | (val_a1 & 8)) >> 2) | (val_a1 & - 4), 7, - 1); - rmw_1d0(0xce, 0x38, - ((((val_a1 >> 2) & 4) | (val_a1 & 8)) >> 2) | (val_a1 & - 4), 6, - 1); - } - - for (channel = 0; channel < NUM_CHANNELS; channel++) - set_4cf(&info, channel, - info.populated_ranks[channel][0][0] ? 9 : 1); - - rmw_1d0(0x116, 0xe, 1, 4, 1); // = 0x4040432 // !!!! - MCHBAR32(0x144); // !!!! - write_1d0(2, 0xae, 6, 1); - write_1d0(2, 0x300, 6, 1); - write_1d0(2, 0x121, 3, 1); - read_1d0(0xd6, 6); // = 0xfa00c0c7 // !!!! - write_1d0(4, 0xd6, 6, 1); - read_1d0(0x328, 6); // = 0xfa00c0c7 // !!!! - write_1d0(4, 0x328, 6, 1); - - for (channel = 0; channel < NUM_CHANNELS; channel++) - set_4cf(&info, channel, - info.populated_ranks[channel][0][0] ? 9 : 0); - - MCHBAR32(0x130) = 0x11111301 | (info.populated_ranks[1][0][0] << 30) | - (info.populated_ranks[0][0][0] << 29); - while (MCHBAR8(0x130) & 1) - ; - read_1d0(0xa1, 6); // = 0x1cf4054 // !!!! - read_1d0(0x2f3, 6); // = 0x10a4054 // !!!! - read_1d0(0x21c, 6); // = 0xafa00c0 // !!!! - write_1d0(0, 0x21c, 6, 1); - read_1d0(0x14b, 7); // = 0x810231b0 // !!!! - write_1d0(0x35, 0x14b, 7, 1); - - for (channel = 0; channel < NUM_CHANNELS; channel++) - set_4cf(&info, channel, - info.populated_ranks[channel][0][0] ? 0xb : 0x2); - - set_334(1); - - MCHBAR8(0x1e8) = 0x4; - - for (channel = 0; channel < NUM_CHANNELS; channel++) { - write_500(&info, channel, - 0x3 & ~(info.populated_ranks_mask[channel]), 0x6b7, 2, - 1); - write_500(&info, channel, 0x3, 0x69b, 2, 1); - } - MCHBAR32_AND_OR(0x2d0, 0xff2c01ff, 0x200000); - MCHBAR16(0x6c0) = 0x14a0; - MCHBAR32_AND_OR(0x6d0, 0xff0080ff, 0x8000); - MCHBAR16(0x232) = 0x8; - /* 0x40004 or 0 depending on ? */ - MCHBAR32_AND_OR(0x234, 0xfffbfffb, 0x40004); - MCHBAR32_AND_OR(0x34, 0xfffffffd, 5); - MCHBAR32(0x128) = 0x2150d05; - MCHBAR8(0x12c) = 0x1f; - MCHBAR8(0x12d) = 0x56; - MCHBAR8(0x12e) = 0x31; - MCHBAR8(0x12f) = 0x0; - MCHBAR8(0x271) = 0x2; - MCHBAR8(0x671) = 0x2; - MCHBAR8(0x1e8) = 0x4; - for (channel = 0; channel < NUM_CHANNELS; channel++) - MCHBAR32(0x294 + (channel << 10)) = - (info.populated_ranks_mask[channel] & 3) << 16; - MCHBAR32_AND_OR(0x134, 0xfc01ffff, 0x10000); - MCHBAR32_AND_OR(0x134, 0xfc85ffff, 0x850000); - for (channel = 0; channel < NUM_CHANNELS; channel++) - MCHBAR32_AND_OR(0x260 + (channel << 10), ~0xf00000, 0x8000000 | - ((info.populated_ranks_mask[channel] & 3) << 20)); - - if (!s3resume) - jedec_init(&info); - - int totalrank = 0; - for (channel = 0; channel < NUM_CHANNELS; channel++) - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_RANKS; rank++) - if (info.populated_ranks[channel][slot][rank]) { - jedec_read(&info, channel, slot, rank, - totalrank, 0xa, 0x400); - totalrank++; - } - - MCHBAR8(0x12c) = 0x9f; - - MCHBAR8_AND_OR(0x271, 0, 0xe); // 2 // !!!! - MCHBAR8_AND_OR(0x671, 0, 0xe); // !!!! - - if (!s3resume) { - for (channel = 0; channel < NUM_CHANNELS; channel++) { - MCHBAR32(0x294 + (channel << 10)) = - (info.populated_ranks_mask[channel] & 3) << 16; - MCHBAR16(0x298 + (channel << 10)) = - info.populated_ranks[channel][0][0] | - (info.populated_ranks[channel][0][1] << 5); - MCHBAR32(0x29c + (channel << 10)) = 0x77a; - } - MCHBAR32_AND_OR(0x2c0, 0, 0x6009cc00); // !!!! - - { - u8 a, b; - a = MCHBAR8(0x243); - b = MCHBAR8(0x643); - MCHBAR8(0x243) = a | 2; - MCHBAR8(0x643) = b | 2; - } - - write_1d0(7, 0x19b, 3, 1); - write_1d0(7, 0x1c0, 3, 1); - write_1d0(4, 0x1c6, 4, 1); - write_1d0(4, 0x1cc, 4, 1); - read_1d0(0x151, 4); // = 0x408c6d74 // !!!! - write_1d0(4, 0x151, 4, 1); - MCHBAR32(0x584) = 0xfffff; - MCHBAR32(0x984) = 0xfffff; - - for (channel = 0; channel < NUM_CHANNELS; channel++) - for (slot = 0; slot < NUM_SLOTS; slot++) - for (rank = 0; rank < NUM_RANKS; rank++) - if (info. - populated_ranks[channel][slot] - [rank]) - config_rank(&info, s3resume, - channel, slot, - rank); - - MCHBAR8(0x243) = 0x1; - MCHBAR8(0x643) = 0x1; - } - - /* was == 1 but is common */ - pci_write_config16(NORTHBRIDGE, 0xc8, 3); - write_26c(0, 0x820); - write_26c(1, 0x820); - MCHBAR32_OR(0x130, 2); - /* end */ - - if (s3resume) { - for (channel = 0; channel < NUM_CHANNELS; channel++) { - MCHBAR32(0x294 + (channel << 10)) = - (info.populated_ranks_mask[channel] & 3) << 16; - MCHBAR16(0x298 + (channel << 10)) = - info.populated_ranks[channel][0][0] | - (info.populated_ranks[channel][0][1] << 5); - MCHBAR32(0x29c + (channel << 10)) = 0x77a; - } - MCHBAR32_AND_OR(0x2c0, 0, 0x6009cc00); // !!!! - } - - MCHBAR32_AND(0xfa4, ~0x01000002); - MCHBAR32(0xfb0) = 0x2000e019; - - /* Before training. */ - timestamp_add_now(103); - - if (!s3resume) - ram_training(&info); - - /* After training. */ - timestamp_add_now(104); - - dump_timings(&info); - - program_modules_memory_map(&info, 0); - program_total_memory_map(&info); - - if (info.non_interleaved_part_mb != 0 && info.interleaved_part_mb != 0) - MCHBAR8(0x111) = 0x20 | (0 << 2) | (1 << 6) | (0 << 7); - else if (have_match_ranks(&info, 0, 4) && have_match_ranks(&info, 1, 4)) - MCHBAR8(0x111) = 0x20 | (3 << 2) | (0 << 6) | (1 << 7); - else if (have_match_ranks(&info, 0, 2) && have_match_ranks(&info, 1, 2)) - MCHBAR8(0x111) = 0x20 | (3 << 2) | (0 << 6) | (0 << 7); - else - MCHBAR8(0x111) = 0x20 | (3 << 2) | (1 << 6) | (0 << 7); - - MCHBAR32_AND(0xfac, ~0x80000000); - MCHBAR32(0xfb4) = 0x4800; - MCHBAR32(0xfb8) = (info.revision < 8) ? 0x20 : 0x0; - MCHBAR32(0xe94) = 0x7ffff; - MCHBAR32(0xfc0) = 0x80002040; - MCHBAR32(0xfc4) = 0x701246; - MCHBAR8_AND(0xfc8, ~0x70); - MCHBAR32_OR(0xe5c, 0x1000000); - MCHBAR32_AND_OR(0x1a70, ~0x00100000, 0x00200000); - MCHBAR32(0x50) = 0x700b0; - MCHBAR32(0x3c) = 0x10; - MCHBAR8(0x1aa8) = (MCHBAR8(0x1aa8) & ~0x35) | 0xa; - MCHBAR8_OR(0xff4, 0x2); - MCHBAR32_AND_OR(0xff8, ~0xe008, 0x1020); - -#if 1 - MCHBAR32(0xd00) = IOMMU_BASE2 | 1; - MCHBAR32(0xd40) = IOMMU_BASE1 | 1; - MCHBAR32(0xdc0) = IOMMU_BASE4 | 1; - - write32p(IOMMU_BASE1 | 0xffc, 0x80000000); - write32p(IOMMU_BASE2 | 0xffc, 0xc0000000); - write32p(IOMMU_BASE4 | 0xffc, 0x80000000); - -#else - { - u32 eax; - // = 0xe911714b - eax = read32p(0xffc + (MCHBAR32(0xd00) & ~1)) | 0x08000000; - write32p(0xffc + (MCHBAR32(0xd00) & ~1), eax); - // = 0xe911714b - eax = read32p(0xffc + (MCHBAR32(0xdc0) & ~1)) | 0x40000000; - write32p(0xffc + (MCHBAR32(0xdc0) & ~1), eax); - } -#endif - - { - u32 eax; - - eax = info.fsb_frequency / 9; - MCHBAR32_AND_OR(0xfcc, 0xfffc0000, - (eax * 0x280) | (eax * 0x5000) | eax | 0x40000); - MCHBAR32(0x20) = 0x33001; - } - - for (channel = 0; channel < NUM_CHANNELS; channel++) { - MCHBAR32_AND(0x220 + (channel << 10), ~0x7770); - if (info.max_slots_used_in_channel == 1) - MCHBAR16_OR(0x237 + (channel << 10), 0x0201); - else - MCHBAR16_AND(0x237 + (channel << 10), ~0x0201); - - MCHBAR8_OR(0x241 + (channel << 10), 1); - - if (info.clock_speed_index <= 1 && (info.silicon_revision == 2 - || info.silicon_revision == 3)) - MCHBAR32_OR(0x248 + (channel << 10), 0x00102000); - else - MCHBAR32_AND(0x248 + (channel << 10), ~0x00102000); - } - - MCHBAR32_OR(0x115, 0x1000000); - - { - u8 al; - al = 0xd; - if (!(info.silicon_revision == 0 || info.silicon_revision == 1)) - al += 2; - al |= ((1 << (info.max_slots_used_in_channel - 1)) - 1) << 4; - MCHBAR32(0x210) = (al << 16) | 0x20; - } - - for (channel = 0; channel < NUM_CHANNELS; channel++) { - MCHBAR32(0x288 + (channel << 10)) = 0x70605040; - MCHBAR32(0x28c + (channel << 10)) = 0xfffec080; - MCHBAR32(0x290 + (channel << 10)) = 0x282091c | - ((info.max_slots_used_in_channel - 1) << 0x16); - } - u32 reg1c; - pci_read_config32(NORTHBRIDGE, 0x40); // = DEFAULT_EPBAR | 0x001 // OK - reg1c = read32p(DEFAULT_EPBAR | 0x01c); // = 0x8001 // OK - pci_read_config32(NORTHBRIDGE, 0x40); // = DEFAULT_EPBAR | 0x001 // OK - write32p(DEFAULT_EPBAR | 0x01c, reg1c); // OK - MCHBAR8(0xe08); // = 0x0 - pci_read_config32(NORTHBRIDGE, 0xe4); // = 0x316126 - MCHBAR8_OR(0x1210, 2); - MCHBAR32(0x1200) = 0x8800440; - MCHBAR32(0x1204) = 0x53ff0453; - MCHBAR32(0x1208) = 0x19002043; - MCHBAR16(0x1214) = 0x320; - - if (info.revision == 0x10 || info.revision == 0x11) { - MCHBAR16(0x1214) = 0x220; - MCHBAR8_OR(0x1210, 0x40); - } - - MCHBAR8_OR(0x1214, 0x4); - MCHBAR8(0x120c) = 0x1; - MCHBAR8(0x1218) = 0x3; - MCHBAR8(0x121a) = 0x3; - MCHBAR8(0x121c) = 0x3; - MCHBAR16(0xc14) = 0x0; - MCHBAR16(0xc20) = 0x0; - MCHBAR32(0x1c) = 0x0; - - /* revision dependent here. */ - - MCHBAR16_OR(0x1230, 0x1f07); - - if (info.uma_enabled) - MCHBAR32_OR(0x11f4, 0x10000000); - - MCHBAR16_OR(0x1230, 0x8000); - MCHBAR8_OR(0x1214, 1); - - u8 bl, ebpb; - u16 reg_1020; - - reg_1020 = MCHBAR32(0x1020); // = 0x6c733c // OK - MCHBAR8(0x1070) = 0x1; - - MCHBAR32(0x1000) = 0x100; - MCHBAR8(0x1007) = 0x0; - - if (reg_1020 != 0) { - MCHBAR16(0x1018) = 0x0; - bl = reg_1020 >> 8; - ebpb = reg_1020 & 0xff; - } else { - ebpb = 0; - bl = 8; - } - - rdmsr(0x1a2); - - MCHBAR32(0x1014) = 0xffffffff; - - MCHBAR32(0x1010) = ((((ebpb + 0x7d) << 7) / bl) & 0xff) * (!!reg_1020); - - MCHBAR8(0x101c) = 0xb8; - - MCHBAR8(0x123e) = (MCHBAR8(0x123e) & 0xf) | 0x60; - if (reg_1020 != 0) { - MCHBAR32_AND_OR(0x123c, ~0x00900000, 0x600000); - MCHBAR8(0x101c) = 0xb8; - } - - setup_heci_uma(&info); - - if (info.uma_enabled) { - u16 ax; - MCHBAR32_OR(0x11b0, 0x4000); - MCHBAR32_OR(0x11b4, 0x4000); - MCHBAR16_OR(0x1190, 0x4000); - - ax = MCHBAR16(0x1190) & 0xf00; // = 0x480a // OK - MCHBAR16(0x1170) = ax | (MCHBAR16(0x1170) & 0x107f) | 0x4080; - MCHBAR16_OR(0x1170, 0x1000); - - udelay(1000); - - u16 ecx; - for (ecx = 0xffff; ecx && (MCHBAR16(0x1170) & 0x1000); ecx--) - ; - MCHBAR16_AND(0x1190, ~0x4000); - } - - pci_write_config8(SOUTHBRIDGE, GEN_PMCON_2, - pci_read_config8(SOUTHBRIDGE, GEN_PMCON_2) & ~0x80); - udelay(10000); - MCHBAR16(0x2ca8) = 0x8; - - udelay(1000); - dump_timings(&info); - cbmem_wasnot_inited = cbmem_recovery(s3resume); - - if (!s3resume) - save_timings(&info); - if (s3resume && cbmem_wasnot_inited) { - u32 reg32; - printk(BIOS_ERR, "Failed S3 resume.\n"); - ram_check(0x100000, 0x200000); - - /* Clear SLP_TYPE. */ - reg32 = inl(DEFAULT_PMBASE + 0x04); - outl(reg32 & ~(7 << 10), DEFAULT_PMBASE + 0x04); - - /* Failed S3 resume, reset to come up cleanly */ - full_reset(); - } -} |