2730 lines
		
	
	
		
			72 KiB
		
	
	
	
		
			C
		
	
	
	
			
		
		
	
	
			2730 lines
		
	
	
		
			72 KiB
		
	
	
	
		
			C
		
	
	
	
| // SPDX-License-Identifier: GPL-2.0
 | |
| /*
 | |
|  * Copyright (C) 2020 Marvell International Ltd.
 | |
|  */
 | |
| 
 | |
| #include <command.h>
 | |
| #include <config.h>
 | |
| #include <dm.h>
 | |
| #include <hang.h>
 | |
| #include <i2c.h>
 | |
| #include <ram.h>
 | |
| #include <time.h>
 | |
| #include <asm/global_data.h>
 | |
| 
 | |
| #include <asm/sections.h>
 | |
| #include <linux/io.h>
 | |
| 
 | |
| #include <mach/octeon_ddr.h>
 | |
| 
 | |
/* Default DDR reference clock in Hz (50 MHz) */
#define CONFIG_REF_HERTZ	50000000

DECLARE_GLOBAL_DATA_PTR;
 | |
| 
 | |
| /* Sign of an integer */
 | |
| static s64 _sign(s64 v)
 | |
| {
 | |
| 	return (v < 0);
 | |
| }
 | |
| 
 | |
| #ifndef DDR_NO_DEBUG
 | |
/*
 * Look up a DDR debug parameter in the environment.
 *
 * The variable name is built printf-style from @format and the trailing
 * arguments into a 64-byte buffer (vsnprintf() bounds the write), then
 * resolved through ddr_getenv_debug(). When a value is found, the raw
 * string and the number obtained from simple_strtoul() with base 0 are
 * printed.
 *
 * Returns the string handed back by ddr_getenv_debug(), or NULL when it
 * returned none.
 */
char *lookup_env(struct ddr_priv *priv, const char *format, ...)
{
	char name[64];
	va_list ap;
	char *env;
	unsigned long parsed;

	va_start(ap, format);
	vsnprintf(name, sizeof(name), format, ap);
	va_end(ap);

	env = ddr_getenv_debug(priv, name);
	if (!env)
		return NULL;

	parsed = simple_strtoul(env, NULL, 0);
	printf("Parameter found in environment %s=\"%s\" 0x%lx (%ld)\n",
	       name, env, parsed, parsed);

	return env;
}
 | |
| 
 | |
| char *lookup_env_ull(struct ddr_priv *priv, const char *format, ...)
 | |
| {
 | |
| 	char *s;
 | |
| 	u64 value;
 | |
| 	va_list args;
 | |
| 	char buffer[64];
 | |
| 
 | |
| 	va_start(args, format);
 | |
| 	vsnprintf(buffer, sizeof(buffer), format, args);
 | |
| 	va_end(args);
 | |
| 
 | |
| 	s = ddr_getenv_debug(priv, buffer);
 | |
| 	if (s) {
 | |
| 		value = simple_strtoull(s, NULL, 0);
 | |
| 		printf("Parameter found in environment. %s = 0x%016llx\n",
 | |
| 		       buffer, value);
 | |
| 	}
 | |
| 
 | |
| 	return s;
 | |
| }
 | |
| #else
 | |
/*
 * DDR_NO_DEBUG variant: no environment lookup is performed, so the
 * caller is always told that no override exists.
 */
char *lookup_env(struct ddr_priv *priv, const char *format, ...)
{
	return NULL;
}
 | |
| 
 | |
/*
 * DDR_NO_DEBUG variant: no environment lookup is performed, so the
 * caller is always told that no 64-bit override exists.
 */
char *lookup_env_ull(struct ddr_priv *priv, const char *format, ...)
{
	return NULL;
}
 | |
| #endif
 | |
| 
 | |
/*
 * Number of L2C Tag-and-data sections (TADs) that are connected to LMC:
 * 4 on CN68XX, CN73XX and CNF75XX, 8 on CN78XX, 1 on any other model.
 */
#define CVMX_L2C_TADS							\
	((OCTEON_IS_MODEL(OCTEON_CN68XX) ||				\
	  OCTEON_IS_MODEL(OCTEON_CN73XX) ||				\
	  OCTEON_IS_MODEL(OCTEON_CNF75XX)) ? 4 :			\
	 (OCTEON_IS_MODEL(OCTEON_CN78XX) ? 8 : 1))
 | |
| 
 | |
/*
 * Number of L2C IOBs connected to LMC: 2 on CN68XX, CN78XX, CN73XX and
 * CNF75XX, 1 on any other model.
 */
#define CVMX_L2C_IOBS							\
	((OCTEON_IS_MODEL(OCTEON_CN68XX) ||				\
	  OCTEON_IS_MODEL(OCTEON_CN78XX) ||				\
	  OCTEON_IS_MODEL(OCTEON_CN73XX) ||				\
	  OCTEON_IS_MODEL(OCTEON_CNF75XX)) ? 2 : 1)
 | |
| 
 | |
/*
 * Per-model memory size limit: 32 per TAD on OCTEON II, 512 on CN70XX,
 * 1024 on the remaining OCTEON III models and 0 otherwise.
 * cvmx_l2c_set_big_size() multiplies this value by 1024 before comparing
 * it with a size expressed in MB.
 */
#define CVMX_L2C_MAX_MEMSZ_ALLOWED					\
	(OCTEON_IS_OCTEON2() ? (32 * CVMX_L2C_TADS) :			\
	 OCTEON_IS_MODEL(OCTEON_CN70XX) ? 512 :				\
	 OCTEON_IS_OCTEON3() ? 1024 : 0)
 | |
| 
 | |
| /**
 | |
|  * Initialize the BIG address in L2C+DRAM to generate proper error
 | |
|  * on reading/writing to an non-existent memory location.
 | |
|  *
 | |
|  * @param node      OCX CPU node number
 | |
|  * @param mem_size  Amount of DRAM configured in MB.
 | |
|  * @param mode      Allow/Disallow reporting errors L2C_INT_SUM[BIGRD,BIGWR].
 | |
|  */
 | |
| static void cvmx_l2c_set_big_size(struct ddr_priv *priv, u64 mem_size, int mode)
 | |
| {
 | |
| 	if ((OCTEON_IS_OCTEON2() || OCTEON_IS_OCTEON3()) &&
 | |
| 	    !OCTEON_IS_MODEL(OCTEON_CN63XX_PASS1_X)) {
 | |
| 		union cvmx_l2c_big_ctl big_ctl;
 | |
| 		int bits = 0, zero_bits = 0;
 | |
| 		u64 mem;
 | |
| 
 | |
| 		if (mem_size > (CVMX_L2C_MAX_MEMSZ_ALLOWED * 1024ull)) {
 | |
| 			printf("WARNING: Invalid memory size(%lld) requested, should be <= %lld\n",
 | |
| 			       mem_size,
 | |
| 			       (u64)CVMX_L2C_MAX_MEMSZ_ALLOWED * 1024);
 | |
| 			mem_size = CVMX_L2C_MAX_MEMSZ_ALLOWED * 1024;
 | |
| 		}
 | |
| 
 | |
| 		mem = mem_size;
 | |
| 		while (mem) {
 | |
| 			if ((mem & 1) == 0)
 | |
| 				zero_bits++;
 | |
| 			bits++;
 | |
| 			mem >>= 1;
 | |
| 		}
 | |
| 
 | |
| 		if ((bits - zero_bits) != 1 || (bits - 9) <= 0) {
 | |
| 			printf("ERROR: Invalid DRAM size (%lld) requested, refer to L2C_BIG_CTL[maxdram] for valid options.\n",
 | |
| 			       mem_size);
 | |
| 			return;
 | |
| 		}
 | |
| 
 | |
| 		/*
 | |
| 		 * The BIG/HOLE is logic is not supported in pass1 as per
 | |
| 		 * Errata L2C-17736
 | |
| 		 */
 | |
| 		if (mode == 0 && OCTEON_IS_MODEL(OCTEON_CN78XX_PASS1_X))
 | |
| 			mode = 1;
 | |
| 
 | |
| 		big_ctl.u64 = 0;
 | |
| 		big_ctl.s.maxdram = bits - 9;
 | |
| 		big_ctl.cn61xx.disable = mode;
 | |
| 		l2c_wr(priv, CVMX_L2C_BIG_CTL, big_ctl.u64);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| static u32 octeon3_refclock(u32 alt_refclk, u32 ddr_hertz,
 | |
| 			    struct dimm_config *dimm_config)
 | |
| {
 | |
| 	u32 ddr_ref_hertz = CONFIG_REF_HERTZ;
 | |
| 	int ddr_type;
 | |
| 	int spd_dimm_type;
 | |
| 
 | |
| 	debug("%s(%u, %u, %p)\n", __func__, alt_refclk, ddr_hertz, dimm_config);
 | |
| 
 | |
| 	/* Octeon 3 case... */
 | |
| 
 | |
| 	/* we know whether alternate refclk is always wanted
 | |
| 	 * we also know already if we want 2133 MT/s
 | |
| 	 * if alt refclk not always wanted, then probe DDR and
 | |
| 	 * DIMM type if DDR4 and RDIMMs, then set desired refclk
 | |
| 	 * to 100MHz, otherwise to default (50MHz)
 | |
| 	 * depend on ddr_initialize() to do the refclk selection
 | |
| 	 * and validation/
 | |
| 	 */
 | |
| 	if (alt_refclk) {
 | |
| 		/*
 | |
| 		 * If alternate refclk was specified, let it override
 | |
| 		 * everything
 | |
| 		 */
 | |
| 		ddr_ref_hertz = alt_refclk * 1000000;
 | |
| 		printf("%s: DRAM init: %d MHz refclk is REQUESTED ALWAYS\n",
 | |
| 		       __func__, alt_refclk);
 | |
| 	} else if (ddr_hertz > 1000000000) {
 | |
| 		ddr_type = get_ddr_type(dimm_config, 0);
 | |
| 		spd_dimm_type = get_dimm_module_type(dimm_config, 0, ddr_type);
 | |
| 
 | |
| 		debug("ddr type: 0x%x, dimm type: 0x%x\n", ddr_type,
 | |
| 		      spd_dimm_type);
 | |
| 		/* Is DDR4 and RDIMM just to be sure. */
 | |
| 		if (ddr_type == DDR4_DRAM &&
 | |
| 		    (spd_dimm_type == 1 || spd_dimm_type == 5 ||
 | |
| 		     spd_dimm_type == 8)) {
 | |
| 			/* Yes, we require 100MHz refclk, so set it. */
 | |
| 			ddr_ref_hertz = 100000000;
 | |
| 			puts("DRAM init: 100 MHz refclk is REQUIRED\n");
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	debug("%s: speed: %u\n", __func__, ddr_ref_hertz);
 | |
| 	return ddr_ref_hertz;
 | |
| }
 | |
| 
 | |
| int encode_row_lsb_ddr3(int row_lsb)
 | |
| {
 | |
| 	int row_lsb_start = 14;
 | |
| 
 | |
| 	/* Decoding for row_lsb        */
 | |
| 	/* 000: row_lsb = mem_adr[14]  */
 | |
| 	/* 001: row_lsb = mem_adr[15]  */
 | |
| 	/* 010: row_lsb = mem_adr[16]  */
 | |
| 	/* 011: row_lsb = mem_adr[17]  */
 | |
| 	/* 100: row_lsb = mem_adr[18]  */
 | |
| 	/* 101: row_lsb = mem_adr[19]  */
 | |
| 	/* 110: row_lsb = mem_adr[20]  */
 | |
| 	/* 111: RESERVED               */
 | |
| 
 | |
| 	if (octeon_is_cpuid(OCTEON_CN6XXX) ||
 | |
| 	    octeon_is_cpuid(OCTEON_CNF7XXX) || octeon_is_cpuid(OCTEON_CN7XXX))
 | |
| 		row_lsb_start = 14;
 | |
| 	else
 | |
| 		printf("ERROR: Unsupported Octeon model: 0x%x\n",
 | |
| 		       read_c0_prid());
 | |
| 
 | |
| 	return row_lsb - row_lsb_start;
 | |
| }
 | |
| 
 | |
| int encode_pbank_lsb_ddr3(int pbank_lsb)
 | |
| {
 | |
| 	/* Decoding for pbank_lsb                                        */
 | |
| 	/* 0000:DIMM = mem_adr[28]    / rank = mem_adr[27] (if RANK_ENA) */
 | |
| 	/* 0001:DIMM = mem_adr[29]    / rank = mem_adr[28]      "        */
 | |
| 	/* 0010:DIMM = mem_adr[30]    / rank = mem_adr[29]      "        */
 | |
| 	/* 0011:DIMM = mem_adr[31]    / rank = mem_adr[30]      "        */
 | |
| 	/* 0100:DIMM = mem_adr[32]    / rank = mem_adr[31]      "        */
 | |
| 	/* 0101:DIMM = mem_adr[33]    / rank = mem_adr[32]      "        */
 | |
| 	/* 0110:DIMM = mem_adr[34]    / rank = mem_adr[33]      "        */
 | |
| 	/* 0111:DIMM = 0              / rank = mem_adr[34]      "        */
 | |
| 	/* 1000-1111: RESERVED                                           */
 | |
| 
 | |
| 	int pbank_lsb_start = 0;
 | |
| 
 | |
| 	if (octeon_is_cpuid(OCTEON_CN6XXX) ||
 | |
| 	    octeon_is_cpuid(OCTEON_CNF7XXX) || octeon_is_cpuid(OCTEON_CN7XXX))
 | |
| 		pbank_lsb_start = 28;
 | |
| 	else
 | |
| 		printf("ERROR: Unsupported Octeon model: 0x%x\n",
 | |
| 		       read_c0_prid());
 | |
| 
 | |
| 	return pbank_lsb - pbank_lsb_start;
 | |
| }
 | |
| 
 | |
| static void set_ddr_clock_initialized(struct ddr_priv *priv, int if_num,
 | |
| 				      bool inited_flag)
 | |
| {
 | |
| 	priv->ddr_clock_initialized[if_num] = inited_flag;
 | |
| }
 | |
| 
 | |
| static int ddr_clock_initialized(struct ddr_priv *priv, int if_num)
 | |
| {
 | |
| 	return priv->ddr_clock_initialized[if_num];
 | |
| }
 | |
| 
 | |
| static void set_ddr_memory_preserved(struct ddr_priv *priv)
 | |
| {
 | |
| 	priv->ddr_memory_preserved = true;
 | |
| }
 | |
| 
 | |
| bool ddr_memory_preserved(struct ddr_priv *priv)
 | |
| {
 | |
| 	return priv->ddr_memory_preserved;
 | |
| }
 | |
| 
 | |
| static void cn78xx_lmc_dreset_init(struct ddr_priv *priv, int if_num)
 | |
| {
 | |
| 	union cvmx_lmcx_dll_ctl2 dll_ctl2;
 | |
| 
 | |
| 	/*
 | |
| 	 * The remainder of this section describes the sequence for LMCn.
 | |
| 	 *
 | |
| 	 * 1. If not done already, write LMC(0..3)_DLL_CTL2 to its reset value
 | |
| 	 * (except without changing the LMC(0..3)_DLL_CTL2[INTF_EN] value from
 | |
| 	 * that set in the prior Step 3), including
 | |
| 	 * LMC(0..3)_DLL_CTL2[DRESET] = 1.
 | |
| 	 *
 | |
| 	 * 2. Without changing any other LMC(0..3)_DLL_CTL2 fields, write
 | |
| 	 * LMC(0..3)_DLL_CTL2[DLL_BRINGUP] = 1.
 | |
| 	 */
 | |
| 
 | |
| 	dll_ctl2.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL2(if_num));
 | |
| 	dll_ctl2.cn78xx.dll_bringup = 1;
 | |
| 	lmc_wr(priv, CVMX_LMCX_DLL_CTL2(if_num), dll_ctl2.u64);
 | |
| 
 | |
| 	/*
 | |
| 	 * 3. Read LMC(0..3)_DLL_CTL2 and wait for the result.
 | |
| 	 */
 | |
| 
 | |
| 	lmc_rd(priv, CVMX_LMCX_DLL_CTL2(if_num));
 | |
| 
 | |
| 	/*
 | |
| 	 * 4. Wait for a minimum of 10 LMC CK cycles.
 | |
| 	 */
 | |
| 
 | |
| 	udelay(1);
 | |
| 
 | |
| 	/*
 | |
| 	 * 5. Without changing any other fields in LMC(0..3)_DLL_CTL2, write
 | |
| 	 * LMC(0..3)_DLL_CTL2[QUAD_DLL_ENA] = 1.
 | |
| 	 * LMC(0..3)_DLL_CTL2[QUAD_DLL_ENA] must not change after this point
 | |
| 	 * without restarting the LMCn DRESET initialization sequence.
 | |
| 	 */
 | |
| 
 | |
| 	dll_ctl2.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL2(if_num));
 | |
| 	dll_ctl2.cn78xx.quad_dll_ena = 1;
 | |
| 	lmc_wr(priv, CVMX_LMCX_DLL_CTL2(if_num), dll_ctl2.u64);
 | |
| 
 | |
| 	/*
 | |
| 	 * 6. Read LMC(0..3)_DLL_CTL2 and wait for the result.
 | |
| 	 */
 | |
| 
 | |
| 	lmc_rd(priv, CVMX_LMCX_DLL_CTL2(if_num));
 | |
| 
 | |
| 	/*
 | |
| 	 * 7. Wait a minimum of 10 us.
 | |
| 	 */
 | |
| 
 | |
| 	udelay(10);
 | |
| 
 | |
| 	/*
 | |
| 	 * 8. Without changing any other fields in LMC(0..3)_DLL_CTL2, write
 | |
| 	 * LMC(0..3)_DLL_CTL2[DLL_BRINGUP] = 0.
 | |
| 	 * LMC(0..3)_DLL_CTL2[DLL_BRINGUP] must not change after this point
 | |
| 	 * without restarting the LMCn DRESET initialization sequence.
 | |
| 	 */
 | |
| 
 | |
| 	dll_ctl2.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL2(if_num));
 | |
| 	dll_ctl2.cn78xx.dll_bringup = 0;
 | |
| 	lmc_wr(priv, CVMX_LMCX_DLL_CTL2(if_num), dll_ctl2.u64);
 | |
| 
 | |
| 	/*
 | |
| 	 * 9. Read LMC(0..3)_DLL_CTL2 and wait for the result.
 | |
| 	 */
 | |
| 
 | |
| 	lmc_rd(priv, CVMX_LMCX_DLL_CTL2(if_num));
 | |
| 
 | |
| 	/*
 | |
| 	 * 10. Without changing any other fields in LMC(0..3)_DLL_CTL2, write
 | |
| 	 * LMC(0..3)_DLL_CTL2[DRESET] = 0.
 | |
| 	 * LMC(0..3)_DLL_CTL2[DRESET] must not change after this point without
 | |
| 	 * restarting the LMCn DRESET initialization sequence.
 | |
| 	 *
 | |
| 	 * After completing LMCn DRESET initialization, all LMC CSRs may be
 | |
| 	 * accessed.  Prior to completing LMC DRESET initialization, only
 | |
| 	 * LMC(0..3)_DDR_PLL_CTL, LMC(0..3)_DLL_CTL2, LMC(0..3)_RESET_CTL, and
 | |
| 	 * LMC(0..3)_COMP_CTL2 LMC CSRs can be accessed.
 | |
| 	 */
 | |
| 
 | |
| 	dll_ctl2.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL2(if_num));
 | |
| 	dll_ctl2.cn78xx.dreset = 0;
 | |
| 	lmc_wr(priv, CVMX_LMCX_DLL_CTL2(if_num), dll_ctl2.u64);
 | |
| }
 | |
| 
 | |
| int initialize_ddr_clock(struct ddr_priv *priv, struct ddr_conf *ddr_conf,
 | |
| 			 u32 cpu_hertz, u32 ddr_hertz, u32 ddr_ref_hertz,
 | |
| 			 int if_num, u32 if_mask)
 | |
| {
 | |
| 	char *s;
 | |
| 
 | |
| 	if (ddr_clock_initialized(priv, if_num))
 | |
| 		return 0;
 | |
| 
 | |
| 	if (!ddr_clock_initialized(priv, 0)) {	/* Do this once */
 | |
| 		union cvmx_lmcx_reset_ctl reset_ctl;
 | |
| 		int i;
 | |
| 
 | |
| 		/*
 | |
| 		 * Check to see if memory is to be preserved and set global
 | |
| 		 * flag
 | |
| 		 */
 | |
| 		for (i = 3; i >= 0; --i) {
 | |
| 			if ((if_mask & (1 << i)) == 0)
 | |
| 				continue;
 | |
| 
 | |
| 			reset_ctl.u64 = lmc_rd(priv, CVMX_LMCX_RESET_CTL(i));
 | |
| 			if (reset_ctl.s.ddr3psv == 1) {
 | |
| 				debug("LMC%d Preserving memory\n", i);
 | |
| 				set_ddr_memory_preserved(priv);
 | |
| 
 | |
| 				/* Re-initialize flags */
 | |
| 				reset_ctl.s.ddr3pwarm = 0;
 | |
| 				reset_ctl.s.ddr3psoft = 0;
 | |
| 				reset_ctl.s.ddr3psv = 0;
 | |
| 				lmc_wr(priv, CVMX_LMCX_RESET_CTL(i),
 | |
| 				       reset_ctl.u64);
 | |
| 			}
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * ToDo: Add support for these SoCs:
 | |
| 	 *
 | |
| 	 * if (octeon_is_cpuid(OCTEON_CN63XX) ||
 | |
| 	 * octeon_is_cpuid(OCTEON_CN66XX) ||
 | |
| 	 * octeon_is_cpuid(OCTEON_CN61XX) || octeon_is_cpuid(OCTEON_CNF71XX))
 | |
| 	 *
 | |
| 	 * and
 | |
| 	 *
 | |
| 	 * if (octeon_is_cpuid(OCTEON_CN68XX))
 | |
| 	 *
 | |
| 	 * and
 | |
| 	 *
 | |
| 	 * if (octeon_is_cpuid(OCTEON_CN70XX))
 | |
| 	 *
 | |
| 	 */
 | |
| 
 | |
| 	if (octeon_is_cpuid(OCTEON_CN78XX) || octeon_is_cpuid(OCTEON_CN73XX) ||
 | |
| 	    octeon_is_cpuid(OCTEON_CNF75XX)) {
 | |
| 		union cvmx_lmcx_dll_ctl2 dll_ctl2;
 | |
| 		union cvmx_lmcx_dll_ctl3 ddr_dll_ctl3;
 | |
| 		union cvmx_lmcx_ddr_pll_ctl ddr_pll_ctl;
 | |
| 		struct dimm_config *dimm_config_table =
 | |
| 			ddr_conf->dimm_config_table;
 | |
| 		int en_idx, save_en_idx, best_en_idx = 0;
 | |
| 		u64 clkf, clkr, max_clkf = 127;
 | |
| 		u64 best_clkf = 0, best_clkr = 0;
 | |
| 		u64 best_pll_MHz = 0;
 | |
| 		u64 pll_MHz;
 | |
| 		u64 min_pll_MHz = 800;
 | |
| 		u64 max_pll_MHz = 5000;
 | |
| 		u64 error;
 | |
| 		u64 best_error;
 | |
| 		u64 best_calculated_ddr_hertz = 0;
 | |
| 		u64 calculated_ddr_hertz = 0;
 | |
| 		u64 orig_ddr_hertz = ddr_hertz;
 | |
| 		const int _en[] = { 1, 2, 3, 4, 5, 6, 7, 8, 10, 12 };
 | |
| 		int override_pll_settings;
 | |
| 		int new_bwadj;
 | |
| 		int ddr_type;
 | |
| 		int i;
 | |
| 
 | |
| 		/* ddr_type only indicates DDR4 or DDR3 */
 | |
| 		ddr_type = (read_spd(&dimm_config_table[0], 0,
 | |
| 				     DDR4_SPD_KEY_BYTE_DEVICE_TYPE) ==
 | |
| 			    0x0C) ? DDR4_DRAM : DDR3_DRAM;
 | |
| 
 | |
| 		/*
 | |
| 		 * 5.9 LMC Initialization Sequence
 | |
| 		 *
 | |
| 		 * There are 13 parts to the LMC initialization procedure:
 | |
| 		 *
 | |
| 		 * 1. DDR PLL initialization
 | |
| 		 *
 | |
| 		 * 2. LMC CK initialization
 | |
| 		 *
 | |
| 		 * 3. LMC interface enable initialization
 | |
| 		 *
 | |
| 		 * 4. LMC DRESET initialization
 | |
| 		 *
 | |
| 		 * 5. LMC CK local initialization
 | |
| 		 *
 | |
| 		 * 6. LMC RESET initialization
 | |
| 		 *
 | |
| 		 * 7. Early LMC initialization
 | |
| 		 *
 | |
| 		 * 8. LMC offset training
 | |
| 		 *
 | |
| 		 * 9. LMC internal Vref training
 | |
| 		 *
 | |
| 		 * 10. LMC deskew training
 | |
| 		 *
 | |
| 		 * 11. LMC write leveling
 | |
| 		 *
 | |
| 		 * 12. LMC read leveling
 | |
| 		 *
 | |
| 		 * 13. Final LMC initialization
 | |
| 		 *
 | |
| 		 * CN78XX supports two modes:
 | |
| 		 *
 | |
| 		 * - two-LMC mode: both LMCs 2/3 must not be enabled
 | |
| 		 * (LMC2/3_DLL_CTL2[DRESET] must be set to 1 and
 | |
| 		 * LMC2/3_DLL_CTL2[INTF_EN]
 | |
| 		 * must be set to 0) and both LMCs 0/1 must be enabled).
 | |
| 		 *
 | |
| 		 * - four-LMC mode: all four LMCs 0..3 must be enabled.
 | |
| 		 *
 | |
| 		 * Steps 4 and 6..13 should each be performed for each
 | |
| 		 * enabled LMC (either twice or four times). Steps 1..3 and
 | |
| 		 * 5 are more global in nature and each must be executed
 | |
| 		 * exactly once (not once per LMC) each time the DDR PLL
 | |
| 		 * changes or is first brought up. Steps 1..3 and 5 need
 | |
| 		 * not be performed if the DDR PLL is stable.
 | |
| 		 *
 | |
| 		 * Generally, the steps are performed in order. The exception
 | |
| 		 * is that the CK local initialization (step 5) must be
 | |
| 		 * performed after some DRESET initializations (step 4) and
 | |
| 		 * before other DRESET initializations when the DDR PLL is
 | |
| 		 * brought up or changed. (The CK local initialization uses
 | |
| 		 * information from some LMCs to bring up the other local
 | |
| 		 * CKs.) The following text describes these ordering
 | |
| 		 * requirements in more detail.
 | |
| 		 *
 | |
| 		 * Following any chip reset, the DDR PLL must be brought up,
 | |
| 		 * and all 13 steps should be executed. Subsequently, it is
 | |
| 		 * possible to execute only steps 4 and 6..13, or to execute
 | |
| 		 * only steps 8..13.
 | |
| 		 *
 | |
| 		 * The remainder of this section covers these initialization
 | |
| 		 * steps in sequence.
 | |
| 		 */
 | |
| 
 | |
| 		/* Do the following init only once */
 | |
| 		if (if_num != 0)
 | |
| 			goto not_if0;
 | |
| 
 | |
| 		/* Only for interface #0 ... */
 | |
| 
 | |
| 		/*
 | |
| 		 * 5.9.3 LMC Interface-Enable Initialization
 | |
| 		 *
 | |
| 		 * LMC interface-enable initialization (Step 3) must be#
 | |
| 		 * performed after Step 2 for each chip reset and whenever
 | |
| 		 * the DDR clock speed changes. This step needs to be
 | |
| 		 * performed only once, not once per LMC. Perform the
 | |
| 		 * following three substeps for the LMC interface-enable
 | |
| 		 * initialization:
 | |
| 		 *
 | |
| 		 * 1. Without changing any other LMC2_DLL_CTL2 fields
 | |
| 		 * (LMC(0..3)_DLL_CTL2 should be at their reset values after
 | |
| 		 * Step 1), write LMC2_DLL_CTL2[INTF_EN] = 1 if four-LMC
 | |
| 		 * mode is desired.
 | |
| 		 *
 | |
| 		 * 2. Without changing any other LMC3_DLL_CTL2 fields, write
 | |
| 		 * LMC3_DLL_CTL2[INTF_EN] = 1 if four-LMC mode is desired.
 | |
| 		 *
 | |
| 		 * 3. Read LMC2_DLL_CTL2 and wait for the result.
 | |
| 		 *
 | |
| 		 * The LMC2_DLL_CTL2[INTF_EN] and LMC3_DLL_CTL2[INTF_EN]
 | |
| 		 * values should not be changed by software from this point.
 | |
| 		 */
 | |
| 
 | |
| 		for (i = 0; i < 4; ++i) {
 | |
| 			if ((if_mask & (1 << i)) == 0)
 | |
| 				continue;
 | |
| 
 | |
| 			dll_ctl2.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL2(i));
 | |
| 
 | |
| 			dll_ctl2.cn78xx.byp_setting = 0;
 | |
| 			dll_ctl2.cn78xx.byp_sel = 0;
 | |
| 			dll_ctl2.cn78xx.quad_dll_ena = 0;
 | |
| 			dll_ctl2.cn78xx.dreset = 1;
 | |
| 			dll_ctl2.cn78xx.dll_bringup = 0;
 | |
| 			dll_ctl2.cn78xx.intf_en = 0;
 | |
| 
 | |
| 			lmc_wr(priv, CVMX_LMCX_DLL_CTL2(i), dll_ctl2.u64);
 | |
| 		}
 | |
| 
 | |
| 		/*
 | |
| 		 * ###### Interface enable (intf_en) deferred until after
 | |
| 		 * DDR_DIV_RESET=0 #######
 | |
| 		 */
 | |
| 
 | |
| 		/*
 | |
| 		 * 5.9.1 DDR PLL Initialization
 | |
| 		 *
 | |
| 		 * DDR PLL initialization (Step 1) must be performed for each
 | |
| 		 * chip reset and whenever the DDR clock speed changes. This
 | |
| 		 * step needs to be performed only once, not once per LMC.
 | |
| 		 *
 | |
| 		 * Perform the following eight substeps to initialize the
 | |
| 		 * DDR PLL:
 | |
| 		 *
 | |
| 		 * 1. If not done already, write all fields in
 | |
| 		 * LMC(0..3)_DDR_PLL_CTL and
 | |
| 		 * LMC(0..1)_DLL_CTL2 to their reset values, including:
 | |
| 		 *
 | |
| 		 * .. LMC0_DDR_PLL_CTL[DDR_DIV_RESET] = 1
 | |
| 		 * .. LMC0_DLL_CTL2[DRESET] = 1
 | |
| 		 *
 | |
| 		 * This substep is not necessary after a chip reset.
 | |
| 		 *
 | |
| 		 */
 | |
| 
 | |
| 		ddr_pll_ctl.u64 = lmc_rd(priv, CVMX_LMCX_DDR_PLL_CTL(0));
 | |
| 
 | |
| 		ddr_pll_ctl.cn78xx.reset_n = 0;
 | |
| 		ddr_pll_ctl.cn78xx.ddr_div_reset = 1;
 | |
| 		ddr_pll_ctl.cn78xx.phy_dcok = 0;
 | |
| 
 | |
| 		/*
 | |
| 		 * 73XX pass 1.3 has LMC0 DCLK_INVERT tied to 1; earlier
 | |
| 		 * 73xx passes are tied to 0
 | |
| 		 *
 | |
| 		 * 75XX needs LMC0 DCLK_INVERT set to 1 to minimize duty
 | |
| 		 * cycle falling points
 | |
| 		 *
 | |
| 		 * and we default all other chips LMC0 to DCLK_INVERT=0
 | |
| 		 */
 | |
| 		ddr_pll_ctl.cn78xx.dclk_invert =
 | |
| 		    !!(octeon_is_cpuid(OCTEON_CN73XX_PASS1_3) ||
 | |
| 		       octeon_is_cpuid(OCTEON_CNF75XX));
 | |
| 
 | |
| 		/*
 | |
| 		 * allow override of LMC0 desired setting for DCLK_INVERT,
 | |
| 		 * but not on 73XX;
 | |
| 		 * we cannot change LMC0 DCLK_INVERT on 73XX any pass
 | |
| 		 */
 | |
| 		if (!(octeon_is_cpuid(OCTEON_CN73XX))) {
 | |
| 			s = lookup_env(priv, "ddr0_set_dclk_invert");
 | |
| 			if (s) {
 | |
| 				ddr_pll_ctl.cn78xx.dclk_invert =
 | |
| 				    !!simple_strtoul(s, NULL, 0);
 | |
| 				debug("LMC0: override DDR_PLL_CTL[dclk_invert] to %d\n",
 | |
| 				      ddr_pll_ctl.cn78xx.dclk_invert);
 | |
| 			}
 | |
| 		}
 | |
| 
 | |
| 		lmc_wr(priv, CVMX_LMCX_DDR_PLL_CTL(0), ddr_pll_ctl.u64);
 | |
| 		debug("%-45s : 0x%016llx\n", "LMC0: DDR_PLL_CTL",
 | |
| 		      ddr_pll_ctl.u64);
 | |
| 
 | |
| 		// only when LMC1 is active
 | |
| 		if (if_mask & 0x2) {
 | |
| 			/*
 | |
| 			 * For CNF75XX, both LMC0 and LMC1 use the same PLL,
 | |
| 			 * so we use the LMC0 setting of DCLK_INVERT for LMC1.
 | |
| 			 */
 | |
| 			if (!octeon_is_cpuid(OCTEON_CNF75XX)) {
 | |
| 				int override = 0;
 | |
| 
 | |
| 				/*
 | |
| 				 * by default, for non-CNF75XX, we want
 | |
| 				 * LMC1 toggled LMC0
 | |
| 				 */
 | |
| 				int lmc0_dclk_invert =
 | |
| 				    ddr_pll_ctl.cn78xx.dclk_invert;
 | |
| 
 | |
| 				/*
 | |
| 				 * FIXME: work-around for DDR3 UDIMM problems
 | |
| 				 * is to use LMC0 setting on LMC1 and if
 | |
| 				 * 73xx pass 1.3, we want to default LMC1
 | |
| 				 * DCLK_INVERT to LMC0, not the invert of LMC0
 | |
| 				 */
 | |
| 				int lmc1_dclk_invert;
 | |
| 
 | |
| 				lmc1_dclk_invert =
 | |
| 					((ddr_type == DDR4_DRAM) &&
 | |
| 					 !octeon_is_cpuid(OCTEON_CN73XX_PASS1_3))
 | |
| 					? lmc0_dclk_invert ^ 1 :
 | |
| 					lmc0_dclk_invert;
 | |
| 
 | |
| 				/*
 | |
| 				 * allow override of LMC1 desired setting for
 | |
| 				 * DCLK_INVERT
 | |
| 				 */
 | |
| 				s = lookup_env(priv, "ddr1_set_dclk_invert");
 | |
| 				if (s) {
 | |
| 					lmc1_dclk_invert =
 | |
| 						!!simple_strtoul(s, NULL, 0);
 | |
| 					override = 1;
 | |
| 				}
 | |
| 				debug("LMC1: %s DDR_PLL_CTL[dclk_invert] to %d (LMC0 %d)\n",
 | |
| 				      (override) ? "override" :
 | |
| 				      "default", lmc1_dclk_invert,
 | |
| 				      lmc0_dclk_invert);
 | |
| 
 | |
| 				ddr_pll_ctl.cn78xx.dclk_invert =
 | |
| 					lmc1_dclk_invert;
 | |
| 			}
 | |
| 
 | |
| 			// but always write LMC1 CSR if it is active
 | |
| 			lmc_wr(priv, CVMX_LMCX_DDR_PLL_CTL(1), ddr_pll_ctl.u64);
 | |
| 			debug("%-45s : 0x%016llx\n",
 | |
| 			      "LMC1: DDR_PLL_CTL", ddr_pll_ctl.u64);
 | |
| 		}
 | |
| 
 | |
| 		/*
 | |
| 		 * 2. If the current DRAM contents are not preserved (see
 | |
| 		 * LMC(0..3)_RESET_ CTL[DDR3PSV]), this is also an appropriate
 | |
| 		 * time to assert the RESET# pin of the DDR3/DDR4 DRAM parts.
 | |
| 		 * If desired, write
 | |
| 		 * LMC0_RESET_ CTL[DDR3RST] = 0 without modifying any other
 | |
| 		 * LMC0_RESET_CTL fields to assert the DDR_RESET_L pin.
 | |
| 		 * No action is required here to assert DDR_RESET_L
 | |
| 		 * following a chip reset. Refer to Section 5.9.6. Do this
 | |
| 		 * for all enabled LMCs.
 | |
| 		 */
 | |
| 
 | |
| 		for (i = 0; (!ddr_memory_preserved(priv)) && i < 4; ++i) {
 | |
| 			union cvmx_lmcx_reset_ctl reset_ctl;
 | |
| 
 | |
| 			if ((if_mask & (1 << i)) == 0)
 | |
| 				continue;
 | |
| 
 | |
| 			reset_ctl.u64 = lmc_rd(priv, CVMX_LMCX_RESET_CTL(i));
 | |
| 			reset_ctl.cn78xx.ddr3rst = 0;	/* Reset asserted */
 | |
| 			debug("LMC%d Asserting DDR_RESET_L\n", i);
 | |
| 			lmc_wr(priv, CVMX_LMCX_RESET_CTL(i), reset_ctl.u64);
 | |
| 			lmc_rd(priv, CVMX_LMCX_RESET_CTL(i));
 | |
| 		}
 | |
| 
 | |
| 		/*
 | |
| 		 * 3. Without changing any other LMC0_DDR_PLL_CTL values,
 | |
| 		 * write LMC0_DDR_PLL_CTL[CLKF] with a value that gives a
 | |
| 		 * desired DDR PLL speed. The LMC0_DDR_PLL_CTL[CLKF] value
 | |
| 		 * should be selected in conjunction with the post-scalar
 | |
| 		 * divider values for LMC (LMC0_DDR_PLL_CTL[DDR_PS_EN]) so
 | |
| 		 * that the desired LMC CK speeds are is produced (all
 | |
| 		 * enabled LMCs must run the same speed). Section 5.14
 | |
| 		 * describes LMC0_DDR_PLL_CTL[CLKF] and
 | |
| 		 * LMC0_DDR_PLL_CTL[DDR_PS_EN] programmings that produce
 | |
| 		 * the desired LMC CK speed. Section 5.9.2 describes LMC CK
 | |
| 		 * initialization, which can be done separately from the DDR
 | |
| 		 * PLL initialization described in this section.
 | |
| 		 *
 | |
| 		 * The LMC0_DDR_PLL_CTL[CLKF] value must not change after
 | |
| 		 * this point without restarting this SDRAM PLL
 | |
| 		 * initialization sequence.
 | |
| 		 */
 | |
| 
 | |
| 		/* Init to max error */
 | |
| 		error = ddr_hertz;
 | |
| 		best_error = ddr_hertz;
 | |
| 
 | |
| 		debug("DDR Reference Hertz = %d\n", ddr_ref_hertz);
 | |
| 
 | |
| 		while (best_error == ddr_hertz) {
 | |
| 			for (clkr = 0; clkr < 4; ++clkr) {
 | |
| 				for (en_idx =
 | |
| 				     sizeof(_en) / sizeof(int) -
 | |
| 				     1; en_idx >= 0; --en_idx) {
 | |
| 					save_en_idx = en_idx;
 | |
| 					clkf =
 | |
| 					    ((ddr_hertz) *
 | |
| 					     (clkr + 1) * (_en[save_en_idx]));
 | |
| 					clkf = divide_nint(clkf, ddr_ref_hertz)
 | |
| 					    - 1;
 | |
| 					pll_MHz =
 | |
| 					    ddr_ref_hertz *
 | |
| 					    (clkf + 1) / (clkr + 1) / 1000000;
 | |
| 					calculated_ddr_hertz =
 | |
| 					    ddr_ref_hertz *
 | |
| 					    (clkf +
 | |
| 					     1) / ((clkr +
 | |
| 						    1) * (_en[save_en_idx]));
 | |
| 					error =
 | |
| 					    ddr_hertz - calculated_ddr_hertz;
 | |
| 
 | |
| 					if (pll_MHz < min_pll_MHz ||
 | |
| 					    pll_MHz > max_pll_MHz)
 | |
| 						continue;
 | |
| 					if (clkf > max_clkf) {
 | |
| 						/*
 | |
| 						 * PLL requires clkf to be
 | |
| 						 * limited
 | |
| 						 */
 | |
| 						continue;
 | |
| 					}
 | |
| 					if (abs(error) > abs(best_error))
 | |
| 						continue;
 | |
| 
 | |
| 					debug("clkr: %2llu, en[%d]: %2d, clkf: %4llu, pll_MHz: %4llu, ddr_hertz: %8llu, error: %8lld\n",
 | |
| 					      clkr, save_en_idx,
 | |
| 					      _en[save_en_idx], clkf, pll_MHz,
 | |
| 					     calculated_ddr_hertz, error);
 | |
| 
 | |
| 					/* Favor the highest PLL frequency. */
 | |
| 					if (abs(error) < abs(best_error) ||
 | |
| 					    pll_MHz > best_pll_MHz) {
 | |
| 						best_pll_MHz = pll_MHz;
 | |
| 						best_calculated_ddr_hertz =
 | |
| 							calculated_ddr_hertz;
 | |
| 						best_error = error;
 | |
| 						best_clkr = clkr;
 | |
| 						best_clkf = clkf;
 | |
| 						best_en_idx = save_en_idx;
 | |
| 					}
 | |
| 				}
 | |
| 			}
 | |
| 
 | |
| 			override_pll_settings = 0;
 | |
| 
 | |
| 			s = lookup_env(priv, "ddr_pll_clkr");
 | |
| 			if (s) {
 | |
| 				best_clkr = simple_strtoul(s, NULL, 0);
 | |
| 				override_pll_settings = 1;
 | |
| 			}
 | |
| 
 | |
| 			s = lookup_env(priv, "ddr_pll_clkf");
 | |
| 			if (s) {
 | |
| 				best_clkf = simple_strtoul(s, NULL, 0);
 | |
| 				override_pll_settings = 1;
 | |
| 			}
 | |
| 
 | |
| 			s = lookup_env(priv, "ddr_pll_en_idx");
 | |
| 			if (s) {
 | |
| 				best_en_idx = simple_strtoul(s, NULL, 0);
 | |
| 				override_pll_settings = 1;
 | |
| 			}
 | |
| 
 | |
| 			if (override_pll_settings) {
 | |
| 				best_pll_MHz =
 | |
| 				    ddr_ref_hertz * (best_clkf +
 | |
| 						     1) /
 | |
| 				    (best_clkr + 1) / 1000000;
 | |
| 				best_calculated_ddr_hertz =
 | |
| 				    ddr_ref_hertz * (best_clkf +
 | |
| 						     1) /
 | |
| 				    ((best_clkr + 1) * (_en[best_en_idx]));
 | |
| 				best_error =
 | |
| 				    ddr_hertz - best_calculated_ddr_hertz;
 | |
| 			}
 | |
| 
 | |
| 			debug("clkr: %2llu, en[%d]: %2d, clkf: %4llu, pll_MHz: %4llu, ddr_hertz: %8llu, error: %8lld <==\n",
 | |
| 			      best_clkr, best_en_idx, _en[best_en_idx],
 | |
| 			      best_clkf, best_pll_MHz,
 | |
| 			      best_calculated_ddr_hertz, best_error);
 | |
| 
 | |
| 			/*
 | |
| 			 * Try lowering the frequency if we can't get a
 | |
| 			 * working configuration
 | |
| 			 */
 | |
| 			if (best_error == ddr_hertz) {
 | |
| 				if (ddr_hertz < orig_ddr_hertz - 10000000)
 | |
| 					break;
 | |
| 				ddr_hertz -= 1000000;
 | |
| 				best_error = ddr_hertz;
 | |
| 			}
 | |
| 		}
 | |
| 
 | |
| 		if (best_error == ddr_hertz) {
 | |
| 			printf("ERROR: Can not compute a legal DDR clock speed configuration.\n");
 | |
| 			return -1;
 | |
| 		}
 | |
| 
 | |
| 		new_bwadj = (best_clkf + 1) / 10;
 | |
| 		debug("bwadj: %2d\n", new_bwadj);
 | |
| 
 | |
| 		s = lookup_env(priv, "ddr_pll_bwadj");
 | |
| 		if (s) {
 | |
| 			new_bwadj = strtoul(s, NULL, 0);
 | |
| 			debug("bwadj: %2d\n", new_bwadj);
 | |
| 		}
 | |
| 
 | |
| 		for (i = 0; i < 2; ++i) {
 | |
| 			if ((if_mask & (1 << i)) == 0)
 | |
| 				continue;
 | |
| 
 | |
| 			ddr_pll_ctl.u64 =
 | |
| 			    lmc_rd(priv, CVMX_LMCX_DDR_PLL_CTL(i));
 | |
| 			debug("LMC%d: DDR_PLL_CTL                             : 0x%016llx\n",
 | |
| 			      i, ddr_pll_ctl.u64);
 | |
| 
 | |
| 			ddr_pll_ctl.cn78xx.ddr_ps_en = best_en_idx;
 | |
| 			ddr_pll_ctl.cn78xx.clkf = best_clkf;
 | |
| 			ddr_pll_ctl.cn78xx.clkr = best_clkr;
 | |
| 			ddr_pll_ctl.cn78xx.reset_n = 0;
 | |
| 			ddr_pll_ctl.cn78xx.bwadj = new_bwadj;
 | |
| 
 | |
| 			lmc_wr(priv, CVMX_LMCX_DDR_PLL_CTL(i), ddr_pll_ctl.u64);
 | |
| 			debug("LMC%d: DDR_PLL_CTL                             : 0x%016llx\n",
 | |
| 			      i, ddr_pll_ctl.u64);
 | |
| 
 | |
| 			/*
 | |
| 			 * For cnf75xx LMC0 and LMC1 use the same PLL so
 | |
| 			 * only program LMC0 PLL.
 | |
| 			 */
 | |
| 			if (octeon_is_cpuid(OCTEON_CNF75XX))
 | |
| 				break;
 | |
| 		}
 | |
| 
 | |
| 		for (i = 0; i < 4; ++i) {
 | |
| 			if ((if_mask & (1 << i)) == 0)
 | |
| 				continue;
 | |
| 
 | |
| 			/*
 | |
| 			 * 4. Read LMC0_DDR_PLL_CTL and wait for the result.
 | |
| 			 */
 | |
| 
 | |
| 			lmc_rd(priv, CVMX_LMCX_DDR_PLL_CTL(i));
 | |
| 
 | |
| 			/*
 | |
| 			 * 5. Wait a minimum of 3 us.
 | |
| 			 */
 | |
| 
 | |
| 			udelay(3);	/* Wait 3 us */
 | |
| 
 | |
| 			/*
 | |
| 			 * 6. Write LMC0_DDR_PLL_CTL[RESET_N] = 1 without
 | |
| 			 * changing any other LMC0_DDR_PLL_CTL values.
 | |
| 			 */
 | |
| 
 | |
| 			ddr_pll_ctl.u64 =
 | |
| 			    lmc_rd(priv, CVMX_LMCX_DDR_PLL_CTL(i));
 | |
| 			ddr_pll_ctl.cn78xx.reset_n = 1;
 | |
| 			lmc_wr(priv, CVMX_LMCX_DDR_PLL_CTL(i), ddr_pll_ctl.u64);
 | |
| 
 | |
| 			/*
 | |
| 			 * 7. Read LMC0_DDR_PLL_CTL and wait for the result.
 | |
| 			 */
 | |
| 
 | |
| 			lmc_rd(priv, CVMX_LMCX_DDR_PLL_CTL(i));
 | |
| 
 | |
| 			/*
 | |
| 			 * 8. Wait a minimum of 25 us.
 | |
| 			 */
 | |
| 
 | |
| 			udelay(25);	/* Wait 25 us */
 | |
| 
 | |
| 			/*
 | |
| 			 * For cnf75xx LMC0 and LMC1 use the same PLL so
 | |
| 			 * only program LMC0 PLL.
 | |
| 			 */
 | |
| 			if (octeon_is_cpuid(OCTEON_CNF75XX))
 | |
| 				break;
 | |
| 		}
 | |
| 
 | |
| 		for (i = 0; i < 4; ++i) {
 | |
| 			if ((if_mask & (1 << i)) == 0)
 | |
| 				continue;
 | |
| 
 | |
| 			/*
 | |
| 			 * 5.9.2 LMC CK Initialization
 | |
| 			 *
 | |
| 			 * DDR PLL initialization must be completed prior to
 | |
| 			 * starting LMC CK initialization.
 | |
| 			 *
 | |
| 			 * Perform the following substeps to initialize the
 | |
| 			 * LMC CK:
 | |
| 			 *
 | |
| 			 * 1. Without changing any other LMC(0..3)_DDR_PLL_CTL
 | |
| 			 * values, write
 | |
| 			 * LMC(0..3)_DDR_PLL_CTL[DDR_DIV_RESET] = 1 and
 | |
| 			 * LMC(0..3)_DDR_PLL_CTL[DDR_PS_EN] with the
 | |
| 			 * appropriate value to get the desired LMC CK speed.
 | |
| 			 * Section 5.14 discusses CLKF and DDR_PS_EN
 | |
| 			 * programmings.  The LMC(0..3)_DDR_PLL_CTL[DDR_PS_EN]
 | |
| 			 * must not change after this point without restarting
 | |
| 			 * this LMC CK initialization sequence.
 | |
| 			 */
 | |
| 
 | |
| 			ddr_pll_ctl.u64 = lmc_rd(priv,
 | |
| 						 CVMX_LMCX_DDR_PLL_CTL(i));
 | |
| 			ddr_pll_ctl.cn78xx.ddr_div_reset = 1;
 | |
| 			lmc_wr(priv, CVMX_LMCX_DDR_PLL_CTL(i), ddr_pll_ctl.u64);
 | |
| 
 | |
| 			/*
 | |
| 			 * 2. Without changing any other fields in
 | |
| 			 * LMC(0..3)_DDR_PLL_CTL, write
 | |
| 			 * LMC(0..3)_DDR_PLL_CTL[DDR4_MODE] = 0.
 | |
| 			 */
 | |
| 
 | |
| 			ddr_pll_ctl.u64 =
 | |
| 			    lmc_rd(priv, CVMX_LMCX_DDR_PLL_CTL(i));
 | |
| 			ddr_pll_ctl.cn78xx.ddr4_mode =
 | |
| 			    (ddr_type == DDR4_DRAM) ? 1 : 0;
 | |
| 			lmc_wr(priv, CVMX_LMCX_DDR_PLL_CTL(i), ddr_pll_ctl.u64);
 | |
| 
 | |
| 			/*
 | |
| 			 * 3. Read LMC(0..3)_DDR_PLL_CTL and wait for the
 | |
| 			 * result.
 | |
| 			 */
 | |
| 
 | |
| 			lmc_rd(priv, CVMX_LMCX_DDR_PLL_CTL(i));
 | |
| 
 | |
| 			/*
 | |
| 			 * 4. Wait a minimum of 1 us.
 | |
| 			 */
 | |
| 
 | |
| 			udelay(1);	/* Wait 1 us */
 | |
| 
 | |
| 			/*
 | |
| 			 * ###### Steps 5 through 7 deferred until after
 | |
| 			 * DDR_DIV_RESET=0 #######
 | |
| 			 */
 | |
| 
 | |
| 			/*
 | |
| 			 * 8. Without changing any other LMC(0..3)_COMP_CTL2
 | |
| 			 * values, write
 | |
| 			 * LMC(0..3)_COMP_CTL2[CK_CTL,CONTROL_CTL,CMD_CTL]
 | |
| 			 * to the desired DDR*_CK_*_P control and command
 | |
| 			 * signals drive strength.
 | |
| 			 */
 | |
| 
 | |
| 			union cvmx_lmcx_comp_ctl2 comp_ctl2;
 | |
| 			const struct ddr3_custom_config *custom_lmc_config =
 | |
| 			    &ddr_conf->custom_lmc_config;
 | |
| 
 | |
| 			comp_ctl2.u64 = lmc_rd(priv, CVMX_LMCX_COMP_CTL2(i));
 | |
| 
 | |
| 			/* Default 4=34.3 ohm */
 | |
| 			comp_ctl2.cn78xx.dqx_ctl =
 | |
| 			    (custom_lmc_config->dqx_ctl ==
 | |
| 			     0) ? 4 : custom_lmc_config->dqx_ctl;
 | |
| 			/* Default 4=34.3 ohm */
 | |
| 			comp_ctl2.cn78xx.ck_ctl =
 | |
| 			    (custom_lmc_config->ck_ctl ==
 | |
| 			     0) ? 4 : custom_lmc_config->ck_ctl;
 | |
| 			/* Default 4=34.3 ohm */
 | |
| 			comp_ctl2.cn78xx.cmd_ctl =
 | |
| 			    (custom_lmc_config->cmd_ctl ==
 | |
| 			     0) ? 4 : custom_lmc_config->cmd_ctl;
 | |
| 
 | |
| 			comp_ctl2.cn78xx.rodt_ctl = 0x4;	/* 60 ohm */
 | |
| 
 | |
| 			comp_ctl2.cn70xx.ptune_offset =
 | |
| 			    (abs(custom_lmc_config->ptune_offset) & 0x7)
 | |
| 			    | (_sign(custom_lmc_config->ptune_offset) << 3);
 | |
| 			comp_ctl2.cn70xx.ntune_offset =
 | |
| 			    (abs(custom_lmc_config->ntune_offset) & 0x7)
 | |
| 			    | (_sign(custom_lmc_config->ntune_offset) << 3);
 | |
| 
 | |
| 			s = lookup_env(priv, "ddr_clk_ctl");
 | |
| 			if (s) {
 | |
| 				comp_ctl2.cn78xx.ck_ctl =
 | |
| 				    simple_strtoul(s, NULL, 0);
 | |
| 			}
 | |
| 
 | |
| 			s = lookup_env(priv, "ddr_ck_ctl");
 | |
| 			if (s) {
 | |
| 				comp_ctl2.cn78xx.ck_ctl =
 | |
| 				    simple_strtoul(s, NULL, 0);
 | |
| 			}
 | |
| 
 | |
| 			s = lookup_env(priv, "ddr_cmd_ctl");
 | |
| 			if (s) {
 | |
| 				comp_ctl2.cn78xx.cmd_ctl =
 | |
| 				    simple_strtoul(s, NULL, 0);
 | |
| 			}
 | |
| 
 | |
| 			s = lookup_env(priv, "ddr_dqx_ctl");
 | |
| 			if (s) {
 | |
| 				comp_ctl2.cn78xx.dqx_ctl =
 | |
| 				    simple_strtoul(s, NULL, 0);
 | |
| 			}
 | |
| 
 | |
| 			s = lookup_env(priv, "ddr_ptune_offset");
 | |
| 			if (s) {
 | |
| 				comp_ctl2.cn78xx.ptune_offset =
 | |
| 				    simple_strtoul(s, NULL, 0);
 | |
| 			}
 | |
| 
 | |
| 			s = lookup_env(priv, "ddr_ntune_offset");
 | |
| 			if (s) {
 | |
| 				comp_ctl2.cn78xx.ntune_offset =
 | |
| 				    simple_strtoul(s, NULL, 0);
 | |
| 			}
 | |
| 
 | |
| 			lmc_wr(priv, CVMX_LMCX_COMP_CTL2(i), comp_ctl2.u64);
 | |
| 
 | |
| 			/*
 | |
| 			 * 9. Read LMC(0..3)_DDR_PLL_CTL and wait for the
 | |
| 			 * result.
 | |
| 			 */
 | |
| 
 | |
| 			lmc_rd(priv, CVMX_LMCX_DDR_PLL_CTL(i));
 | |
| 
 | |
| 			/*
 | |
| 			 * 10. Wait a minimum of 200 ns.
 | |
| 			 */
 | |
| 
 | |
| 			udelay(1);	/* Wait 1 us */
 | |
| 
 | |
| 			/*
 | |
| 			 * 11. Without changing any other
 | |
| 			 * LMC(0..3)_DDR_PLL_CTL values, write
 | |
| 			 * LMC(0..3)_DDR_PLL_CTL[DDR_DIV_RESET] = 0.
 | |
| 			 */
 | |
| 
 | |
| 			ddr_pll_ctl.u64 = lmc_rd(priv,
 | |
| 						 CVMX_LMCX_DDR_PLL_CTL(i));
 | |
| 			ddr_pll_ctl.cn78xx.ddr_div_reset = 0;
 | |
| 			lmc_wr(priv, CVMX_LMCX_DDR_PLL_CTL(i), ddr_pll_ctl.u64);
 | |
| 
 | |
| 			/*
 | |
| 			 * 12. Read LMC(0..3)_DDR_PLL_CTL and wait for the
 | |
| 			 * result.
 | |
| 			 */
 | |
| 
 | |
| 			lmc_rd(priv, CVMX_LMCX_DDR_PLL_CTL(i));
 | |
| 
 | |
| 			/*
 | |
| 			 * 13. Wait a minimum of 200 ns.
 | |
| 			 */
 | |
| 
 | |
| 			udelay(1);	/* Wait 1 us */
 | |
| 		}
 | |
| 
 | |
| 		/*
 | |
| 		 * Relocated Interface Enable (intf_en) Step
 | |
| 		 */
 | |
| 		for (i = (octeon_is_cpuid(OCTEON_CN73XX) ||
 | |
| 			  octeon_is_cpuid(OCTEON_CNF75XX)) ? 1 : 2;
 | |
| 		     i < 4; ++i) {
 | |
| 			/*
 | |
| 			 * This step is only necessary for LMC 2 and 3 in
 | |
| 			 * 4-LMC mode. The mask will cause the unpopulated
 | |
| 			 * interfaces to be skipped.
 | |
| 			 */
 | |
| 			if ((if_mask & (1 << i)) == 0)
 | |
| 				continue;
 | |
| 
 | |
| 			dll_ctl2.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL2(i));
 | |
| 			dll_ctl2.cn78xx.intf_en = 1;
 | |
| 			lmc_wr(priv, CVMX_LMCX_DLL_CTL2(i), dll_ctl2.u64);
 | |
| 			lmc_rd(priv, CVMX_LMCX_DLL_CTL2(i));
 | |
| 		}
 | |
| 
 | |
| 		/*
 | |
| 		 * Relocated PHY_DCOK Step
 | |
| 		 */
 | |
| 		for (i = 0; i < 4; ++i) {
 | |
| 			if ((if_mask & (1 << i)) == 0)
 | |
| 				continue;
 | |
| 			/*
 | |
| 			 * 5. Without changing any other fields in
 | |
| 			 * LMC(0..3)_DDR_PLL_CTL, write
 | |
| 			 * LMC(0..3)_DDR_PLL_CTL[PHY_DCOK] = 1.
 | |
| 			 */
 | |
| 
 | |
| 			ddr_pll_ctl.u64 = lmc_rd(priv,
 | |
| 						 CVMX_LMCX_DDR_PLL_CTL(i));
 | |
| 			ddr_pll_ctl.cn78xx.phy_dcok = 1;
 | |
| 			lmc_wr(priv, CVMX_LMCX_DDR_PLL_CTL(i), ddr_pll_ctl.u64);
 | |
| 			/*
 | |
| 			 * 6. Read LMC(0..3)_DDR_PLL_CTL and wait for
 | |
| 			 * the result.
 | |
| 			 */
 | |
| 
 | |
| 			lmc_rd(priv, CVMX_LMCX_DDR_PLL_CTL(i));
 | |
| 
 | |
| 			/*
 | |
| 			 * 7. Wait a minimum of 20 us.
 | |
| 			 */
 | |
| 
 | |
| 			udelay(20);	/* Wait 20 us */
 | |
| 		}
 | |
| 
 | |
| 		/*
 | |
| 		 * 5.9.4 LMC DRESET Initialization
 | |
| 		 *
 | |
| 		 * All of the DDR PLL, LMC global CK, and LMC interface
 | |
| 		 * enable initializations must be completed prior to starting
 | |
| 		 * this LMC DRESET initialization (Step 4).
 | |
| 		 *
 | |
| 		 * This LMC DRESET step is done for all enabled LMCs.
 | |
| 		 *
 | |
| 		 * There are special constraints on the ordering of DRESET
 | |
| 		 * initialization (Steps 4) and CK local initialization
 | |
| 		 * (Step 5) whenever CK local initialization must be executed.
 | |
| 		 * CK local initialization must be executed whenever the DDR
 | |
| 		 * PLL is being brought up (for each chip reset* and whenever
 | |
| 		 * the DDR clock speed changes).
 | |
| 		 *
 | |
| 		 * When Step 5 must be executed in the two-LMC mode case:
 | |
| 		 * - LMC0 DRESET initialization must occur before Step 5.
 | |
| 		 * - LMC1 DRESET initialization must occur after Step 5.
 | |
| 		 *
 | |
| 		 * When Step 5 must be executed in the four-LMC mode case:
 | |
| 		 * - LMC2 and LMC3 DRESET initialization must occur before
 | |
| 		 *   Step 5.
 | |
| 		 * - LMC0 and LMC1 DRESET initialization must occur after
 | |
| 		 *   Step 5.
 | |
| 		 */
 | |
| 
 | |
| 		if (octeon_is_cpuid(OCTEON_CN73XX)) {
 | |
| 			/* ONE-LMC or TWO-LMC MODE BEFORE STEP 5 for cn73xx */
 | |
| 			cn78xx_lmc_dreset_init(priv, 0);
 | |
| 		} else if (octeon_is_cpuid(OCTEON_CNF75XX)) {
 | |
| 			if (if_mask == 0x3) {
 | |
| 				/*
 | |
| 				 * 2-LMC Mode: LMC1 DRESET must occur
 | |
| 				 * before Step 5
 | |
| 				 */
 | |
| 				cn78xx_lmc_dreset_init(priv, 1);
 | |
| 			}
 | |
| 		} else {
 | |
| 			/* TWO-LMC MODE DRESET BEFORE STEP 5 */
 | |
| 			if (if_mask == 0x3)
 | |
| 				cn78xx_lmc_dreset_init(priv, 0);
 | |
| 
 | |
| 			/* FOUR-LMC MODE BEFORE STEP 5 */
 | |
| 			if (if_mask == 0xf) {
 | |
| 				cn78xx_lmc_dreset_init(priv, 2);
 | |
| 				cn78xx_lmc_dreset_init(priv, 3);
 | |
| 			}
 | |
| 		}
 | |
| 
 | |
| 		/*
 | |
| 		 * 5.9.5 LMC CK Local Initialization
 | |
| 		 *
 | |
| 		 * All of DDR PLL, LMC global CK, and LMC interface-enable
 | |
| 		 * initializations must be completed prior to starting this
 | |
| 		 * LMC CK local initialization (Step 5).
 | |
| 		 *
 | |
| 		 * LMC CK Local initialization must be performed for each
 | |
| 		 * chip reset and whenever the DDR clock speed changes. This
 | |
| 		 * step needs to be performed only once, not once per LMC.
 | |
| 		 *
 | |
| 		 * There are special constraints on the ordering of DRESET
 | |
| 		 * initialization (Steps 4) and CK local initialization
 | |
| 		 * (Step 5) whenever CK local initialization must be executed.
 | |
| 		 * CK local initialization must be executed whenever the
 | |
| 		 * DDR PLL is being brought up (for each chip reset and
 | |
| 		 * whenever the DDR clock speed changes).
 | |
| 		 *
 | |
| 		 * When Step 5 must be executed in the two-LMC mode case:
 | |
| 		 * - LMC0 DRESET initialization must occur before Step 5.
 | |
| 		 * - LMC1 DRESET initialization must occur after Step 5.
 | |
| 		 *
 | |
| 		 * When Step 5 must be executed in the four-LMC mode case:
 | |
| 		 * - LMC2 and LMC3 DRESET initialization must occur before
 | |
| 		 *   Step 5.
 | |
| 		 * - LMC0 and LMC1 DRESET initialization must occur after
 | |
| 		 *   Step 5.
 | |
| 		 *
 | |
| 		 * LMC CK local initialization is different depending on
 | |
| 		 * whether two-LMC or four-LMC modes are desired.
 | |
| 		 */
 | |
| 
 | |
| 		if (if_mask == 0x3) {
 | |
| 			int temp_lmc_if_num = octeon_is_cpuid(OCTEON_CNF75XX) ?
 | |
| 				1 : 0;
 | |
| 
 | |
| 			/*
 | |
| 			 * 5.9.5.1 LMC CK Local Initialization for Two-LMC
 | |
| 			 * Mode
 | |
| 			 *
 | |
| 			 * 1. Write LMC0_DLL_CTL3 to its reset value. (Note
 | |
| 			 * that LMC0_DLL_CTL3[DLL_90_BYTE_SEL] = 0x2 .. 0x8
 | |
| 			 * should also work.)
 | |
| 			 */
 | |
| 
 | |
| 			ddr_dll_ctl3.u64 = 0;
 | |
| 			ddr_dll_ctl3.cn78xx.dclk90_recal_dis = 1;
 | |
| 
 | |
| 			if (octeon_is_cpuid(OCTEON_CNF75XX))
 | |
| 				ddr_dll_ctl3.cn78xx.dll90_byte_sel = 7;
 | |
| 			else
 | |
| 				ddr_dll_ctl3.cn78xx.dll90_byte_sel = 1;
 | |
| 
 | |
| 			lmc_wr(priv,
 | |
| 			       CVMX_LMCX_DLL_CTL3(temp_lmc_if_num),
 | |
| 			       ddr_dll_ctl3.u64);
 | |
| 
 | |
| 			/*
 | |
| 			 * 2. Read LMC0_DLL_CTL3 and wait for the result.
 | |
| 			 */
 | |
| 
 | |
| 			lmc_rd(priv, CVMX_LMCX_DLL_CTL3(temp_lmc_if_num));
 | |
| 
 | |
| 			/*
 | |
| 			 * 3. Without changing any other fields in
 | |
| 			 * LMC0_DLL_CTL3, write
 | |
| 			 * LMC0_DLL_CTL3[DCLK90_FWD] = 1.  Writing
 | |
| 			 * LMC0_DLL_CTL3[DCLK90_FWD] = 1
 | |
| 			 * causes clock-delay information to be forwarded
 | |
| 			 * from LMC0 to LMC1.
 | |
| 			 */
 | |
| 
 | |
| 			ddr_dll_ctl3.cn78xx.dclk90_fwd = 1;
 | |
| 			lmc_wr(priv,
 | |
| 			       CVMX_LMCX_DLL_CTL3(temp_lmc_if_num),
 | |
| 			       ddr_dll_ctl3.u64);
 | |
| 
 | |
| 			/*
 | |
| 			 * 4. Read LMC0_DLL_CTL3 and wait for the result.
 | |
| 			 */
 | |
| 
 | |
| 			lmc_rd(priv, CVMX_LMCX_DLL_CTL3(temp_lmc_if_num));
 | |
| 		}
 | |
| 
 | |
| 		if (if_mask == 0xf) {
 | |
| 			/*
 | |
| 			 * 5.9.5.2 LMC CK Local Initialization for Four-LMC
 | |
| 			 * Mode
 | |
| 			 *
 | |
| 			 * 1. Write LMC2_DLL_CTL3 to its reset value except
 | |
| 			 * LMC2_DLL_CTL3[DLL90_BYTE_SEL] = 0x7.
 | |
| 			 */
 | |
| 
 | |
| 			ddr_dll_ctl3.u64 = 0;
 | |
| 			ddr_dll_ctl3.cn78xx.dclk90_recal_dis = 1;
 | |
| 			ddr_dll_ctl3.cn78xx.dll90_byte_sel = 7;
 | |
| 			lmc_wr(priv, CVMX_LMCX_DLL_CTL3(2), ddr_dll_ctl3.u64);
 | |
| 
 | |
| 			/*
 | |
| 			 * 2. Write LMC3_DLL_CTL3 to its reset value except
 | |
| 			 * LMC3_DLL_CTL3[DLL90_BYTE_SEL] = 0x2.
 | |
| 			 */
 | |
| 
 | |
| 			ddr_dll_ctl3.u64 = 0;
 | |
| 			ddr_dll_ctl3.cn78xx.dclk90_recal_dis = 1;
 | |
| 			ddr_dll_ctl3.cn78xx.dll90_byte_sel = 2;
 | |
| 			lmc_wr(priv, CVMX_LMCX_DLL_CTL3(3), ddr_dll_ctl3.u64);
 | |
| 
 | |
| 			/*
 | |
| 			 * 3. Read LMC3_DLL_CTL3 and wait for the result.
 | |
| 			 */
 | |
| 
 | |
| 			lmc_rd(priv, CVMX_LMCX_DLL_CTL3(3));
 | |
| 
 | |
| 			/*
 | |
| 			 * 4. Without changing any other fields in
 | |
| 			 * LMC2_DLL_CTL3, write LMC2_DLL_CTL3[DCLK90_FWD] = 1
 | |
| 			 * and LMC2_DLL_CTL3[DCLK90_RECAL_ DIS] = 1.
 | |
| 			 * Writing LMC2_DLL_CTL3[DCLK90_FWD] = 1 causes LMC 2
 | |
| 			 * to forward clockdelay information to LMC0. Setting
 | |
| 			 * LMC2_DLL_CTL3[DCLK90_RECAL_DIS] to 1 prevents LMC2
 | |
| 			 * from periodically recalibrating this delay
 | |
| 			 * information.
 | |
| 			 */
 | |
| 
 | |
| 			ddr_dll_ctl3.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL3(2));
 | |
| 			ddr_dll_ctl3.cn78xx.dclk90_fwd = 1;
 | |
| 			ddr_dll_ctl3.cn78xx.dclk90_recal_dis = 1;
 | |
| 			lmc_wr(priv, CVMX_LMCX_DLL_CTL3(2), ddr_dll_ctl3.u64);
 | |
| 
 | |
| 			/*
 | |
| 			 * 5. Without changing any other fields in
 | |
| 			 * LMC3_DLL_CTL3, write LMC3_DLL_CTL3[DCLK90_FWD] = 1
 | |
| 			 * and LMC3_DLL_CTL3[DCLK90_RECAL_ DIS] = 1.
 | |
| 			 * Writing LMC3_DLL_CTL3[DCLK90_FWD] = 1 causes LMC3
 | |
| 			 * to forward clockdelay information to LMC1. Setting
 | |
| 			 * LMC3_DLL_CTL3[DCLK90_RECAL_DIS] to 1 prevents LMC3
 | |
| 			 * from periodically recalibrating this delay
 | |
| 			 * information.
 | |
| 			 */
 | |
| 
 | |
| 			ddr_dll_ctl3.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL3(3));
 | |
| 			ddr_dll_ctl3.cn78xx.dclk90_fwd = 1;
 | |
| 			ddr_dll_ctl3.cn78xx.dclk90_recal_dis = 1;
 | |
| 			lmc_wr(priv, CVMX_LMCX_DLL_CTL3(3), ddr_dll_ctl3.u64);
 | |
| 
 | |
| 			/*
 | |
| 			 * 6. Read LMC3_DLL_CTL3 and wait for the result.
 | |
| 			 */
 | |
| 
 | |
| 			lmc_rd(priv, CVMX_LMCX_DLL_CTL3(3));
 | |
| 		}
 | |
| 
 | |
| 		if (octeon_is_cpuid(OCTEON_CNF75XX)) {
 | |
| 			/*
 | |
| 			 * cnf75xx 2-LMC Mode: LMC0 DRESET must occur after
 | |
| 			 * Step 5, Do LMC0 for 1-LMC Mode here too
 | |
| 			 */
 | |
| 			cn78xx_lmc_dreset_init(priv, 0);
 | |
| 		}
 | |
| 
 | |
| 		/* TWO-LMC MODE AFTER STEP 5 */
 | |
| 		if (if_mask == 0x3) {
 | |
| 			if (octeon_is_cpuid(OCTEON_CNF75XX)) {
 | |
| 				/*
 | |
| 				 * cnf75xx 2-LMC Mode: LMC0 DRESET must
 | |
| 				 * occur after Step 5
 | |
| 				 */
 | |
| 				cn78xx_lmc_dreset_init(priv, 0);
 | |
| 			} else {
 | |
| 				cn78xx_lmc_dreset_init(priv, 1);
 | |
| 			}
 | |
| 		}
 | |
| 
 | |
| 		/* FOUR-LMC MODE AFTER STEP 5 */
 | |
| 		if (if_mask == 0xf) {
 | |
| 			cn78xx_lmc_dreset_init(priv, 0);
 | |
| 			cn78xx_lmc_dreset_init(priv, 1);
 | |
| 
 | |
| 			/*
 | |
| 			 * Enable periodic recalibration of DDR90 delay
 | |
| 			 * line in.
 | |
| 			 */
 | |
| 			ddr_dll_ctl3.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL3(0));
 | |
| 			ddr_dll_ctl3.cn78xx.dclk90_recal_dis = 0;
 | |
| 			lmc_wr(priv, CVMX_LMCX_DLL_CTL3(0), ddr_dll_ctl3.u64);
 | |
| 			ddr_dll_ctl3.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL3(1));
 | |
| 			ddr_dll_ctl3.cn78xx.dclk90_recal_dis = 0;
 | |
| 			lmc_wr(priv, CVMX_LMCX_DLL_CTL3(1), ddr_dll_ctl3.u64);
 | |
| 		}
 | |
| 
 | |
| 		/* Enable fine tune mode for all LMCs */
 | |
| 		for (i = 0; i < 4; ++i) {
 | |
| 			if ((if_mask & (1 << i)) == 0)
 | |
| 				continue;
 | |
| 			ddr_dll_ctl3.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL3(i));
 | |
| 			ddr_dll_ctl3.cn78xx.fine_tune_mode = 1;
 | |
| 			lmc_wr(priv, CVMX_LMCX_DLL_CTL3(i), ddr_dll_ctl3.u64);
 | |
| 		}
 | |
| 
 | |
| 		/*
 | |
| 		 * Enable the trim circuit on the appropriate channels to
 | |
| 		 * adjust the DDR clock duty cycle for chips that support
 | |
| 		 * it
 | |
| 		 */
 | |
| 		if (octeon_is_cpuid(OCTEON_CN78XX_PASS2_X) ||
 | |
| 		    octeon_is_cpuid(OCTEON_CN73XX) ||
 | |
| 		    octeon_is_cpuid(OCTEON_CNF75XX)) {
 | |
| 			union cvmx_lmcx_phy_ctl lmc_phy_ctl;
 | |
| 			int i;
 | |
| 
 | |
| 			for (i = 0; i < 4; ++i) {
 | |
| 				if ((if_mask & (1 << i)) == 0)
 | |
| 					continue;
 | |
| 
 | |
| 				lmc_phy_ctl.u64 =
 | |
| 				    lmc_rd(priv, CVMX_LMCX_PHY_CTL(i));
 | |
| 
 | |
| 				if (octeon_is_cpuid(OCTEON_CNF75XX) ||
 | |
| 				    octeon_is_cpuid(OCTEON_CN73XX_PASS1_3)) {
 | |
| 					/* Both LMCs */
 | |
| 					lmc_phy_ctl.s.lv_mode = 0;
 | |
| 				} else {
 | |
| 					/* Odd LMCs = 0, Even LMCs = 1 */
 | |
| 					lmc_phy_ctl.s.lv_mode = (~i) & 1;
 | |
| 				}
 | |
| 
 | |
| 				debug("LMC%d: PHY_CTL                                 : 0x%016llx\n",
 | |
| 				      i, lmc_phy_ctl.u64);
 | |
| 				lmc_wr(priv, CVMX_LMCX_PHY_CTL(i),
 | |
| 				       lmc_phy_ctl.u64);
 | |
| 			}
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * 5.9.6 LMC RESET Initialization
 | |
| 	 *
 | |
| 	 * NOTE: this is now done as the first step in
 | |
| 	 * init_octeon3_ddr3_interface, rather than the last step in clock
 | |
| 	 * init. This reorg allows restarting per-LMC initialization should
 | |
| 	 * problems be encountered, rather than being forced to resort to
 | |
| 	 * resetting the chip and starting all over.
 | |
| 	 *
 | |
| 	 * Look for the code in octeon3_lmc.c: perform_lmc_reset().
 | |
| 	 */
 | |
| 
 | |
| 	/* Fallthrough for all interfaces... */
 | |
| not_if0:
 | |
| 
 | |
| 	/*
 | |
| 	 * Start the DDR clock so that its frequency can be measured.
 | |
| 	 * For some chips we must activate the memory controller with
 | |
| 	 * init_start to make the DDR clock start to run.
 | |
| 	 */
 | |
| 	if ((!octeon_is_cpuid(OCTEON_CN6XXX)) &&
 | |
| 	    (!octeon_is_cpuid(OCTEON_CNF7XXX)) &&
 | |
| 	    (!octeon_is_cpuid(OCTEON_CN7XXX))) {
 | |
| 		union cvmx_lmcx_mem_cfg0 mem_cfg0;
 | |
| 
 | |
| 		mem_cfg0.u64 = 0;
 | |
| 		mem_cfg0.s.init_start = 1;
 | |
| 		lmc_wr(priv, CVMX_LMCX_MEM_CFG0(if_num), mem_cfg0.u64);
 | |
| 		lmc_rd(priv, CVMX_LMCX_MEM_CFG0(if_num));
 | |
| 	}
 | |
| 
 | |
| 	set_ddr_clock_initialized(priv, if_num, 1);
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static void octeon_ipd_delay_cycles(u64 cycles)
 | |
| {
 | |
| 	u64 start = csr_rd(CVMX_IPD_CLK_COUNT);
 | |
| 
 | |
| 	while (start + cycles > csr_rd(CVMX_IPD_CLK_COUNT))
 | |
| 		;
 | |
| }
 | |
| 
 | |
| static void octeon_ipd_delay_cycles_o3(u64 cycles)
 | |
| {
 | |
| 	u64 start = csr_rd(CVMX_FPA_CLK_COUNT);
 | |
| 
 | |
| 	while (start + cycles > csr_rd(CVMX_FPA_CLK_COUNT))
 | |
| 		;
 | |
| }
 | |
| 
 | |
| static u32 measure_octeon_ddr_clock(struct ddr_priv *priv,
 | |
| 				    struct ddr_conf *ddr_conf, u32 cpu_hertz,
 | |
| 				    u32 ddr_hertz, u32 ddr_ref_hertz,
 | |
| 				    int if_num, u32 if_mask)
 | |
| {
 | |
| 	u64 core_clocks;
 | |
| 	u64 ddr_clocks;
 | |
| 	u64 calc_ddr_hertz;
 | |
| 
 | |
| 	if (ddr_conf) {
 | |
| 		if (initialize_ddr_clock(priv, ddr_conf, cpu_hertz,
 | |
| 					 ddr_hertz, ddr_ref_hertz, if_num,
 | |
| 					 if_mask) != 0)
 | |
| 			return 0;
 | |
| 	}
 | |
| 
 | |
| 	/* Dynamically determine the DDR clock speed */
 | |
| 	if (OCTEON_IS_OCTEON2() || octeon_is_cpuid(OCTEON_CN70XX)) {
 | |
| 		core_clocks = csr_rd(CVMX_IPD_CLK_COUNT);
 | |
| 		ddr_clocks = lmc_rd(priv, CVMX_LMCX_DCLK_CNT(if_num));
 | |
| 		/* How many cpu cycles to measure over */
 | |
| 		octeon_ipd_delay_cycles(100000000);
 | |
| 		core_clocks = csr_rd(CVMX_IPD_CLK_COUNT) - core_clocks;
 | |
| 		ddr_clocks =
 | |
| 		    lmc_rd(priv, CVMX_LMCX_DCLK_CNT(if_num)) - ddr_clocks;
 | |
| 		calc_ddr_hertz = ddr_clocks * gd->bus_clk / core_clocks;
 | |
| 	} else if (octeon_is_cpuid(OCTEON_CN7XXX)) {
 | |
| 		core_clocks = csr_rd(CVMX_FPA_CLK_COUNT);
 | |
| 		ddr_clocks = lmc_rd(priv, CVMX_LMCX_DCLK_CNT(if_num));
 | |
| 		/* How many cpu cycles to measure over */
 | |
| 		octeon_ipd_delay_cycles_o3(100000000);
 | |
| 		core_clocks = csr_rd(CVMX_FPA_CLK_COUNT) - core_clocks;
 | |
| 		ddr_clocks =
 | |
| 		    lmc_rd(priv, CVMX_LMCX_DCLK_CNT(if_num)) - ddr_clocks;
 | |
| 		calc_ddr_hertz = ddr_clocks * gd->bus_clk / core_clocks;
 | |
| 	} else {
 | |
| 		core_clocks = csr_rd(CVMX_IPD_CLK_COUNT);
 | |
| 		/*
 | |
| 		 * ignore overflow, starts counting when we enable the
 | |
| 		 * controller
 | |
| 		 */
 | |
| 		ddr_clocks = lmc_rd(priv, CVMX_LMCX_DCLK_CNT_LO(if_num));
 | |
| 		/* How many cpu cycles to measure over */
 | |
| 		octeon_ipd_delay_cycles(100000000);
 | |
| 		core_clocks = csr_rd(CVMX_IPD_CLK_COUNT) - core_clocks;
 | |
| 		ddr_clocks =
 | |
| 		    lmc_rd(priv, CVMX_LMCX_DCLK_CNT_LO(if_num)) - ddr_clocks;
 | |
| 		calc_ddr_hertz = ddr_clocks * cpu_hertz / core_clocks;
 | |
| 	}
 | |
| 
 | |
| 	debug("core clocks: %llu, ddr clocks: %llu, calc rate: %llu\n",
 | |
| 	      core_clocks, ddr_clocks, calc_ddr_hertz);
 | |
| 	debug("LMC%d: Measured DDR clock: %lld, cpu clock: %u, ddr clocks: %llu\n",
 | |
| 	      if_num, calc_ddr_hertz, cpu_hertz, ddr_clocks);
 | |
| 
 | |
| 	/* Check for unreasonable settings. */
 | |
| 	if (calc_ddr_hertz < 10000) {
 | |
| 		udelay(8000000 * 100);
 | |
| 		printf("DDR clock misconfigured on interface %d. Resetting...\n",
 | |
| 		       if_num);
 | |
| 		do_reset(NULL, 0, 0, NULL);
 | |
| 	}
 | |
| 
 | |
| 	return calc_ddr_hertz;
 | |
| }
 | |
| 
 | |
| u64 lmc_ddr3_rl_dbg_read(struct ddr_priv *priv, int if_num, int idx)
 | |
| {
 | |
| 	union cvmx_lmcx_rlevel_dbg rlevel_dbg;
 | |
| 	union cvmx_lmcx_rlevel_ctl rlevel_ctl;
 | |
| 
 | |
| 	rlevel_ctl.u64 = lmc_rd(priv, CVMX_LMCX_RLEVEL_CTL(if_num));
 | |
| 	rlevel_ctl.s.byte = idx;
 | |
| 
 | |
| 	lmc_wr(priv, CVMX_LMCX_RLEVEL_CTL(if_num), rlevel_ctl.u64);
 | |
| 	lmc_rd(priv, CVMX_LMCX_RLEVEL_CTL(if_num));
 | |
| 
 | |
| 	rlevel_dbg.u64 = lmc_rd(priv, CVMX_LMCX_RLEVEL_DBG(if_num));
 | |
| 	return rlevel_dbg.s.bitmask;
 | |
| }
 | |
| 
 | |
| u64 lmc_ddr3_wl_dbg_read(struct ddr_priv *priv, int if_num, int idx)
 | |
| {
 | |
| 	union cvmx_lmcx_wlevel_dbg wlevel_dbg;
 | |
| 
 | |
| 	wlevel_dbg.u64 = 0;
 | |
| 	wlevel_dbg.s.byte = idx;
 | |
| 
 | |
| 	lmc_wr(priv, CVMX_LMCX_WLEVEL_DBG(if_num), wlevel_dbg.u64);
 | |
| 	lmc_rd(priv, CVMX_LMCX_WLEVEL_DBG(if_num));
 | |
| 
 | |
| 	wlevel_dbg.u64 = lmc_rd(priv, CVMX_LMCX_WLEVEL_DBG(if_num));
 | |
| 	return wlevel_dbg.s.bitmask;
 | |
| }
 | |
| 
 | |
| int validate_ddr3_rlevel_bitmask(struct rlevel_bitmask *rlevel_bitmask_p,
 | |
| 				 int ddr_type)
 | |
| {
 | |
| 	int i;
 | |
| 	int errors = 0;
 | |
| 	u64 mask = 0;		/* Used in 64-bit comparisons */
 | |
| 	u8 mstart = 0;
 | |
| 	u8 width = 0;
 | |
| 	u8 firstbit = 0;
 | |
| 	u8 lastbit = 0;
 | |
| 	u8 bubble = 0;
 | |
| 	u8 tbubble = 0;
 | |
| 	u8 blank = 0;
 | |
| 	u8 narrow = 0;
 | |
| 	u8 trailing = 0;
 | |
| 	u64 bitmask = rlevel_bitmask_p->bm;
 | |
| 	u8 extras = 0;
 | |
| 	u8 toolong = 0;
 | |
| 	u64 temp;
 | |
| 
 | |
| 	if (bitmask == 0) {
 | |
| 		blank += RLEVEL_BITMASK_BLANK_ERROR;
 | |
| 	} else {
 | |
| 		/* Look for fb, the first bit */
 | |
| 		temp = bitmask;
 | |
| 		while (!(temp & 1)) {
 | |
| 			firstbit++;
 | |
| 			temp >>= 1;
 | |
| 		}
 | |
| 
 | |
| 		/* Look for lb, the last bit */
 | |
| 		lastbit = firstbit;
 | |
| 		while ((temp >>= 1))
 | |
| 			lastbit++;
 | |
| 
 | |
| 		/*
 | |
| 		 * Start with the max range to try to find the largest mask
 | |
| 		 * within the bitmask data
 | |
| 		 */
 | |
| 		width = MASKRANGE_BITS;
 | |
| 		for (mask = MASKRANGE; mask > 0; mask >>= 1, --width) {
 | |
| 			for (mstart = lastbit - width + 1; mstart >= firstbit;
 | |
| 			     --mstart) {
 | |
| 				temp = mask << mstart;
 | |
| 				if ((bitmask & temp) == temp)
 | |
| 					goto done_now;
 | |
| 			}
 | |
| 		}
 | |
| done_now:
 | |
| 		/* look for any more contiguous 1's to the right of mstart */
 | |
| 		if (width == MASKRANGE_BITS) {	// only when maximum mask
 | |
| 			while ((bitmask >> (mstart - 1)) & 1) {
 | |
| 				// slide right over more 1's
 | |
| 				--mstart;
 | |
| 				// count the number of extra bits only for DDR4
 | |
| 				if (ddr_type == DDR4_DRAM)
 | |
| 					extras++;
 | |
| 			}
 | |
| 		}
 | |
| 
 | |
| 		/* Penalize any extra 1's beyond the maximum desired mask */
 | |
| 		if (extras > 0)
 | |
| 			toolong =
 | |
| 			    RLEVEL_BITMASK_TOOLONG_ERROR * ((1 << extras) - 1);
 | |
| 
 | |
| 		/* Detect if bitmask is too narrow. */
 | |
| 		if (width < 4)
 | |
| 			narrow = (4 - width) * RLEVEL_BITMASK_NARROW_ERROR;
 | |
| 
 | |
| 		/*
 | |
| 		 * detect leading bubble bits, that is, any 0's between first
 | |
| 		 * and mstart
 | |
| 		 */
 | |
| 		temp = bitmask >> (firstbit + 1);
 | |
| 		i = mstart - firstbit - 1;
 | |
| 		while (--i >= 0) {
 | |
| 			if ((temp & 1) == 0)
 | |
| 				bubble += RLEVEL_BITMASK_BUBBLE_BITS_ERROR;
 | |
| 			temp >>= 1;
 | |
| 		}
 | |
| 
 | |
| 		temp = bitmask >> (mstart + width + extras);
 | |
| 		i = lastbit - (mstart + width + extras - 1);
 | |
| 		while (--i >= 0) {
 | |
| 			if (temp & 1) {
 | |
| 				/*
 | |
| 				 * Detect 1 bits after the trailing end of
 | |
| 				 * the mask, including last.
 | |
| 				 */
 | |
| 				trailing += RLEVEL_BITMASK_TRAILING_BITS_ERROR;
 | |
| 			} else {
 | |
| 				/*
 | |
| 				 * Detect trailing bubble bits, that is,
 | |
| 				 * any 0's between end-of-mask and last
 | |
| 				 */
 | |
| 				tbubble += RLEVEL_BITMASK_BUBBLE_BITS_ERROR;
 | |
| 			}
 | |
| 			temp >>= 1;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	errors = bubble + tbubble + blank + narrow + trailing + toolong;
 | |
| 
 | |
| 	/* Pass out useful statistics */
 | |
| 	rlevel_bitmask_p->mstart = mstart;
 | |
| 	rlevel_bitmask_p->width = width;
 | |
| 
 | |
| 	debug_bitmask_print("bm:%08lx mask:%02lx, width:%2u, mstart:%2d, fb:%2u, lb:%2u (bu:%2d, tb:%2d, bl:%2d, n:%2d, t:%2d, x:%2d) errors:%3d %s\n",
 | |
| 			    (unsigned long)bitmask, mask, width, mstart,
 | |
| 			    firstbit, lastbit, bubble, tbubble, blank,
 | |
| 			    narrow, trailing, toolong, errors,
 | |
| 			    (errors) ? "=> invalid" : "");
 | |
| 
 | |
| 	return errors;
 | |
| }
 | |
| 
 | |
| int compute_ddr3_rlevel_delay(u8 mstart, u8 width,
 | |
| 			      union cvmx_lmcx_rlevel_ctl rlevel_ctl)
 | |
| {
 | |
| 	int delay;
 | |
| 
 | |
| 	debug_bitmask_print("  offset_en:%d", rlevel_ctl.s.offset_en);
 | |
| 
 | |
| 	if (rlevel_ctl.s.offset_en) {
 | |
| 		delay = max((int)mstart,
 | |
| 			    (int)(mstart + width - 1 - rlevel_ctl.s.offset));
 | |
| 	} else {
 | |
| 		/* if (rlevel_ctl.s.offset) { *//* Experimental */
 | |
| 		if (0) {
 | |
| 			delay = max(mstart + rlevel_ctl.s.offset, mstart + 1);
 | |
| 			/*
 | |
| 			 * Insure that the offset delay falls within the
 | |
| 			 * bitmask
 | |
| 			 */
 | |
| 			delay = min(delay, mstart + width - 1);
 | |
| 		} else {
 | |
| 			/* Round down */
 | |
| 			delay = (width - 1) / 2 + mstart;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	return delay;
 | |
| }
 | |
| 
 | |
| /* Default ODT config must disable ODT */
 | |
| /* Must be const (read only) so that the structure is in flash */
 | |
| const struct dimm_odt_config disable_odt_config[] = {
 | |
| 	/*   1 */ { 0, 0x0000, {.u64 = 0x0000}, {.u64 = 0x0000}, 0, 0x0000, 0 },
 | |
| 	/*   2 */ { 0, 0x0000, {.u64 = 0x0000}, {.u64 = 0x0000}, 0, 0x0000, 0 },
 | |
| 	/*   3 */ { 0, 0x0000, {.u64 = 0x0000}, {.u64 = 0x0000}, 0, 0x0000, 0 },
 | |
| 	/*   4 */ { 0, 0x0000, {.u64 = 0x0000}, {.u64 = 0x0000}, 0, 0x0000, 0 },
 | |
| };
 | |
| 
 | |
| /* Memory controller setup function */
 | |
| static int init_octeon_dram_interface(struct ddr_priv *priv,
 | |
| 				      struct ddr_conf *ddr_conf,
 | |
| 				      u32 ddr_hertz, u32 cpu_hertz,
 | |
| 				      u32 ddr_ref_hertz, int if_num,
 | |
| 				      u32 if_mask)
 | |
| {
 | |
| 	u32 mem_size_mbytes = 0;
 | |
| 	char *s;
 | |
| 
 | |
| 	s = lookup_env(priv, "ddr_timing_hertz");
 | |
| 	if (s)
 | |
| 		ddr_hertz = simple_strtoul(s, NULL, 0);
 | |
| 
 | |
| 	if (OCTEON_IS_OCTEON3()) {
 | |
| 		int lmc_restart_retries = 0;
 | |
| #define DEFAULT_RESTART_RETRIES 3
 | |
| 		int lmc_restart_retries_limit = DEFAULT_RESTART_RETRIES;
 | |
| 
 | |
| 		s = lookup_env(priv, "ddr_restart_retries_limit");
 | |
| 		if (s)
 | |
| 			lmc_restart_retries_limit = simple_strtoul(s, NULL, 0);
 | |
| 
 | |
| restart_lmc_init:
 | |
| 		mem_size_mbytes = init_octeon3_ddr3_interface(priv, ddr_conf,
 | |
| 							      ddr_hertz,
 | |
| 							      cpu_hertz,
 | |
| 							      ddr_ref_hertz,
 | |
| 							      if_num, if_mask);
 | |
| 		if (mem_size_mbytes == 0) {	// 0 means restart is possible
 | |
| 			if (lmc_restart_retries < lmc_restart_retries_limit) {
 | |
| 				lmc_restart_retries++;
 | |
| 				printf("N0.LMC%d Configuration problem: attempting LMC reset and init restart %d\n",
 | |
| 				       if_num, lmc_restart_retries);
 | |
| 				goto restart_lmc_init;
 | |
| 			} else {
 | |
| 				if (lmc_restart_retries_limit > 0) {
 | |
| 					printf("INFO: N0.LMC%d Configuration: fatal problem remains after %d LMC init retries - Resetting node...\n",
 | |
| 					       if_num, lmc_restart_retries);
 | |
| 					mdelay(500);
 | |
| 					do_reset(NULL, 0, 0, NULL);
 | |
| 				} else {
 | |
| 					// return an error, no restart
 | |
| 					mem_size_mbytes = -1;
 | |
| 				}
 | |
| 			}
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	debug("N0.LMC%d Configuration Completed: %d MB\n",
 | |
| 	      if_num, mem_size_mbytes);
 | |
| 
 | |
| 	return mem_size_mbytes;
 | |
| }
 | |
| 
 | |
| #define WLEVEL_BYTE_BITS	5
 | |
| #define WLEVEL_BYTE_MSK		((1ULL << 5) - 1)
 | |
| 
 | |
| void upd_wl_rank(union cvmx_lmcx_wlevel_rankx *lmc_wlevel_rank,
 | |
| 		 int byte, int delay)
 | |
| {
 | |
| 	union cvmx_lmcx_wlevel_rankx temp_wlevel_rank;
 | |
| 
 | |
| 	if (byte >= 0 && byte <= 8) {
 | |
| 		temp_wlevel_rank.u64 = lmc_wlevel_rank->u64;
 | |
| 		temp_wlevel_rank.u64 &=
 | |
| 		    ~(WLEVEL_BYTE_MSK << (WLEVEL_BYTE_BITS * byte));
 | |
| 		temp_wlevel_rank.u64 |=
 | |
| 		    ((delay & WLEVEL_BYTE_MSK) << (WLEVEL_BYTE_BITS * byte));
 | |
| 		lmc_wlevel_rank->u64 = temp_wlevel_rank.u64;
 | |
| 	}
 | |
| }
 | |
| 
 | |
| int get_wl_rank(union cvmx_lmcx_wlevel_rankx *lmc_wlevel_rank, int byte)
 | |
| {
 | |
| 	int delay = 0;
 | |
| 
 | |
| 	if (byte >= 0 && byte <= 8)
 | |
| 		delay =
 | |
| 		    ((lmc_wlevel_rank->u64) >> (WLEVEL_BYTE_BITS *
 | |
| 						byte)) & WLEVEL_BYTE_MSK;
 | |
| 
 | |
| 	return delay;
 | |
| }
 | |
| 
 | |
| void upd_rl_rank(union cvmx_lmcx_rlevel_rankx *lmc_rlevel_rank,
 | |
| 		 int byte, int delay)
 | |
| {
 | |
| 	union cvmx_lmcx_rlevel_rankx temp_rlevel_rank;
 | |
| 
 | |
| 	if (byte >= 0 && byte <= 8) {
 | |
| 		temp_rlevel_rank.u64 =
 | |
| 		    lmc_rlevel_rank->u64 & ~(RLEVEL_BYTE_MSK <<
 | |
| 					     (RLEVEL_BYTE_BITS * byte));
 | |
| 		temp_rlevel_rank.u64 |=
 | |
| 		    ((delay & RLEVEL_BYTE_MSK) << (RLEVEL_BYTE_BITS * byte));
 | |
| 		lmc_rlevel_rank->u64 = temp_rlevel_rank.u64;
 | |
| 	}
 | |
| }
 | |
| 
 | |
| int get_rl_rank(union cvmx_lmcx_rlevel_rankx *lmc_rlevel_rank, int byte)
 | |
| {
 | |
| 	int delay = 0;
 | |
| 
 | |
| 	if (byte >= 0 && byte <= 8)
 | |
| 		delay =
 | |
| 		    ((lmc_rlevel_rank->u64) >> (RLEVEL_BYTE_BITS *
 | |
| 						byte)) & RLEVEL_BYTE_MSK;
 | |
| 
 | |
| 	return delay;
 | |
| }
 | |
| 
 | |
/*
 * Derive a write-leveling delay for @byte from its read-leveling delay.
 *
 * The value read with get_rl_rank() is halved (rounding up via
 * divide_roundup()), masked with 0x1e, and stored into @lmc_wlevel_rank
 * with upd_wl_rank().
 */
void rlevel_to_wlevel(union cvmx_lmcx_rlevel_rankx *lmc_rlevel_rank,
		      union cvmx_lmcx_wlevel_rankx *lmc_wlevel_rank, int byte)
{
	const int rl_delay = get_rl_rank(lmc_rlevel_rank, byte);
	int wl_delay;

	debug("Estimating Wlevel delay byte %d: ", byte);
	debug("Rlevel=%d => ", rl_delay);

	wl_delay = divide_roundup(rl_delay, 2) & 0x1e;
	debug("Wlevel=%d\n", wl_delay);

	upd_wl_rank(lmc_wlevel_rank, byte, wl_delay);
}
 | |
| 
 | |
| /* Delay trend: constant=0, decreasing=-1, increasing=1 */
 | |
| static s64 calc_delay_trend(s64 v)
 | |
| {
 | |
| 	if (v == 0)
 | |
| 		return 0;
 | |
| 	if (v < 0)
 | |
| 		return -1;
 | |
| 
 | |
| 	return 1;
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Evaluate delay sequence across the whole range of byte delays while
 | |
|  * keeping track of the overall delay trend, increasing or decreasing.
 | |
|  * If the trend changes charge an error amount to the score.
 | |
|  */
 | |
| 
 | |
| // NOTE: "max_adj_delay_inc" argument is, by default, 1 for DDR3 and 2 for DDR4
 | |
| 
 | |
| int nonseq_del(struct rlevel_byte_data *rlevel_byte, int start, int end,
 | |
| 	       int max_adj_delay_inc)
 | |
| {
 | |
| 	s64 error = 0;
 | |
| 	s64 delay_trend, prev_trend = 0;
 | |
| 	int byte_idx;
 | |
| 	s64 seq_err;
 | |
| 	s64 adj_err;
 | |
| 	s64 delay_inc;
 | |
| 	s64 delay_diff;
 | |
| 
 | |
| 	for (byte_idx = start; byte_idx < end; ++byte_idx) {
 | |
| 		delay_diff = rlevel_byte[byte_idx + 1].delay -
 | |
| 			rlevel_byte[byte_idx].delay;
 | |
| 		delay_trend = calc_delay_trend(delay_diff);
 | |
| 
 | |
| 		/*
 | |
| 		 * Increment error each time the trend changes to the
 | |
| 		 * opposite direction.
 | |
| 		 */
 | |
| 		if (prev_trend != 0 && delay_trend != 0 &&
 | |
| 		    prev_trend != delay_trend) {
 | |
| 			seq_err = RLEVEL_NONSEQUENTIAL_DELAY_ERROR;
 | |
| 		} else {
 | |
| 			seq_err = 0;
 | |
| 		}
 | |
| 
 | |
| 		// how big was the delay change, if any
 | |
| 		delay_inc = abs(delay_diff);
 | |
| 
 | |
| 		/*
 | |
| 		 * Even if the trend did not change to the opposite direction,
 | |
| 		 * check for the magnitude of the change, and scale the
 | |
| 		 * penalty by the amount that the size is larger than the
 | |
| 		 * provided limit.
 | |
| 		 */
 | |
| 		if (max_adj_delay_inc != 0 && delay_inc > max_adj_delay_inc) {
 | |
| 			adj_err = (delay_inc - max_adj_delay_inc) *
 | |
| 				RLEVEL_ADJACENT_DELAY_ERROR;
 | |
| 		} else {
 | |
| 			adj_err = 0;
 | |
| 		}
 | |
| 
 | |
| 		rlevel_byte[byte_idx + 1].sqerrs = seq_err + adj_err;
 | |
| 		error += seq_err + adj_err;
 | |
| 
 | |
| 		debug_bitmask_print("Byte %d: %d, Byte %d: %d, delay_trend: %ld, prev_trend: %ld, [%ld/%ld]%s%s\n",
 | |
| 				    byte_idx + 0,
 | |
| 				    rlevel_byte[byte_idx + 0].delay,
 | |
| 				    byte_idx + 1,
 | |
| 				    rlevel_byte[byte_idx + 1].delay,
 | |
| 				    delay_trend,
 | |
| 				    prev_trend, seq_err, adj_err,
 | |
| 				    (seq_err) ?
 | |
| 				    " => Nonsequential byte delay" : "",
 | |
| 				    (adj_err) ?
 | |
| 				    " => Adjacent delay error" : "");
 | |
| 
 | |
| 		if (delay_trend != 0)
 | |
| 			prev_trend = delay_trend;
 | |
| 	}
 | |
| 
 | |
| 	return (int)error;
 | |
| }
 | |
| 
 | |
/*
 * Turn an 8-bit write-leveling result bitmask into an even delay setting.
 *
 * Only bits 0..7 of @bitmask are examined. The search first steps over the
 * run of set bits that starts at bit 0, then looks for the next set bit,
 * wrapping from bit 7 back to bit 0. The position found is rounded up to the
 * next even number and reduced modulo 8.
 *
 * Return: 0, 2, 4 or 6.
 */
int roundup_ddr3_wlevel_bitmask(int bitmask)
{
	int leader;
	int delay;

	/* Skip the leading run of ones (if any) at the bottom of the mask */
	for (leader = 0; leader < 8; ++leader) {
		if (((bitmask >> leader) & 1) == 0)
			break;
	}

	/*
	 * Continue from where the first scan stopped; positions 8..15 alias
	 * bits 0..7 so the search wraps around once.
	 */
	for (; leader < 16; ++leader) {
		if ((bitmask >> (leader % 8)) & 1)
			break;
	}

	/* Round odd positions up to the next even one, then wrap into 0..7 */
	delay = (leader & 1) ? leader + 1 : leader;

	return delay % 8;
}
 | |
| 
 | |
| /* Octeon 2 */
 | |
| static void oct2_ddr3_seq(struct ddr_priv *priv, int rank_mask, int if_num,
 | |
| 			  int sequence)
 | |
| {
 | |
| 	char *s;
 | |
| 
 | |
| #ifdef DEBUG_PERFORM_DDR3_SEQUENCE
 | |
| 	static const char * const sequence_str[] = {
 | |
| 		"power-up/init",
 | |
| 		"read-leveling",
 | |
| 		"self-refresh entry",
 | |
| 		"self-refresh exit",
 | |
| 		"precharge power-down entry",
 | |
| 		"precharge power-down exit",
 | |
| 		"write-leveling",
 | |
| 		"illegal"
 | |
| 	};
 | |
| #endif
 | |
| 
 | |
| 	union cvmx_lmcx_control lmc_control;
 | |
| 	union cvmx_lmcx_config lmc_config;
 | |
| 	int save_ddr2t;
 | |
| 
 | |
| 	lmc_control.u64 = lmc_rd(priv, CVMX_LMCX_CONTROL(if_num));
 | |
| 	save_ddr2t = lmc_control.s.ddr2t;
 | |
| 
 | |
| 	if (save_ddr2t == 0 && octeon_is_cpuid(OCTEON_CN63XX_PASS1_X)) {
 | |
| 		/* Some register parts (IDT and TI included) do not like
 | |
| 		 * the sequence that LMC generates for an MRS register
 | |
| 		 * write in 1T mode. In this case, the register part does
 | |
| 		 * not properly forward the MRS register write to the DRAM
 | |
| 		 * parts.  See errata (LMC-14548) Issues with registered
 | |
| 		 * DIMMs.
 | |
| 		 */
 | |
| 		debug("Forcing DDR 2T during init seq. Re: Pass 1 LMC-14548\n");
 | |
| 		lmc_control.s.ddr2t = 1;
 | |
| 	}
 | |
| 
 | |
| 	s = lookup_env(priv, "ddr_init_2t");
 | |
| 	if (s)
 | |
| 		lmc_control.s.ddr2t = simple_strtoul(s, NULL, 0);
 | |
| 
 | |
| 	lmc_wr(priv, CVMX_LMCX_CONTROL(if_num), lmc_control.u64);
 | |
| 
 | |
| 	lmc_config.u64 = lmc_rd(priv, CVMX_LMCX_CONFIG(if_num));
 | |
| 
 | |
| 	lmc_config.s.init_start = 1;
 | |
| 	if (OCTEON_IS_OCTEON2())
 | |
| 		lmc_config.cn63xx.sequence = sequence;
 | |
| 	lmc_config.s.rankmask = rank_mask;
 | |
| 
 | |
| #ifdef DEBUG_PERFORM_DDR3_SEQUENCE
 | |
| 	debug("Performing LMC sequence: rank_mask=0x%02x, sequence=%d, %s\n",
 | |
| 	      rank_mask, sequence, sequence_str[sequence]);
 | |
| #endif
 | |
| 
 | |
| 	lmc_wr(priv, CVMX_LMCX_CONFIG(if_num), lmc_config.u64);
 | |
| 	lmc_rd(priv, CVMX_LMCX_CONFIG(if_num));
 | |
| 	udelay(600);		/* Wait a while */
 | |
| 
 | |
| 	lmc_control.s.ddr2t = save_ddr2t;
 | |
| 	lmc_wr(priv, CVMX_LMCX_CONTROL(if_num), lmc_control.u64);
 | |
| 	lmc_rd(priv, CVMX_LMCX_CONTROL(if_num));
 | |
| }
 | |
| 
 | |
/*
 * Tell whether a custom DLL offset table carries any non-zero entry.
 *
 * @dll_offset_table: table of 9 offsets, or NULL when the board has none
 *
 * Return: 1 if any of the first 9 entries is non-zero, otherwise 0 (also
 * for a NULL table).
 */
static int is_dll_offset_provided(const int8_t *dll_offset_table)
{
	const int8_t *entry;

	if (!dll_offset_table)
		return 0;

	for (entry = dll_offset_table; entry < dll_offset_table + 9; entry++) {
		if (*entry)
			return 1;
	}

	return 0;
}
 | |
| 
 | |
| void change_dll_offset_enable(struct ddr_priv *priv, int if_num, int change)
 | |
| {
 | |
| 	union cvmx_lmcx_dll_ctl3 ddr_dll_ctl3;
 | |
| 
 | |
| 	ddr_dll_ctl3.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL3(if_num));
 | |
| 	SET_DDR_DLL_CTL3(offset_ena, !!change);
 | |
| 	lmc_wr(priv, CVMX_LMCX_DLL_CTL3(if_num), ddr_dll_ctl3.u64);
 | |
| 	ddr_dll_ctl3.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL3(if_num));
 | |
| }
 | |
| 
 | |
| unsigned short load_dll_offset(struct ddr_priv *priv, int if_num,
 | |
| 			       int dll_offset_mode, int byte_offset, int byte)
 | |
| {
 | |
| 	union cvmx_lmcx_dll_ctl3 ddr_dll_ctl3;
 | |
| 	int field_width = 6;
 | |
| 	/*
 | |
| 	 * byte_sel:
 | |
| 	 * 0x1 = byte 0, ..., 0x9 = byte 8
 | |
| 	 * 0xA = all bytes
 | |
| 	 */
 | |
| 	int byte_sel = (byte == 10) ? byte : byte + 1;
 | |
| 
 | |
| 	if (octeon_is_cpuid(OCTEON_CN6XXX))
 | |
| 		field_width = 5;
 | |
| 
 | |
| 	ddr_dll_ctl3.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL3(if_num));
 | |
| 	SET_DDR_DLL_CTL3(load_offset, 0);
 | |
| 	lmc_wr(priv, CVMX_LMCX_DLL_CTL3(if_num), ddr_dll_ctl3.u64);
 | |
| 	ddr_dll_ctl3.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL3(if_num));
 | |
| 
 | |
| 	SET_DDR_DLL_CTL3(mode_sel, dll_offset_mode);
 | |
| 	SET_DDR_DLL_CTL3(offset,
 | |
| 			 (abs(byte_offset) & (~(-1 << field_width))) |
 | |
| 			 (_sign(byte_offset) << field_width));
 | |
| 	SET_DDR_DLL_CTL3(byte_sel, byte_sel);
 | |
| 	lmc_wr(priv, CVMX_LMCX_DLL_CTL3(if_num), ddr_dll_ctl3.u64);
 | |
| 	ddr_dll_ctl3.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL3(if_num));
 | |
| 
 | |
| 	SET_DDR_DLL_CTL3(load_offset, 1);
 | |
| 	lmc_wr(priv, CVMX_LMCX_DLL_CTL3(if_num), ddr_dll_ctl3.u64);
 | |
| 	ddr_dll_ctl3.u64 = lmc_rd(priv, CVMX_LMCX_DLL_CTL3(if_num));
 | |
| 
 | |
| 	return (unsigned short)GET_DDR_DLL_CTL3(offset);
 | |
| }
 | |
| 
 | |
| void process_custom_dll_offsets(struct ddr_priv *priv, int if_num,
 | |
| 				const char *enable_str,
 | |
| 				const int8_t *offsets, const char *byte_str,
 | |
| 				int mode)
 | |
| {
 | |
| 	const char *s;
 | |
| 	int enabled;
 | |
| 	int provided;
 | |
| 	int byte_offset;
 | |
| 	unsigned short offset[9] = { 0 };
 | |
| 	int byte;
 | |
| 
 | |
| 	s = lookup_env(priv, enable_str);
 | |
| 	if (s)
 | |
| 		enabled = !!simple_strtol(s, NULL, 0);
 | |
| 	else
 | |
| 		enabled = -1;
 | |
| 
 | |
| 	/*
 | |
| 	 * enabled == -1: no override, do only configured offsets if provided
 | |
| 	 * enabled ==  0: override OFF, do NOT do it even if configured
 | |
| 	 *                offsets provided
 | |
| 	 * enabled ==  1: override ON, do it for overrides plus configured
 | |
| 	 *                offsets
 | |
| 	 */
 | |
| 
 | |
| 	if (enabled == 0)
 | |
| 		return;
 | |
| 
 | |
| 	provided = is_dll_offset_provided(offsets);
 | |
| 
 | |
| 	if (enabled < 0 && !provided)
 | |
| 		return;
 | |
| 
 | |
| 	change_dll_offset_enable(priv, if_num, 0);
 | |
| 
 | |
| 	for (byte = 0; byte < 9; ++byte) {
 | |
| 		// always take the provided, if available
 | |
| 		byte_offset = (provided) ? offsets[byte] : 0;
 | |
| 
 | |
| 		// then, if enabled, use any overrides present
 | |
| 		if (enabled > 0) {
 | |
| 			s = lookup_env(priv, byte_str, if_num, byte);
 | |
| 			if (s)
 | |
| 				byte_offset = simple_strtol(s, NULL, 0);
 | |
| 		}
 | |
| 
 | |
| 		offset[byte] =
 | |
| 		    load_dll_offset(priv, if_num, mode, byte_offset, byte);
 | |
| 	}
 | |
| 
 | |
| 	change_dll_offset_enable(priv, if_num, 1);
 | |
| 
 | |
| 	debug("N0.LMC%d: DLL %s Offset 8:0       :  0x%02x  0x%02x  0x%02x  0x%02x  0x%02x  0x%02x  0x%02x  0x%02x  0x%02x\n",
 | |
| 	      if_num, (mode == 2) ? "Read " : "Write",
 | |
| 	      offset[8], offset[7], offset[6], offset[5], offset[4],
 | |
| 	      offset[3], offset[2], offset[1], offset[0]);
 | |
| }
 | |
| 
 | |
| void ddr_init_seq(struct ddr_priv *priv, int rank_mask, int if_num)
 | |
| {
 | |
| 	char *s;
 | |
| 	int ddr_init_loops = 1;
 | |
| 	int rankx;
 | |
| 
 | |
| 	s = lookup_env(priv, "ddr%d_init_loops", if_num);
 | |
| 	if (s)
 | |
| 		ddr_init_loops = simple_strtoul(s, NULL, 0);
 | |
| 
 | |
| 	while (ddr_init_loops--) {
 | |
| 		for (rankx = 0; rankx < 8; rankx++) {
 | |
| 			if (!(rank_mask & (1 << rankx)))
 | |
| 				continue;
 | |
| 
 | |
| 			if (OCTEON_IS_OCTEON3()) {
 | |
| 				/* power-up/init */
 | |
| 				oct3_ddr3_seq(priv, 1 << rankx, if_num, 0);
 | |
| 			} else {
 | |
| 				/* power-up/init */
 | |
| 				oct2_ddr3_seq(priv, 1 << rankx, if_num, 0);
 | |
| 			}
 | |
| 
 | |
| 			udelay(1000);	/* Wait a while. */
 | |
| 
 | |
| 			s = lookup_env(priv, "ddr_sequence1");
 | |
| 			if (s) {
 | |
| 				int sequence1;
 | |
| 
 | |
| 				sequence1 = simple_strtoul(s, NULL, 0);
 | |
| 
 | |
| 				if (OCTEON_IS_OCTEON3()) {
 | |
| 					oct3_ddr3_seq(priv, 1 << rankx,
 | |
| 						      if_num, sequence1);
 | |
| 				} else {
 | |
| 					oct2_ddr3_seq(priv, 1 << rankx,
 | |
| 						      if_num, sequence1);
 | |
| 				}
 | |
| 			}
 | |
| 
 | |
| 			s = lookup_env(priv, "ddr_sequence2");
 | |
| 			if (s) {
 | |
| 				int sequence2;
 | |
| 
 | |
| 				sequence2 = simple_strtoul(s, NULL, 0);
 | |
| 
 | |
| 				if (OCTEON_IS_OCTEON3())
 | |
| 					oct3_ddr3_seq(priv, 1 << rankx,
 | |
| 						      if_num, sequence2);
 | |
| 				else
 | |
| 					oct2_ddr3_seq(priv, 1 << rankx,
 | |
| 						      if_num, sequence2);
 | |
| 			}
 | |
| 		}
 | |
| 	}
 | |
| }
 | |
| 
 | |
| static int octeon_ddr_initialize(struct ddr_priv *priv, u32 cpu_hertz,
 | |
| 				 u32 ddr_hertz, u32 ddr_ref_hertz,
 | |
| 				 u32 if_mask,
 | |
| 				 struct ddr_conf *ddr_conf,
 | |
| 				 u32 *measured_ddr_hertz)
 | |
| {
 | |
| 	u32 ddr_conf_valid_mask = 0;
 | |
| 	int memsize_mbytes = 0;
 | |
| 	char *eptr;
 | |
| 	int if_idx;
 | |
| 	u32 ddr_max_speed = 667000000;
 | |
| 	u32 calc_ddr_hertz = -1;
 | |
| 	int val;
 | |
| 	int ret;
 | |
| 
 | |
| 	if (env_get("ddr_verbose") || env_get("ddr_prompt"))
 | |
| 		priv->flags |= FLAG_DDR_VERBOSE;
 | |
| 
 | |
| #ifdef DDR_VERBOSE
 | |
| 	priv->flags |= FLAG_DDR_VERBOSE;
 | |
| #endif
 | |
| 
 | |
| 	if (env_get("ddr_trace_init")) {
 | |
| 		printf("Parameter ddr_trace_init found in environment.\n");
 | |
| 		priv->flags |= FLAG_DDR_TRACE_INIT;
 | |
| 		priv->flags |= FLAG_DDR_VERBOSE;
 | |
| 	}
 | |
| 
 | |
| 	priv->flags |= FLAG_DDR_DEBUG;
 | |
| 
 | |
| 	val = env_get_ulong("ddr_debug", 10, (u32)-1);
 | |
| 	switch (val) {
 | |
| 	case 0:
 | |
| 		priv->flags &= ~FLAG_DDR_DEBUG;
 | |
| 		printf("Parameter ddr_debug clear in environment\n");
 | |
| 		break;
 | |
| 	case (u32)-1:
 | |
| 		break;
 | |
| 	default:
 | |
| 		printf("Parameter ddr_debug set in environment\n");
 | |
| 		priv->flags |= FLAG_DDR_DEBUG;
 | |
| 		priv->flags |= FLAG_DDR_VERBOSE;
 | |
| 		break;
 | |
| 	}
 | |
| 	if (env_get("ddr_prompt"))
 | |
| 		priv->flags |= FLAG_DDR_PROMPT;
 | |
| 
 | |
| 	/* Force ddr_verbose for failsafe debugger */
 | |
| 	if (priv->flags & FLAG_FAILSAFE_MODE)
 | |
| 		priv->flags |= FLAG_DDR_VERBOSE;
 | |
| 
 | |
| #ifdef DDR_DEBUG
 | |
| 	priv->flags |= FLAG_DDR_DEBUG;
 | |
| 	/* Keep verbose on while we are still debugging. */
 | |
| 	priv->flags |= FLAG_DDR_VERBOSE;
 | |
| #endif
 | |
| 
 | |
| 	if ((octeon_is_cpuid(OCTEON_CN61XX) ||
 | |
| 	     octeon_is_cpuid(OCTEON_CNF71XX)) && ddr_max_speed > 533333333) {
 | |
| 		ddr_max_speed = 533333333;
 | |
| 	} else if (octeon_is_cpuid(OCTEON_CN7XXX)) {
 | |
| 		/* Override speed restrictions to support internal testing. */
 | |
| 		ddr_max_speed = 1210000000;
 | |
| 	}
 | |
| 
 | |
| 	if (ddr_hertz > ddr_max_speed) {
 | |
| 		printf("DDR clock speed %u exceeds maximum supported DDR speed, reducing to %uHz\n",
 | |
| 		       ddr_hertz, ddr_max_speed);
 | |
| 		ddr_hertz = ddr_max_speed;
 | |
| 	}
 | |
| 
 | |
| 	if (OCTEON_IS_OCTEON3()) {	// restrict check
 | |
| 		if (ddr_hertz > cpu_hertz) {
 | |
| 			printf("\nFATAL ERROR: DDR speed %u exceeds CPU speed %u, exiting...\n\n",
 | |
| 			       ddr_hertz, cpu_hertz);
 | |
| 			return -1;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	/* Enable L2 ECC */
 | |
| 	eptr = env_get("disable_l2_ecc");
 | |
| 	if (eptr) {
 | |
| 		printf("Disabling L2 ECC based on disable_l2_ecc environment variable\n");
 | |
| 		union cvmx_l2c_ctl l2c_val;
 | |
| 
 | |
| 		l2c_val.u64 = l2c_rd(priv, CVMX_L2C_CTL);
 | |
| 		l2c_val.s.disecc = 1;
 | |
| 		l2c_wr(priv, CVMX_L2C_CTL, l2c_val.u64);
 | |
| 	} else {
 | |
| 		union cvmx_l2c_ctl l2c_val;
 | |
| 
 | |
| 		l2c_val.u64 = l2c_rd(priv, CVMX_L2C_CTL);
 | |
| 		l2c_val.s.disecc = 0;
 | |
| 		l2c_wr(priv, CVMX_L2C_CTL, l2c_val.u64);
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * Init the L2C, must be done before DRAM access so that we
 | |
| 	 * know L2 is empty
 | |
| 	 */
 | |
| 	eptr = env_get("disable_l2_index_aliasing");
 | |
| 	if (eptr) {
 | |
| 		union cvmx_l2c_ctl l2c_val;
 | |
| 
 | |
| 		puts("L2 index aliasing disabled.\n");
 | |
| 
 | |
| 		l2c_val.u64 = l2c_rd(priv, CVMX_L2C_CTL);
 | |
| 		l2c_val.s.disidxalias = 1;
 | |
| 		l2c_wr(priv, CVMX_L2C_CTL, l2c_val.u64);
 | |
| 	} else {
 | |
| 		union cvmx_l2c_ctl l2c_val;
 | |
| 
 | |
| 		/* Enable L2C index aliasing */
 | |
| 
 | |
| 		l2c_val.u64 = l2c_rd(priv, CVMX_L2C_CTL);
 | |
| 		l2c_val.s.disidxalias = 0;
 | |
| 		l2c_wr(priv, CVMX_L2C_CTL, l2c_val.u64);
 | |
| 	}
 | |
| 
 | |
| 	if (OCTEON_IS_OCTEON3()) {
 | |
| 		/*
 | |
| 		 * rdf_cnt: Defines the sample point of the LMC response data in
 | |
| 		 * the DDR-clock/core-clock crossing.  For optimal
 | |
| 		 * performance set to 10 * (DDR-clock period/core-clock
 | |
| 		 * period) - 1.  To disable set to 0. All other values
 | |
| 		 * are reserved.
 | |
| 		 */
 | |
| 
 | |
| 		union cvmx_l2c_ctl l2c_ctl;
 | |
| 		u64 rdf_cnt;
 | |
| 		char *s;
 | |
| 
 | |
| 		l2c_ctl.u64 = l2c_rd(priv, CVMX_L2C_CTL);
 | |
| 
 | |
| 		/*
 | |
| 		 * It is more convenient to compute the ratio using clock
 | |
| 		 * frequencies rather than clock periods.
 | |
| 		 */
 | |
| 		rdf_cnt = (((u64)10 * cpu_hertz) / ddr_hertz) - 1;
 | |
| 		rdf_cnt = rdf_cnt < 256 ? rdf_cnt : 255;
 | |
| 		l2c_ctl.cn78xx.rdf_cnt = rdf_cnt;
 | |
| 
 | |
| 		s = lookup_env(priv, "early_fill_count");
 | |
| 		if (s)
 | |
| 			l2c_ctl.cn78xx.rdf_cnt = simple_strtoul(s, NULL, 0);
 | |
| 
 | |
| 		debug("%-45s : %d, cpu_hertz:%d, ddr_hertz:%d\n",
 | |
| 		      "EARLY FILL COUNT  ", l2c_ctl.cn78xx.rdf_cnt, cpu_hertz,
 | |
| 		      ddr_hertz);
 | |
| 		l2c_wr(priv, CVMX_L2C_CTL, l2c_ctl.u64);
 | |
| 	}
 | |
| 
 | |
| 	/* Check for lower DIMM socket populated */
 | |
| 	for (if_idx = 0; if_idx < 4; ++if_idx) {
 | |
| 		if ((if_mask & (1 << if_idx)) &&
 | |
| 		    validate_dimm(priv,
 | |
| 				  &ddr_conf[(int)if_idx].dimm_config_table[0],
 | |
| 				  0))
 | |
| 			ddr_conf_valid_mask |= (1 << if_idx);
 | |
| 	}
 | |
| 
 | |
| 	if (octeon_is_cpuid(OCTEON_CN68XX) || octeon_is_cpuid(OCTEON_CN78XX)) {
 | |
| 		int four_lmc_mode = 1;
 | |
| 		char *s;
 | |
| 
 | |
| 		if (priv->flags & FLAG_FAILSAFE_MODE)
 | |
| 			four_lmc_mode = 0;
 | |
| 
 | |
| 		/* Pass 1.0 disable four LMC mode.
 | |
| 		 *  See errata (LMC-15811)
 | |
| 		 */
 | |
| 		if (octeon_is_cpuid(OCTEON_CN68XX_PASS1_0))
 | |
| 			four_lmc_mode = 0;
 | |
| 
 | |
| 		s = env_get("ddr_four_lmc");
 | |
| 		if (s) {
 | |
| 			four_lmc_mode = simple_strtoul(s, NULL, 0);
 | |
| 			printf("Parameter found in environment. ddr_four_lmc = %d\n",
 | |
| 			       four_lmc_mode);
 | |
| 		}
 | |
| 
 | |
| 		if (!four_lmc_mode) {
 | |
| 			puts("Forcing two-LMC Mode.\n");
 | |
| 			/* Invalidate LMC[2:3] */
 | |
| 			ddr_conf_valid_mask &= ~(3 << 2);
 | |
| 		}
 | |
| 	} else if (octeon_is_cpuid(OCTEON_CN73XX)) {
 | |
| 		int one_lmc_mode = 0;
 | |
| 		char *s;
 | |
| 
 | |
| 		s = env_get("ddr_one_lmc");
 | |
| 		if (s) {
 | |
| 			one_lmc_mode = simple_strtoul(s, NULL, 0);
 | |
| 			printf("Parameter found in environment. ddr_one_lmc = %d\n",
 | |
| 			       one_lmc_mode);
 | |
| 		}
 | |
| 
 | |
| 		if (one_lmc_mode) {
 | |
| 			puts("Forcing one-LMC Mode.\n");
 | |
| 			/* Invalidate LMC[1:3] */
 | |
| 			ddr_conf_valid_mask &= ~(1 << 1);
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if (!ddr_conf_valid_mask) {
 | |
| 		printf
 | |
| 		    ("ERROR: No valid DIMMs detected on any DDR interface.\n");
 | |
| 		hang();
 | |
| 		return -1;	// testr-only: no ret negativ!!!
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * We measure the DDR frequency by counting DDR clocks.  We can
 | |
| 	 * confirm or adjust the expected frequency as necessary.  We use
 | |
| 	 * the measured frequency to make accurate timing calculations
 | |
| 	 * used to configure the controller.
 | |
| 	 */
 | |
| 	for (if_idx = 0; if_idx < 4; ++if_idx) {
 | |
| 		u32 tmp_hertz;
 | |
| 
 | |
| 		if (!(ddr_conf_valid_mask & (1 << if_idx)))
 | |
| 			continue;
 | |
| 
 | |
| try_again:
 | |
| 		/*
 | |
| 		 * only check for alternate refclk wanted on chips that
 | |
| 		 * support it
 | |
| 		 */
 | |
| 		if ((octeon_is_cpuid(OCTEON_CN73XX)) ||
 | |
| 		    (octeon_is_cpuid(OCTEON_CNF75XX)) ||
 | |
| 		    (octeon_is_cpuid(OCTEON_CN78XX_PASS2_X))) {
 | |
| 			// only need do this if we are LMC0
 | |
| 			if (if_idx == 0) {
 | |
| 				union cvmx_lmcx_ddr_pll_ctl ddr_pll_ctl;
 | |
| 
 | |
| 				ddr_pll_ctl.u64 =
 | |
| 				    lmc_rd(priv, CVMX_LMCX_DDR_PLL_CTL(0));
 | |
| 
 | |
| 				/*
 | |
| 				 * If we are asking for 100 MHz refclk, we can
 | |
| 				 * only get it via alternate, so switch to it
 | |
| 				 */
 | |
| 				if (ddr_ref_hertz == 100000000) {
 | |
| 					ddr_pll_ctl.cn78xx.dclk_alt_refclk_sel =
 | |
| 					    1;
 | |
| 					lmc_wr(priv, CVMX_LMCX_DDR_PLL_CTL(0),
 | |
| 					       ddr_pll_ctl.u64);
 | |
| 					udelay(1000);	// wait 1 msec
 | |
| 				} else {
 | |
| 					/*
 | |
| 					 * If we are NOT asking for 100MHz,
 | |
| 					 * then reset to (assumed) 50MHz and go
 | |
| 					 * on
 | |
| 					 */
 | |
| 					ddr_pll_ctl.cn78xx.dclk_alt_refclk_sel =
 | |
| 					    0;
 | |
| 					lmc_wr(priv, CVMX_LMCX_DDR_PLL_CTL(0),
 | |
| 					       ddr_pll_ctl.u64);
 | |
| 					udelay(1000);	// wait 1 msec
 | |
| 				}
 | |
| 			}
 | |
| 		} else {
 | |
| 			if (ddr_ref_hertz == 100000000) {
 | |
| 				debug("N0: DRAM init: requested 100 MHz refclk NOT SUPPORTED\n");
 | |
| 				ddr_ref_hertz = CONFIG_REF_HERTZ;
 | |
| 			}
 | |
| 		}
 | |
| 
 | |
| 		tmp_hertz = measure_octeon_ddr_clock(priv, &ddr_conf[if_idx],
 | |
| 						     cpu_hertz, ddr_hertz,
 | |
| 						     ddr_ref_hertz, if_idx,
 | |
| 						     ddr_conf_valid_mask);
 | |
| 
 | |
| 		/*
 | |
| 		 * only check for alternate refclk acquired on chips that
 | |
| 		 * support it
 | |
| 		 */
 | |
| 		if ((octeon_is_cpuid(OCTEON_CN73XX)) ||
 | |
| 		    (octeon_is_cpuid(OCTEON_CNF75XX)) ||
 | |
| 		    (octeon_is_cpuid(OCTEON_CN78XX_PASS2_X))) {
 | |
| 			/*
 | |
| 			 * if we are LMC0 and we are asked for 100 MHz refclk,
 | |
| 			 * we must be sure it is available
 | |
| 			 * If not, we print an error message, set to 50MHz,
 | |
| 			 * and go on...
 | |
| 			 */
 | |
| 			if (if_idx == 0 && ddr_ref_hertz == 100000000) {
 | |
| 				/*
 | |
| 				 * Validate that the clock returned is close
 | |
| 				 * enough to the clock desired
 | |
| 				 */
 | |
| 				// FIXME: is 5% close enough?
 | |
| 				int hertz_diff =
 | |
| 				    abs((int)tmp_hertz - (int)ddr_hertz);
 | |
| 				if (hertz_diff > ((int)ddr_hertz * 5 / 100)) {
 | |
| 					// nope, diff is greater than than 5%
 | |
| 					debug("N0: DRAM init: requested 100 MHz refclk NOT FOUND\n");
 | |
| 					ddr_ref_hertz = CONFIG_REF_HERTZ;
 | |
| 					// clear the flag before trying again!!
 | |
| 					set_ddr_clock_initialized(priv, 0, 0);
 | |
| 					goto try_again;
 | |
| 				} else {
 | |
| 					debug("N0: DRAM Init: requested 100 MHz refclk FOUND and SELECTED\n");
 | |
| 				}
 | |
| 			}
 | |
| 		}
 | |
| 
 | |
| 		if (tmp_hertz > 0)
 | |
| 			calc_ddr_hertz = tmp_hertz;
 | |
| 		debug("LMC%d: measured speed: %u hz\n", if_idx, tmp_hertz);
 | |
| 	}
 | |
| 
 | |
| 	if (measured_ddr_hertz)
 | |
| 		*measured_ddr_hertz = calc_ddr_hertz;
 | |
| 
 | |
| 	memsize_mbytes = 0;
 | |
| 	for (if_idx = 0; if_idx < 4; ++if_idx) {
 | |
| 		if (!(ddr_conf_valid_mask & (1 << if_idx)))
 | |
| 			continue;
 | |
| 
 | |
| 		ret = init_octeon_dram_interface(priv, &ddr_conf[if_idx],
 | |
| 						 calc_ddr_hertz,
 | |
| 						 cpu_hertz, ddr_ref_hertz,
 | |
| 						 if_idx, ddr_conf_valid_mask);
 | |
| 		if (ret > 0)
 | |
| 			memsize_mbytes += ret;
 | |
| 	}
 | |
| 
 | |
| 	if (memsize_mbytes == 0)
 | |
| 		/* All interfaces failed to initialize, so return error */
 | |
| 		return -1;
 | |
| 
 | |
| 	/*
 | |
| 	 * switch over to DBI mode only for chips that support it, and
 | |
| 	 * enabled by envvar
 | |
| 	 */
 | |
| 	if ((octeon_is_cpuid(OCTEON_CN73XX)) ||
 | |
| 	    (octeon_is_cpuid(OCTEON_CNF75XX)) ||
 | |
| 	    (octeon_is_cpuid(OCTEON_CN78XX_PASS2_X))) {
 | |
| 		eptr = env_get("ddr_dbi_switchover");
 | |
| 		if (eptr) {
 | |
| 			printf("DBI Switchover starting...\n");
 | |
| 			cvmx_dbi_switchover(priv);
 | |
| 			printf("DBI Switchover finished.\n");
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	/* call HW-assist tuning here on chips that support it */
 | |
| 	if ((octeon_is_cpuid(OCTEON_CN73XX)) ||
 | |
| 	    (octeon_is_cpuid(OCTEON_CNF75XX)) ||
 | |
| 	    (octeon_is_cpuid(OCTEON_CN78XX_PASS2_X)))
 | |
| 		cvmx_maybe_tune_node(priv, calc_ddr_hertz);
 | |
| 
 | |
| 	eptr = env_get("limit_dram_mbytes");
 | |
| 	if (eptr) {
 | |
| 		unsigned int mbytes = simple_strtoul(eptr, NULL, 10);
 | |
| 
 | |
| 		if (mbytes > 0) {
 | |
| 			memsize_mbytes = mbytes;
 | |
| 			printf("Limiting DRAM size to %d MBytes based on limit_dram_mbytes env. variable\n",
 | |
| 			       mbytes);
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	debug("LMC Initialization complete. Total DRAM %d MB\n",
 | |
| 	      memsize_mbytes);
 | |
| 
 | |
| 	return memsize_mbytes;
 | |
| }
 | |
| 
 | |
| static int octeon_ddr_probe(struct udevice *dev)
 | |
| {
 | |
| 	struct ddr_priv *priv = dev_get_priv(dev);
 | |
| 	struct ofnode_phandle_args l2c_node;
 | |
| 	struct ddr_conf *ddr_conf_ptr;
 | |
| 	u32 ddr_conf_valid_mask = 0;
 | |
| 	u32 measured_ddr_hertz = 0;
 | |
| 	int conf_table_count;
 | |
| 	int def_ddr_freq;
 | |
| 	u32 mem_mbytes = 0;
 | |
| 	u32 ddr_hertz;
 | |
| 	u32 ddr_ref_hertz;
 | |
| 	int alt_refclk;
 | |
| 	const char *eptr;
 | |
| 	fdt_addr_t addr;
 | |
| 	u64 *ptr;
 | |
| 	u64 val;
 | |
| 	int ret;
 | |
| 	int i;
 | |
| 
 | |
| 	/* Don't try to re-init the DDR controller after relocation */
 | |
| 	if (gd->flags & GD_FLG_RELOC)
 | |
| 		return 0;
 | |
| 
 | |
| 	/*
 | |
| 	 * Dummy read all local variables into cache, so that they are
 | |
| 	 * locked in cache when the DDR code runs with flushes etc enabled
 | |
| 	 */
 | |
| 	ptr = (u64 *)_end;
 | |
| 	for (i = 0; i < (0x100000 / sizeof(u64)); i++)
 | |
| 		val = readq(ptr++);
 | |
| 
 | |
| 	/*
 | |
| 	 * The base addresses of LMC and L2C are read from the DT. This
 | |
| 	 * makes it possible to use the DDR init code without the need
 | |
| 	 * of the "node" variable, describing on which node to access. The
 | |
| 	 * node number is already included implicitly in the base addresses
 | |
| 	 * read from the DT this way.
 | |
| 	 */
 | |
| 
 | |
| 	/* Get LMC base address */
 | |
| 	priv->lmc_base = dev_remap_addr(dev);
 | |
| 	debug("%s: lmc_base=%p\n", __func__, priv->lmc_base);
 | |
| 
 | |
| 	/* Get L2C base address */
 | |
| 	ret = dev_read_phandle_with_args(dev, "l2c-handle", NULL, 0, 0,
 | |
| 					 &l2c_node);
 | |
| 	if (ret) {
 | |
| 		printf("Can't access L2C node!\n");
 | |
| 		return -ENODEV;
 | |
| 	}
 | |
| 
 | |
| 	addr = ofnode_get_addr(l2c_node.node);
 | |
| 	if (addr == FDT_ADDR_T_NONE) {
 | |
| 		printf("Can't access L2C node!\n");
 | |
| 		return -ENODEV;
 | |
| 	}
 | |
| 
 | |
| 	priv->l2c_base = map_physmem(addr, 0, MAP_NOCACHE);
 | |
| 	debug("%s: l2c_base=%p\n", __func__, priv->l2c_base);
 | |
| 
 | |
| 	ddr_conf_ptr = octeon_ddr_conf_table_get(&conf_table_count,
 | |
| 						 &def_ddr_freq);
 | |
| 	if (!ddr_conf_ptr) {
 | |
| 		printf("ERROR: unable to determine DDR configuration\n");
 | |
| 		return -ENODEV;
 | |
| 	}
 | |
| 
 | |
| 	for (i = 0; i < conf_table_count; i++) {
 | |
| 		if (ddr_conf_ptr[i].dimm_config_table[0].spd_addrs[0] ||
 | |
| 		    ddr_conf_ptr[i].dimm_config_table[0].spd_ptrs[0])
 | |
| 			ddr_conf_valid_mask |= 1 << i;
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * Check for special case of mismarked 3005 samples,
 | |
| 	 * and adjust cpuid
 | |
| 	 */
 | |
| 	alt_refclk = 0;
 | |
| 	ddr_hertz = def_ddr_freq * 1000000;
 | |
| 
 | |
| 	eptr = env_get("ddr_clock_hertz");
 | |
| 	if (eptr) {
 | |
| 		ddr_hertz = simple_strtoul(eptr, NULL, 0);
 | |
| 		gd->mem_clk = divide_nint(ddr_hertz, 1000000);
 | |
| 		printf("Parameter found in environment. ddr_clock_hertz = %d\n",
 | |
| 		       ddr_hertz);
 | |
| 	}
 | |
| 
 | |
| 	ddr_ref_hertz = octeon3_refclock(alt_refclk,
 | |
| 					 ddr_hertz,
 | |
| 					 &ddr_conf_ptr[0].dimm_config_table[0]);
 | |
| 
 | |
| 	debug("Initializing DDR, clock = %uhz, reference = %uhz\n",
 | |
| 	      ddr_hertz, ddr_ref_hertz);
 | |
| 
 | |
| 	mem_mbytes = octeon_ddr_initialize(priv, gd->cpu_clk,
 | |
| 					   ddr_hertz, ddr_ref_hertz,
 | |
| 					   ddr_conf_valid_mask,
 | |
| 					   ddr_conf_ptr, &measured_ddr_hertz);
 | |
| 	debug("Mem size in MBYTES: %u\n", mem_mbytes);
 | |
| 
 | |
| 	gd->mem_clk = divide_nint(measured_ddr_hertz, 1000000);
 | |
| 
 | |
| 	debug("Measured DDR clock %d Hz\n", measured_ddr_hertz);
 | |
| 
 | |
| 	if (measured_ddr_hertz != 0) {
 | |
| 		if (!gd->mem_clk) {
 | |
| 			/*
 | |
| 			 * If ddr_clock not set, use measured clock
 | |
| 			 * and don't warn
 | |
| 			 */
 | |
| 			gd->mem_clk = divide_nint(measured_ddr_hertz, 1000000);
 | |
| 		} else if ((measured_ddr_hertz > ddr_hertz + 3000000) ||
 | |
| 			   (measured_ddr_hertz < ddr_hertz - 3000000)) {
 | |
| 			printf("\nWARNING:\n");
 | |
| 			printf("WARNING: Measured DDR clock mismatch!  expected: %lld MHz, measured: %lldMHz, cpu clock: %lu MHz\n",
 | |
| 			       divide_nint(ddr_hertz, 1000000),
 | |
| 			       divide_nint(measured_ddr_hertz, 1000000),
 | |
| 			       gd->cpu_clk);
 | |
| 			printf("WARNING:\n\n");
 | |
| 			gd->mem_clk = divide_nint(measured_ddr_hertz, 1000000);
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if (!mem_mbytes)
 | |
| 		return -ENODEV;
 | |
| 
 | |
| 	priv->info.base = CONFIG_SYS_SDRAM_BASE;
 | |
| 	priv->info.size = MB(mem_mbytes);
 | |
| 
 | |
| 	/*
 | |
| 	 * For 6XXX generate a proper error when reading/writing
 | |
| 	 * non-existent memory locations.
 | |
| 	 */
 | |
| 	cvmx_l2c_set_big_size(priv, mem_mbytes, 0);
 | |
| 
 | |
| 	debug("Ram size %uMiB\n", mem_mbytes);
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static int octeon_get_info(struct udevice *dev, struct ram_info *info)
 | |
| {
 | |
| 	struct ddr_priv *priv = dev_get_priv(dev);
 | |
| 
 | |
| 	*info = priv->info;
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static struct ram_ops octeon_ops = {
 | |
| 	.get_info = octeon_get_info,
 | |
| };
 | |
| 
 | |
| static const struct udevice_id octeon_ids[] = {
 | |
| 	{.compatible = "cavium,octeon-7xxx-ddr4" },
 | |
| 	{ }
 | |
| };
 | |
| 
 | |
| U_BOOT_DRIVER(octeon_ddr) = {
 | |
| 	.name = "octeon_ddr",
 | |
| 	.id = UCLASS_RAM,
 | |
| 	.of_match = octeon_ids,
 | |
| 	.ops = &octeon_ops,
 | |
| 	.probe = octeon_ddr_probe,
 | |
| 	.plat_auto = sizeof(struct ddr_priv),
 | |
| };
 |