2018-09-05 13:12:35 +00:00
|
|
|
// SPDX-License-Identifier: GPL-2.0+
|
|
|
|
/*
|
|
|
|
* Copyright (C) 2018 Stefan Roese <sr@denx.de>
|
|
|
|
*
|
|
|
|
* This code is mostly based on the code extracted from this MediaTek
|
|
|
|
* github repository:
|
|
|
|
*
|
|
|
|
* https://github.com/MediaTek-Labs/linkit-smart-uboot.git
|
|
|
|
*
|
|
|
|
* I was not able to find a specific license or other developers
|
|
|
|
* copyrights here, so I can't add them here.
|
|
|
|
*
|
|
|
|
* Most functions in this file are copied from the MediaTek U-Boot
|
|
|
|
* repository. Without any documentation, it was impossible to really
|
|
|
|
* implement this differently. So its mostly a cleaned-up version of
|
|
|
|
* the original code, with only support for the MT7628 / MT7688 SoC.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <common.h>
|
2019-11-14 19:57:39 +00:00
|
|
|
#include <cpu_func.h>
|
2018-09-05 13:12:35 +00:00
|
|
|
#include <linux/io.h>
|
|
|
|
#include <asm/cacheops.h>
|
|
|
|
#include <asm/io.h>
|
|
|
|
#include "mt76xx.h"
|
|
|
|
|
|
|
|
#define NUM_OF_CACHELINE 128
|
|
|
|
#define MIN_START 6
|
|
|
|
#define MIN_FINE_START 0xf
|
|
|
|
#define MAX_START 7
|
|
|
|
#define MAX_FINE_START 0x0
|
|
|
|
|
|
|
|
#define CPU_FRAC_DIV 1
|
|
|
|
|
|
|
|
#if defined(CONFIG_ONBOARD_DDR2_SIZE_256MBIT)
|
|
|
|
#define DRAM_BUTTOM 0x02000000
|
|
|
|
#endif
|
|
|
|
#if defined(CONFIG_ONBOARD_DDR2_SIZE_512MBIT)
|
|
|
|
#define DRAM_BUTTOM 0x04000000
|
|
|
|
#endif
|
|
|
|
#if defined(CONFIG_ONBOARD_DDR2_SIZE_1024MBIT)
|
|
|
|
#define DRAM_BUTTOM 0x08000000
|
|
|
|
#endif
|
|
|
|
#if defined(CONFIG_ONBOARD_DDR2_SIZE_2048MBIT)
|
|
|
|
#define DRAM_BUTTOM 0x10000000
|
|
|
|
#endif
|
|
|
|
|
|
|
|
static inline void cal_memcpy(void *src, void *dst, u32 size)
|
|
|
|
{
|
|
|
|
u8 *psrc = (u8 *)src;
|
|
|
|
u8 *pdst = (u8 *)dst;
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < size; i++, psrc++, pdst++)
|
|
|
|
*pdst = *psrc;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void cal_memset(void *src, u8 pat, u32 size)
|
|
|
|
{
|
|
|
|
u8 *psrc = (u8 *)src;
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < size; i++, psrc++)
|
|
|
|
*psrc = pat;
|
|
|
|
}
|
|
|
|
|
|
|
|
#define pref_op(hint, addr) \
|
|
|
|
__asm__ __volatile__( \
|
|
|
|
".set push\n" \
|
|
|
|
".set noreorder\n" \
|
|
|
|
"pref %0, %1\n" \
|
|
|
|
".set pop\n" \
|
|
|
|
: \
|
|
|
|
: "i" (hint), "R" (*(u8 *)(addr)))
|
|
|
|
|
|
|
|
static inline void cal_patgen(u32 start_addr, u32 size, u32 bias)
|
|
|
|
{
|
|
|
|
u32 *addr = (u32 *)start_addr;
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < size; i++)
|
|
|
|
addr[i] = start_addr + i + bias;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int test_loop(int k, int dqs, u32 test_dqs, u32 *coarse_dqs,
|
|
|
|
u32 offs, u32 pat, u32 val)
|
|
|
|
{
|
|
|
|
u32 nc_addr;
|
|
|
|
u32 *c_addr;
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (nc_addr = 0xa0000000;
|
|
|
|
nc_addr < (0xa0000000 + DRAM_BUTTOM - NUM_OF_CACHELINE * 32);
|
|
|
|
nc_addr += (DRAM_BUTTOM >> 6) + offs) {
|
|
|
|
writel(0x00007474, (void *)MT76XX_MEMCTRL_BASE + 0x64);
|
|
|
|
wmb(); /* Make sure store if finished */
|
|
|
|
|
|
|
|
c_addr = (u32 *)(nc_addr & 0xdfffffff);
|
|
|
|
cal_memset(((u8 *)c_addr), 0x1F, NUM_OF_CACHELINE * 32);
|
|
|
|
cal_patgen(nc_addr, NUM_OF_CACHELINE * 8, pat);
|
|
|
|
|
|
|
|
if (dqs > 0)
|
|
|
|
writel(0x00000074 |
|
|
|
|
(((k == 1) ? coarse_dqs[dqs] : test_dqs) << 12) |
|
|
|
|
(((k == 0) ? val : test_dqs) << 8),
|
|
|
|
(void *)MT76XX_MEMCTRL_BASE + 0x64);
|
|
|
|
else
|
|
|
|
writel(0x00007400 |
|
|
|
|
(((k == 1) ? coarse_dqs[dqs] : test_dqs) << 4) |
|
|
|
|
(((k == 0) ? val : test_dqs) << 0),
|
|
|
|
(void *)MT76XX_MEMCTRL_BASE + 0x64);
|
|
|
|
wmb(); /* Make sure store if finished */
|
|
|
|
|
|
|
|
invalidate_dcache_range((u32)c_addr,
|
|
|
|
(u32)c_addr +
|
|
|
|
NUM_OF_CACHELINE * 32);
|
|
|
|
wmb(); /* Make sure store if finished */
|
|
|
|
|
|
|
|
for (i = 0; i < NUM_OF_CACHELINE * 8; i++) {
|
|
|
|
if (i % 8 == 0)
|
|
|
|
pref_op(0, &c_addr[i]);
|
|
|
|
}
|
|
|
|
|
|
|
|
for (i = 0; i < NUM_OF_CACHELINE * 8; i++) {
|
|
|
|
if (c_addr[i] != nc_addr + i + pat)
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
void ddr_calibrate(void)
|
|
|
|
{
|
|
|
|
u32 min_coarse_dqs[2];
|
|
|
|
u32 max_coarse_dqs[2];
|
|
|
|
u32 min_fine_dqs[2];
|
|
|
|
u32 max_fine_dqs[2];
|
|
|
|
u32 coarse_dqs[2];
|
|
|
|
u32 fine_dqs[2];
|
|
|
|
int reg = 0, ddr_cfg2_reg;
|
|
|
|
int flag;
|
|
|
|
int i, k;
|
|
|
|
int dqs = 0;
|
|
|
|
u32 min_coarse_dqs_bnd, min_fine_dqs_bnd, coarse_dqs_dll, fine_dqs_dll;
|
|
|
|
u32 val;
|
|
|
|
u32 fdiv = 0, frac = 0;
|
|
|
|
|
|
|
|
/* Setup clock to run at full speed */
|
|
|
|
val = readl((void *)MT76XX_DYN_CFG0_REG);
|
|
|
|
fdiv = (u32)((val >> 8) & 0x0F);
|
|
|
|
if (CPU_FRAC_DIV < 1 || CPU_FRAC_DIV > 10)
|
|
|
|
frac = val & 0x0f;
|
|
|
|
else
|
|
|
|
frac = CPU_FRAC_DIV;
|
|
|
|
|
|
|
|
while (frac < fdiv) {
|
|
|
|
val = readl((void *)MT76XX_DYN_CFG0_REG);
|
|
|
|
fdiv = (val >> 8) & 0x0f;
|
|
|
|
fdiv--;
|
|
|
|
val &= ~(0x0f << 8);
|
|
|
|
val |= (fdiv << 8);
|
|
|
|
writel(val, (void *)MT76XX_DYN_CFG0_REG);
|
|
|
|
udelay(500);
|
|
|
|
val = readl((void *)MT76XX_DYN_CFG0_REG);
|
|
|
|
fdiv = (val >> 8) & 0x0f;
|
|
|
|
}
|
|
|
|
|
|
|
|
clrbits_le32((void *)MT76XX_MEMCTRL_BASE + 0x10, BIT(4));
|
|
|
|
ddr_cfg2_reg = readl((void *)MT76XX_MEMCTRL_BASE + 0x48);
|
|
|
|
clrbits_le32((void *)MT76XX_MEMCTRL_BASE + 0x48,
|
|
|
|
(0x3 << 28) | (0x3 << 26));
|
|
|
|
|
|
|
|
min_coarse_dqs[0] = MIN_START;
|
|
|
|
min_coarse_dqs[1] = MIN_START;
|
|
|
|
min_fine_dqs[0] = MIN_FINE_START;
|
|
|
|
min_fine_dqs[1] = MIN_FINE_START;
|
|
|
|
max_coarse_dqs[0] = MAX_START;
|
|
|
|
max_coarse_dqs[1] = MAX_START;
|
|
|
|
max_fine_dqs[0] = MAX_FINE_START;
|
|
|
|
max_fine_dqs[1] = MAX_FINE_START;
|
|
|
|
dqs = 0;
|
|
|
|
|
|
|
|
/* Add by KP, DQS MIN boundary */
|
|
|
|
reg = readl((void *)MT76XX_MEMCTRL_BASE + 0x20);
|
|
|
|
coarse_dqs_dll = (reg & 0xf00) >> 8;
|
|
|
|
fine_dqs_dll = (reg & 0xf0) >> 4;
|
|
|
|
if (coarse_dqs_dll <= 8)
|
|
|
|
min_coarse_dqs_bnd = 8 - coarse_dqs_dll;
|
|
|
|
else
|
|
|
|
min_coarse_dqs_bnd = 0;
|
|
|
|
|
|
|
|
if (fine_dqs_dll <= 8)
|
|
|
|
min_fine_dqs_bnd = 8 - fine_dqs_dll;
|
|
|
|
else
|
|
|
|
min_fine_dqs_bnd = 0;
|
|
|
|
/* DQS MIN boundary */
|
|
|
|
|
|
|
|
DQS_CAL:
|
|
|
|
|
|
|
|
for (k = 0; k < 2; k++) {
|
|
|
|
u32 test_dqs;
|
|
|
|
|
|
|
|
if (k == 0)
|
|
|
|
test_dqs = MAX_START;
|
|
|
|
else
|
|
|
|
test_dqs = MAX_FINE_START;
|
|
|
|
|
|
|
|
do {
|
|
|
|
flag = test_loop(k, dqs, test_dqs, max_coarse_dqs,
|
|
|
|
0x400, 0x3, 0xf);
|
|
|
|
if (flag == -1)
|
|
|
|
break;
|
|
|
|
|
|
|
|
test_dqs++;
|
|
|
|
} while (test_dqs <= 0xf);
|
|
|
|
|
|
|
|
if (k == 0) {
|
|
|
|
max_coarse_dqs[dqs] = test_dqs;
|
|
|
|
} else {
|
|
|
|
test_dqs--;
|
|
|
|
|
|
|
|
if (test_dqs == MAX_FINE_START - 1) {
|
|
|
|
max_coarse_dqs[dqs]--;
|
|
|
|
max_fine_dqs[dqs] = 0xf;
|
|
|
|
} else {
|
|
|
|
max_fine_dqs[dqs] = test_dqs;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
for (k = 0; k < 2; k++) {
|
|
|
|
u32 test_dqs;
|
|
|
|
|
|
|
|
if (k == 0)
|
|
|
|
test_dqs = MIN_START;
|
|
|
|
else
|
|
|
|
test_dqs = MIN_FINE_START;
|
|
|
|
|
|
|
|
do {
|
|
|
|
flag = test_loop(k, dqs, test_dqs, min_coarse_dqs,
|
|
|
|
0x480, 0x1, 0x0);
|
|
|
|
if (k == 0) {
|
|
|
|
if (flag == -1 ||
|
|
|
|
test_dqs == min_coarse_dqs_bnd)
|
|
|
|
break;
|
|
|
|
|
|
|
|
test_dqs--;
|
|
|
|
|
|
|
|
if (test_dqs < min_coarse_dqs_bnd)
|
|
|
|
break;
|
|
|
|
} else {
|
|
|
|
if (flag == -1) {
|
|
|
|
test_dqs++;
|
|
|
|
break;
|
|
|
|
} else if (test_dqs == min_fine_dqs_bnd) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
test_dqs--;
|
|
|
|
|
|
|
|
if (test_dqs < min_fine_dqs_bnd)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
} while (test_dqs >= 0);
|
|
|
|
|
|
|
|
if (k == 0) {
|
|
|
|
min_coarse_dqs[dqs] = test_dqs;
|
|
|
|
} else {
|
|
|
|
if (test_dqs == MIN_FINE_START + 1) {
|
|
|
|
min_coarse_dqs[dqs]++;
|
|
|
|
min_fine_dqs[dqs] = 0x0;
|
|
|
|
} else {
|
|
|
|
min_fine_dqs[dqs] = test_dqs;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (dqs == 0) {
|
|
|
|
dqs = 1;
|
|
|
|
goto DQS_CAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (i = 0; i < 2; i++) {
|
|
|
|
u32 temp;
|
|
|
|
|
|
|
|
coarse_dqs[i] = (max_coarse_dqs[i] + min_coarse_dqs[i]) >> 1;
|
|
|
|
temp =
|
|
|
|
(((max_coarse_dqs[i] + min_coarse_dqs[i]) % 2) * 4) +
|
|
|
|
((max_fine_dqs[i] + min_fine_dqs[i]) >> 1);
|
|
|
|
if (temp >= 0x10) {
|
|
|
|
coarse_dqs[i]++;
|
|
|
|
fine_dqs[i] = (temp - 0x10) + 0x8;
|
|
|
|
} else {
|
|
|
|
fine_dqs[i] = temp;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
reg = (coarse_dqs[1] << 12) | (fine_dqs[1] << 8) |
|
|
|
|
(coarse_dqs[0] << 4) | fine_dqs[0];
|
|
|
|
|
|
|
|
clrbits_le32((void *)MT76XX_MEMCTRL_BASE + 0x10, BIT(4));
|
|
|
|
writel(reg, (void *)MT76XX_MEMCTRL_BASE + 0x64);
|
|
|
|
writel(ddr_cfg2_reg, (void *)MT76XX_MEMCTRL_BASE + 0x48);
|
|
|
|
setbits_le32((void *)MT76XX_MEMCTRL_BASE + 0x10, BIT(4));
|
|
|
|
|
|
|
|
for (i = 0; i < 2; i++)
|
|
|
|
debug("[%02X%02X%02X%02X]", min_coarse_dqs[i],
|
|
|
|
min_fine_dqs[i], max_coarse_dqs[i], max_fine_dqs[i]);
|
|
|
|
debug("\nDDR Calibration DQS reg = %08X\n", reg);
|
|
|
|
}
|