// SPDX-License-Identifier: GPL-2.0+ /* * Copyright (C) 2018 Stefan Roese * * This code is mostly based on the code extracted from this MediaTek * github repository: * * https://github.com/MediaTek-Labs/linkit-smart-uboot.git * * I was not able to find a specific license or other developers * copyrights here, so I can't add them here. * * Most functions in this file are copied from the MediaTek U-Boot * repository. Without any documentation, it was impossible to really * implement this differently. So its mostly a cleaned-up version of * the original code, with only support for the MT7628 / MT7688 SoC. */ #include #include #include #include #include "mt76xx.h" #define NUM_OF_CACHELINE 128 #define MIN_START 6 #define MIN_FINE_START 0xf #define MAX_START 7 #define MAX_FINE_START 0x0 #define CPU_FRAC_DIV 1 #if defined(CONFIG_ONBOARD_DDR2_SIZE_256MBIT) #define DRAM_BUTTOM 0x02000000 #endif #if defined(CONFIG_ONBOARD_DDR2_SIZE_512MBIT) #define DRAM_BUTTOM 0x04000000 #endif #if defined(CONFIG_ONBOARD_DDR2_SIZE_1024MBIT) #define DRAM_BUTTOM 0x08000000 #endif #if defined(CONFIG_ONBOARD_DDR2_SIZE_2048MBIT) #define DRAM_BUTTOM 0x10000000 #endif static inline void cal_memcpy(void *src, void *dst, u32 size) { u8 *psrc = (u8 *)src; u8 *pdst = (u8 *)dst; int i; for (i = 0; i < size; i++, psrc++, pdst++) *pdst = *psrc; } static inline void cal_memset(void *src, u8 pat, u32 size) { u8 *psrc = (u8 *)src; int i; for (i = 0; i < size; i++, psrc++) *psrc = pat; } #define pref_op(hint, addr) \ __asm__ __volatile__( \ ".set push\n" \ ".set noreorder\n" \ "pref %0, %1\n" \ ".set pop\n" \ : \ : "i" (hint), "R" (*(u8 *)(addr))) static inline void cal_patgen(u32 start_addr, u32 size, u32 bias) { u32 *addr = (u32 *)start_addr; int i; for (i = 0; i < size; i++) addr[i] = start_addr + i + bias; } static inline int test_loop(int k, int dqs, u32 test_dqs, u32 *coarse_dqs, u32 offs, u32 pat, u32 val) { u32 nc_addr; u32 *c_addr; int i; for (nc_addr = 0xa0000000; nc_addr < (0xa0000000 + DRAM_BUTTOM - NUM_OF_CACHELINE * 32); nc_addr += (DRAM_BUTTOM >> 6) + offs) { writel(0x00007474, (void *)MT76XX_MEMCTRL_BASE + 0x64); wmb(); /* Make sure store if finished */ c_addr = (u32 *)(nc_addr & 0xdfffffff); cal_memset(((u8 *)c_addr), 0x1F, NUM_OF_CACHELINE * 32); cal_patgen(nc_addr, NUM_OF_CACHELINE * 8, pat); if (dqs > 0) writel(0x00000074 | (((k == 1) ? coarse_dqs[dqs] : test_dqs) << 12) | (((k == 0) ? val : test_dqs) << 8), (void *)MT76XX_MEMCTRL_BASE + 0x64); else writel(0x00007400 | (((k == 1) ? coarse_dqs[dqs] : test_dqs) << 4) | (((k == 0) ? val : test_dqs) << 0), (void *)MT76XX_MEMCTRL_BASE + 0x64); wmb(); /* Make sure store if finished */ invalidate_dcache_range((u32)c_addr, (u32)c_addr + NUM_OF_CACHELINE * 32); wmb(); /* Make sure store if finished */ for (i = 0; i < NUM_OF_CACHELINE * 8; i++) { if (i % 8 == 0) pref_op(0, &c_addr[i]); } for (i = 0; i < NUM_OF_CACHELINE * 8; i++) { if (c_addr[i] != nc_addr + i + pat) return -1; } } return 0; } void ddr_calibrate(void) { u32 min_coarse_dqs[2]; u32 max_coarse_dqs[2]; u32 min_fine_dqs[2]; u32 max_fine_dqs[2]; u32 coarse_dqs[2]; u32 fine_dqs[2]; int reg = 0, ddr_cfg2_reg; int flag; int i, k; int dqs = 0; u32 min_coarse_dqs_bnd, min_fine_dqs_bnd, coarse_dqs_dll, fine_dqs_dll; u32 val; u32 fdiv = 0, frac = 0; /* Setup clock to run at full speed */ val = readl((void *)MT76XX_DYN_CFG0_REG); fdiv = (u32)((val >> 8) & 0x0F); if (CPU_FRAC_DIV < 1 || CPU_FRAC_DIV > 10) frac = val & 0x0f; else frac = CPU_FRAC_DIV; while (frac < fdiv) { val = readl((void *)MT76XX_DYN_CFG0_REG); fdiv = (val >> 8) & 0x0f; fdiv--; val &= ~(0x0f << 8); val |= (fdiv << 8); writel(val, (void *)MT76XX_DYN_CFG0_REG); udelay(500); val = readl((void *)MT76XX_DYN_CFG0_REG); fdiv = (val >> 8) & 0x0f; } clrbits_le32((void *)MT76XX_MEMCTRL_BASE + 0x10, BIT(4)); ddr_cfg2_reg = readl((void *)MT76XX_MEMCTRL_BASE + 0x48); clrbits_le32((void *)MT76XX_MEMCTRL_BASE + 0x48, (0x3 << 28) | (0x3 << 26)); min_coarse_dqs[0] = MIN_START; min_coarse_dqs[1] = MIN_START; min_fine_dqs[0] = MIN_FINE_START; min_fine_dqs[1] = MIN_FINE_START; max_coarse_dqs[0] = MAX_START; max_coarse_dqs[1] = MAX_START; max_fine_dqs[0] = MAX_FINE_START; max_fine_dqs[1] = MAX_FINE_START; dqs = 0; /* Add by KP, DQS MIN boundary */ reg = readl((void *)MT76XX_MEMCTRL_BASE + 0x20); coarse_dqs_dll = (reg & 0xf00) >> 8; fine_dqs_dll = (reg & 0xf0) >> 4; if (coarse_dqs_dll <= 8) min_coarse_dqs_bnd = 8 - coarse_dqs_dll; else min_coarse_dqs_bnd = 0; if (fine_dqs_dll <= 8) min_fine_dqs_bnd = 8 - fine_dqs_dll; else min_fine_dqs_bnd = 0; /* DQS MIN boundary */ DQS_CAL: for (k = 0; k < 2; k++) { u32 test_dqs; if (k == 0) test_dqs = MAX_START; else test_dqs = MAX_FINE_START; do { flag = test_loop(k, dqs, test_dqs, max_coarse_dqs, 0x400, 0x3, 0xf); if (flag == -1) break; test_dqs++; } while (test_dqs <= 0xf); if (k == 0) { max_coarse_dqs[dqs] = test_dqs; } else { test_dqs--; if (test_dqs == MAX_FINE_START - 1) { max_coarse_dqs[dqs]--; max_fine_dqs[dqs] = 0xf; } else { max_fine_dqs[dqs] = test_dqs; } } } for (k = 0; k < 2; k++) { u32 test_dqs; if (k == 0) test_dqs = MIN_START; else test_dqs = MIN_FINE_START; do { flag = test_loop(k, dqs, test_dqs, min_coarse_dqs, 0x480, 0x1, 0x0); if (k == 0) { if (flag == -1 || test_dqs == min_coarse_dqs_bnd) break; test_dqs--; if (test_dqs < min_coarse_dqs_bnd) break; } else { if (flag == -1) { test_dqs++; break; } else if (test_dqs == min_fine_dqs_bnd) { break; } test_dqs--; if (test_dqs < min_fine_dqs_bnd) break; } } while (test_dqs >= 0); if (k == 0) { min_coarse_dqs[dqs] = test_dqs; } else { if (test_dqs == MIN_FINE_START + 1) { min_coarse_dqs[dqs]++; min_fine_dqs[dqs] = 0x0; } else { min_fine_dqs[dqs] = test_dqs; } } } if (dqs == 0) { dqs = 1; goto DQS_CAL; } for (i = 0; i < 2; i++) { u32 temp; coarse_dqs[i] = (max_coarse_dqs[i] + min_coarse_dqs[i]) >> 1; temp = (((max_coarse_dqs[i] + min_coarse_dqs[i]) % 2) * 4) + ((max_fine_dqs[i] + min_fine_dqs[i]) >> 1); if (temp >= 0x10) { coarse_dqs[i]++; fine_dqs[i] = (temp - 0x10) + 0x8; } else { fine_dqs[i] = temp; } } reg = (coarse_dqs[1] << 12) | (fine_dqs[1] << 8) | (coarse_dqs[0] << 4) | fine_dqs[0]; clrbits_le32((void *)MT76XX_MEMCTRL_BASE + 0x10, BIT(4)); writel(reg, (void *)MT76XX_MEMCTRL_BASE + 0x64); writel(ddr_cfg2_reg, (void *)MT76XX_MEMCTRL_BASE + 0x48); setbits_le32((void *)MT76XX_MEMCTRL_BASE + 0x10, BIT(4)); for (i = 0; i < 2; i++) debug("[%02X%02X%02X%02X]", min_coarse_dqs[i], min_fine_dqs[i], max_coarse_dqs[i], max_fine_dqs[i]); debug("\nDDR Calibration DQS reg = %08X\n", reg); }