Merge git://git.denx.de/u-boot-usb
[oweals/u-boot.git] / arch / arm / mach-imx / ddrmc-vf610-calibration.c
1 // SPDX-License-Identifier: GPL-2.0+
2 /*
3  * ddrmc DDR3 calibration code for NXP's VF610
4  *
5  * Copyright (C) 2018 DENX Software Engineering
6  * Lukasz Majewski, DENX Software Engineering, lukma@denx.de
7  *
8  */
9 /* #define DEBUG */
10 #include <common.h>
11 #include <asm/io.h>
12 #include <asm/arch/imx-regs.h>
13 #include <linux/bitmap.h>
14
15 #include "ddrmc-vf610-calibration.h"
16
17 /*
18  * Documents:
19  *
20  * [1] "Vybrid: About DDR leveling feature on DDRMC."
21  * https://community.nxp.com/thread/395323
22  *
23  * [2] VFxxx Controller Reference Manual, Rev. 0, 10/2016
24  *
25  *
26  * NOTE
27  * ====
28  *
29  * NXP recommends setting 'fixed' parameters instead of performing the
30  * training at each boot.
31  *
32  * Use those functions to determine those values on new HW, read the
33  * calculated value from registers and add them to the board specific
34  * struct ddrmc_cr_setting.
35  *
36  * SW leveling supported operations - CR93[SW_LVL_MODE]:
37  *
38  * - 0x0 (b'00) - No leveling
39  *
40  * - 0x1 (b'01) - WRLVL_DL_X - It is not recommended to perform this tuning
41  *                             on HW designs utilizing non-flyback topology
42  *                             (Single DDR3 with x16).
43  *                             Instead the WRLVL_DL_0/1 fields shall be set
44  *                             based on trace length differences from their
45  *                             layout.
46  *                             Mismatches up to 25% or tCK (clock period) are
47  *                             allowed, so the value in the filed doesn’t have
48  *                             to be very accurate.
49  *
50  * - 0x2 (b'10) - RDLVL_DL_0/1 - refers to adjusting the DQS strobe in relation
51  *                             to the DQ signals so that the strobe edge is
52  *                             centered in the window of valid read data.
53  *
54  * - 0x3 (b'11) - RDLVL_GTDL_0/1 - refers to the delay the PHY uses to un-gate
55  *                             the Read DQS strobe pad from the time that the
56  *                             PHY enables the pad to input the strobe signal.
57  *
58  */
59 static int ddr_cal_get_first_edge_index(unsigned long *bmap, enum edge e,
60                                         int samples, int start, int max)
61 {
62         int i, ret = -1;
63
64         /*
65          * We look only for the first value (and filter out
66          * some wrong data)
67          */
68         switch (e) {
69         case RISING_EDGE:
70                 for (i = start; i <= max - samples; i++) {
71                         if (test_bit(i, bmap)) {
72                                 if (!test_bit(i - 1, bmap) &&
73                                     test_bit(i + 1, bmap) &&
74                                     test_bit(i + 2, bmap) &&
75                                     test_bit(i + 3, bmap)) {
76                                         return i;
77                                 }
78                         }
79                 }
80                 break;
81         case FALLING_EDGE:
82                 for (i = start; i <= max - samples; i++) {
83                         if (!test_bit(i, bmap)) {
84                                 if (test_bit(i - 1, bmap) &&
85                                     test_bit(i - 2, bmap) &&
86                                     test_bit(i - 3, bmap)) {
87                                         return i;
88                                 }
89                         }
90                 }
91         }
92
93         return ret;
94 }
95
96 static void bitmap_print(unsigned long *bmap, int max)
97 {
98         int i;
99
100         debug("BITMAP [0x%p]:\n", bmap);
101         for (i = 0; i <= max; i++) {
102                 debug("%d ", test_bit(i, bmap) ? 1 : 0);
103                 if (i && (i % 32) == (32 - 1))
104                         debug("\n");
105         }
106         debug("\n");
107 }
108
109 #define sw_leveling_op_done \
110         while (!(readl(&ddrmr->cr[94]) & DDRMC_CR94_SWLVL_OP_DONE))
111
112 #define sw_leveling_load_value \
113         do { clrsetbits_le32(&ddrmr->cr[93], DDRMC_CR93_SWLVL_LOAD, \
114                              DDRMC_CR93_SWLVL_LOAD); } while (0)
115
116 #define sw_leveling_start \
117         do { clrsetbits_le32(&ddrmr->cr[93], DDRMC_CR93_SWLVL_START, \
118                              DDRMC_CR93_SWLVL_START); } while (0)
119
120 #define sw_leveling_exit \
121         do { clrsetbits_le32(&ddrmr->cr[94], DDRMC_CR94_SWLVL_EXIT, \
122                              DDRMC_CR94_SWLVL_EXIT); } while (0)
123
124 /*
125  * RDLVL_DL calibration:
126  *
127  * NXP is _NOT_ recommending performing the leveling at each
128  * boot. Instead - one shall run this procedure on new boards
129  * and then use hardcoded values.
130  *
131  */
132 static int ddrmc_cal_dqs_to_dq(struct ddrmr_regs *ddrmr)
133 {
134         DECLARE_BITMAP(rdlvl_rsp, DDRMC_DQS_DQ_MAX_DELAY + 1);
135         int rdlvl_dl_0_min = -1, rdlvl_dl_0_max = -1;
136         int rdlvl_dl_1_min = -1, rdlvl_dl_1_max = -1;
137         int rdlvl_dl_0, rdlvl_dl_1;
138         u8 swlvl_rsp;
139         u32 tmp;
140         int i;
141
142         /* Read defaults */
143         u16 rdlvl_dl_0_def =
144                 (readl(&ddrmr->cr[105]) >> DDRMC_CR105_RDLVL_DL_0_OFF) & 0xFFFF;
145         u16 rdlvl_dl_1_def = readl(&ddrmr->cr[110]) & 0xFFFF;
146
147         debug("\nRDLVL: ======================\n");
148         debug("RDLVL: DQS to DQ (RDLVL)\n");
149
150         debug("RDLVL: RDLVL_DL_0_DFL:\t 0x%x\n", rdlvl_dl_0_def);
151         debug("RDLVL: RDLVL_DL_1_DFL:\t 0x%x\n", rdlvl_dl_1_def);
152
153         /*
154          * Set/Read setup for calibration
155          *
156          * Values necessary for leveling from Vybrid RM [2] - page 1600
157          */
158         writel(0x40703030, &ddrmr->cr[144]);
159         writel(0x40, &ddrmr->cr[145]);
160         writel(0x40, &ddrmr->cr[146]);
161
162         tmp = readl(&ddrmr->cr[144]);
163         debug("RDLVL: PHY_RDLVL_RES:\t 0x%x\n", (tmp >> 24) & 0xFF);// set 0x40
164         debug("RDLVL: PHY_RDLV_LOAD:\t 0x%x\n", (tmp >> 16) & 0xFF);// set 0x70
165         debug("RDLVL: PHY_RDLV_DLL:\t 0x%x\n", (tmp >> 8) & 0xFF); // set 0x30
166         debug("RDLVL: PHY_RDLV_EN:\t 0x%x\n", tmp & 0xFF); //set 0x30
167
168         tmp = readl(&ddrmr->cr[145]);
169         debug("RDLVL: PHY_RDLV_RR:\t 0x%x\n", tmp & 0x3FF); //set 0x40
170
171         tmp = readl(&ddrmr->cr[146]);
172         debug("RDLVL: PHY_RDLV_RESP:\t 0x%x\n", tmp); //set 0x40
173
174         /*
175          * Program/read the leveling edge RDLVL_EDGE = 0
176          *
177          * 0x00 is the correct output on SWLVL_RSP_X
178          * If by any chance 1s are visible -> wrong number read
179          */
180         clrbits_le32(&ddrmr->cr[101], DDRMC_CR101_PHY_RDLVL_EDGE);
181
182         tmp = readl(&ddrmr->cr[101]);
183         debug("RDLVL: PHY_RDLVL_EDGE:\t 0x%x\n",
184               (tmp >> DDRMC_CR101_PHY_RDLVL_EDGE_OFF) & 0x1); //set 0
185
186         /* Program Leveling mode - CR93[SW_LVL_MODE] to ’b10 */
187         clrsetbits_le32(&ddrmr->cr[93], DDRMC_CR93_SW_LVL_MODE(0x3),
188                         DDRMC_CR93_SW_LVL_MODE(0x2));
189         tmp = readl(&ddrmr->cr[93]);
190         debug("RDLVL: SW_LVL_MODE:\t 0x%x\n",
191               (tmp >> DDRMC_CR93_SW_LVL_MODE_OFF) & 0x3);
192
193         /* Start procedure - CR93[SWLVL_START] to ’b1 */
194         sw_leveling_start;
195
196         /* Poll CR94[SWLVL_OP_DONE] */
197         sw_leveling_op_done;
198
199         /*
200          * Program delays for RDLVL_DL_0
201          *
202          * The procedure is to increase the delay values from 0 to 0xFF
203          * and read the response from the DDRMC
204          */
205         debug("\nRDLVL: ---> RDLVL_DL_0\n");
206         bitmap_zero(rdlvl_rsp, DDRMC_DQS_DQ_MAX_DELAY + 1);
207
208         for (i = 0; i <= DDRMC_DQS_DQ_MAX_DELAY; i++) {
209                 clrsetbits_le32(&ddrmr->cr[105],
210                                 0xFFFF << DDRMC_CR105_RDLVL_DL_0_OFF,
211                                 i << DDRMC_CR105_RDLVL_DL_0_OFF);
212
213                 /* Load values CR93[SWLVL_LOAD] to ’b1 */
214                 sw_leveling_load_value;
215
216                 /* Poll CR94[SWLVL_OP_DONE] */
217                 sw_leveling_op_done;
218
219                 /*
220                  * Read Responses - SWLVL_RESP_0
221                  *
222                  * The 0x00 (correct response when PHY_RDLVL_EDGE = 0)
223                  * -> 1 in the bit vector
224                  */
225                 swlvl_rsp = (readl(&ddrmr->cr[94]) >>
226                              DDRMC_CR94_SWLVL_RESP_0_OFF) & 0xF;
227                 if (swlvl_rsp == 0)
228                         generic_set_bit(i, rdlvl_rsp);
229         }
230
231         bitmap_print(rdlvl_rsp, DDRMC_DQS_DQ_MAX_DELAY);
232
233         /*
234          * First test for rising edge 0x0 -> 0x1 in bitmap
235          */
236         rdlvl_dl_0_min = ddr_cal_get_first_edge_index(rdlvl_rsp, RISING_EDGE,
237                                                       N_SAMPLES, N_SAMPLES,
238                                                       DDRMC_DQS_DQ_MAX_DELAY);
239
240         /*
241          * Secondly test for falling edge 0x1 -> 0x0 in bitmap
242          */
243         rdlvl_dl_0_max = ddr_cal_get_first_edge_index(rdlvl_rsp, FALLING_EDGE,
244                                                       N_SAMPLES, rdlvl_dl_0_min,
245                                                       DDRMC_DQS_DQ_MAX_DELAY);
246
247         debug("RDLVL: DL_0 min: %d [0x%x] DL_0 max: %d [0x%x]\n",
248               rdlvl_dl_0_min, rdlvl_dl_0_min, rdlvl_dl_0_max, rdlvl_dl_0_max);
249         rdlvl_dl_0 = (rdlvl_dl_0_max - rdlvl_dl_0_min) / 2;
250
251         if (rdlvl_dl_0_max == -1 || rdlvl_dl_0_min == -1 || rdlvl_dl_0 <= 0) {
252                 debug("RDLVL: The DQS to DQ delay cannot be found!\n");
253                 debug("RDLVL: Using default - slice 0: %d!\n", rdlvl_dl_0_def);
254                 rdlvl_dl_0 = rdlvl_dl_0_def;
255         }
256
257         debug("\nRDLVL: ---> RDLVL_DL_1\n");
258         bitmap_zero(rdlvl_rsp, DDRMC_DQS_DQ_MAX_DELAY + 1);
259
260         for (i = 0; i <= DDRMC_DQS_DQ_MAX_DELAY; i++) {
261                 clrsetbits_le32(&ddrmr->cr[110],
262                                 0xFFFF << DDRMC_CR110_RDLVL_DL_1_OFF,
263                                 i << DDRMC_CR110_RDLVL_DL_1_OFF);
264
265                 /* Load values CR93[SWLVL_LOAD] to ’b1 */
266                 sw_leveling_load_value;
267
268                 /* Poll CR94[SWLVL_OP_DONE] */
269                 sw_leveling_op_done;
270
271                 /*
272                  * Read Responses - SWLVL_RESP_1
273                  *
274                  * The 0x00 (correct response when PHY_RDLVL_EDGE = 0)
275                  * -> 1 in the bit vector
276                  */
277                 swlvl_rsp = (readl(&ddrmr->cr[95]) >>
278                              DDRMC_CR95_SWLVL_RESP_1_OFF) & 0xF;
279                 if (swlvl_rsp == 0)
280                         generic_set_bit(i, rdlvl_rsp);
281         }
282
283         bitmap_print(rdlvl_rsp, DDRMC_DQS_DQ_MAX_DELAY);
284
285         /*
286          * First test for rising edge 0x0 -> 0x1 in bitmap
287          */
288         rdlvl_dl_1_min = ddr_cal_get_first_edge_index(rdlvl_rsp, RISING_EDGE,
289                                                       N_SAMPLES, N_SAMPLES,
290                                                       DDRMC_DQS_DQ_MAX_DELAY);
291
292         /*
293          * Secondly test for falling edge 0x1 -> 0x0 in bitmap
294          */
295         rdlvl_dl_1_max = ddr_cal_get_first_edge_index(rdlvl_rsp, FALLING_EDGE,
296                                                       N_SAMPLES, rdlvl_dl_1_min,
297                                                       DDRMC_DQS_DQ_MAX_DELAY);
298
299         debug("RDLVL: DL_1 min: %d [0x%x] DL_1 max: %d [0x%x]\n",
300               rdlvl_dl_1_min, rdlvl_dl_1_min, rdlvl_dl_1_max, rdlvl_dl_1_max);
301         rdlvl_dl_1 = (rdlvl_dl_1_max - rdlvl_dl_1_min) / 2;
302
303         if (rdlvl_dl_1_max == -1 || rdlvl_dl_1_min == -1 || rdlvl_dl_1 <= 0) {
304                 debug("RDLVL: The DQS to DQ delay cannot be found!\n");
305                 debug("RDLVL: Using default - slice 1: %d!\n", rdlvl_dl_1_def);
306                 rdlvl_dl_1 = rdlvl_dl_1_def;
307         }
308
309         debug("RDLVL: CALIBRATED: rdlvl_dl_0: 0x%x\t rdlvl_dl_1: 0x%x\n",
310               rdlvl_dl_0, rdlvl_dl_1);
311
312         /* Write new delay values */
313         writel(DDRMC_CR105_RDLVL_DL_0(rdlvl_dl_0), &ddrmr->cr[105]);
314         writel(DDRMC_CR110_RDLVL_DL_1(rdlvl_dl_1), &ddrmr->cr[110]);
315
316         sw_leveling_load_value;
317         sw_leveling_op_done;
318
319         /* Exit procedure - CR94[SWLVL_EXIT] to ’b1 */
320         sw_leveling_exit;
321
322         /* Poll CR94[SWLVL_OP_DONE] */
323         sw_leveling_op_done;
324
325         return 0;
326 }
327
328 /*
329  * WRLVL_DL calibration:
330  *
331  * For non-flyback memory architecture - where one have a single DDR3 x16
332  * memory - it is NOT necessary to perform "Write Leveling"
333  * [3] 'Vybrid DDR3 write leveling' https://community.nxp.com/thread/429362
334  *
335  */
336
337 int ddrmc_calibration(struct ddrmr_regs *ddrmr)
338 {
339         ddrmc_cal_dqs_to_dq(ddrmr);
340
341         return 0;
342 }