ram: rk3399: Add pctl start support
[oweals/u-boot.git] / drivers / ram / rockchip / sdram_rk3399.c
1 // SPDX-License-Identifier: GPL-2.0+ OR BSD-3-Clause
2 /*
3  * (C) Copyright 2016-2017 Rockchip Inc.
4  *
5  * Adapted from coreboot.
6  */
7
8 #include <common.h>
9 #include <clk.h>
10 #include <dm.h>
11 #include <dt-structs.h>
12 #include <ram.h>
13 #include <regmap.h>
14 #include <syscon.h>
15 #include <asm/io.h>
16 #include <asm/arch-rockchip/clock.h>
17 #include <asm/arch-rockchip/cru_rk3399.h>
18 #include <asm/arch-rockchip/grf_rk3399.h>
19 #include <asm/arch-rockchip/hardware.h>
20 #include <asm/arch-rockchip/sdram_common.h>
21 #include <asm/arch-rockchip/sdram_rk3399.h>
22 #include <linux/err.h>
23 #include <time.h>
24
/*
 * Hold-control values: each macro sets bit (pos + 16) and places n at
 * bit pos (pos = 6, 7, 8 respectively).
 * NOTE(review): the "+ 16" bit looks like a write-enable mask for the
 * low half-word - confirm against the register description.
 */
25 #define PRESET_SGRF_HOLD(n)     ((0x1 << (6 + 16)) | ((n) << 6))
26 #define PRESET_GPIO0_HOLD(n)    ((0x1 << (7 + 16)) | ((n) << 7))
27 #define PRESET_GPIO1_HOLD(n)    ((0x1 << (8 + 16)) | ((n) << 8))
28
/*
 * 4-bit PHY drive-strength / termination select codes, used for the
 * tsel_*_select fields programmed by set_ds_odt().
 * NOTE(review): the numeric suffixes presumably give the impedance in
 * ohms (34_3 = 34.3) - confirm against the PHY databook.
 */
29 #define PHY_DRV_ODT_HI_Z        0x0
30 #define PHY_DRV_ODT_240         0x1
31 #define PHY_DRV_ODT_120         0x8
32 #define PHY_DRV_ODT_80          0x9
33 #define PHY_DRV_ODT_60          0xc
34 #define PHY_DRV_ODT_48          0xd
35 #define PHY_DRV_ODT_40          0xe
36 #define PHY_DRV_ODT_34_3        0xf
37
/*
 * Soft-reset values written to cru->softrst_con[4] by rkclk_ddr_reset().
 * For channel ch the controller reset is bit (8 + ch * 4) and the PHY
 * reset is bit (9 + ch * 4); the same bit position + 16 is always set.
 * n is the level to program into the reset bit.
 */
38 #define CRU_SFTRST_DDR_CTRL(ch, n)      ((0x1 << (8 + 16 + (ch) * 4)) | \
39                                         ((n) << (8 + (ch) * 4)))
40 #define CRU_SFTRST_DDR_PHY(ch, n)       ((0x1 << (9 + 16 + (ch) * 4)) | \
41                                         ((n) << (9 + (ch) * 4)))
/*
 * Register block pointers for one DRAM channel:
 *   pctl - controller registers (accessed as pctl->denali_ctl[])
 *   pi   - PI registers (accessed as pi->denali_pi[])
 *   publ - PHY registers (accessed as publ->denali_phy[])
 *   msch - msch registers (not used in the code visible here)
 */
42 struct chan_info {
43         struct rk3399_ddr_pctl_regs *pctl;
44         struct rk3399_ddr_pi_regs *pi;
45         struct rk3399_ddr_publ_regs *publ;
46         struct rk3399_msch_regs *msch;
47 };
48
/*
 * Driver state.
 *
 * The members inside the #if are only present in the TPL build, or in
 * the SPL build when no TPL is configured; 'info' and 'pmugrf' are
 * present in every build.
 *
 * pwrup_srefresh_exit[] holds, per channel, the PWRUP_SREFRESH_EXIT bits
 * that pctl_cfg() saves from CTL_68 and pctl_start() restores.
 * chan[] holds the per-channel register pointers.
 */
49 struct dram_info {
50 #if defined(CONFIG_TPL_BUILD) || \
51         (!defined(CONFIG_TPL) && defined(CONFIG_SPL_BUILD))
52         u32 pwrup_srefresh_exit[2];
53         struct chan_info chan[2];
54         struct clk ddr_clk;
55         struct rk3399_cru *cru;
56         struct rk3399_grf_regs *grf;
57         struct rk3399_pmucru *pmucru;
58         struct rk3399_pmusgrf_regs *pmusgrf;
59         struct rk3399_ddr_cic_regs *cic;
60 #endif
61         struct ram_info info;
62         struct rk3399_pmugrf_regs *pmugrf;
63 };
64
65 #if defined(CONFIG_TPL_BUILD) || \
66         (!defined(CONFIG_TPL) && defined(CONFIG_SPL_BUILD))
67
/*
 * Platform data for the DMC device.
 *
 * With OF_PLATDATA enabled the structure carries the generated
 * dtd_rockchip_rk3399_dmc record; otherwise it carries the SDRAM
 * parameter set directly. 'map' is a regmap handle in both cases.
 */
68 struct rockchip_dmc_plat {
69 #if CONFIG_IS_ENABLED(OF_PLATDATA)
70         struct dtd_rockchip_rk3399_dmc dtplat;
71 #else
72         struct rk3399_sdram_params sdram_params;
73 #endif
74         struct regmap *map;
75 };
76
77 static void *get_ddrc0_con(struct dram_info *dram, u8 channel)
78 {
79         return (channel == 0) ? &dram->grf->ddrc0_con0 : &dram->grf->ddrc0_con1;
80 }
81
82 static void copy_to_reg(u32 *dest, const u32 *src, u32 n)
83 {
84         int i;
85
86         for (i = 0; i < n / sizeof(u32); i++) {
87                 writel(*src, dest);
88                 src++;
89                 dest++;
90         }
91 }
92
93 static void rkclk_ddr_reset(struct rk3399_cru *cru, u32 channel, u32 ctl,
94                             u32 phy)
95 {
96         channel &= 0x1;
97         ctl &= 0x1;
98         phy &= 0x1;
99         writel(CRU_SFTRST_DDR_CTRL(channel, ctl) |
100                                    CRU_SFTRST_DDR_PHY(channel, phy),
101                                    &cru->softrst_con[4]);
102 }
103
104 static void phy_pctrl_reset(struct rk3399_cru *cru,  u32 channel)
105 {
106         rkclk_ddr_reset(cru, channel, 1, 1);
107         udelay(10);
108
109         rkclk_ddr_reset(cru, channel, 1, 0);
110         udelay(10);
111
112         rkclk_ddr_reset(cru, channel, 0, 0);
113         udelay(10);
114 }
115
116 static void phy_dll_bypass_set(struct rk3399_ddr_publ_regs *ddr_publ_regs,
117                                u32 freq)
118 {
119         u32 *denali_phy = ddr_publ_regs->denali_phy;
120
121         /* From IP spec, only freq small than 125 can enter dll bypass mode */
122         if (freq <= 125) {
123                 /* phy_sw_master_mode_X PHY_86/214/342/470 4bits offset_8 */
124                 setbits_le32(&denali_phy[86], (0x3 << 2) << 8);
125                 setbits_le32(&denali_phy[214], (0x3 << 2) << 8);
126                 setbits_le32(&denali_phy[342], (0x3 << 2) << 8);
127                 setbits_le32(&denali_phy[470], (0x3 << 2) << 8);
128
129                 /* phy_adrctl_sw_master_mode PHY_547/675/803 4bits offset_16 */
130                 setbits_le32(&denali_phy[547], (0x3 << 2) << 16);
131                 setbits_le32(&denali_phy[675], (0x3 << 2) << 16);
132                 setbits_le32(&denali_phy[803], (0x3 << 2) << 16);
133         } else {
134                 /* phy_sw_master_mode_X PHY_86/214/342/470 4bits offset_8 */
135                 clrbits_le32(&denali_phy[86], (0x3 << 2) << 8);
136                 clrbits_le32(&denali_phy[214], (0x3 << 2) << 8);
137                 clrbits_le32(&denali_phy[342], (0x3 << 2) << 8);
138                 clrbits_le32(&denali_phy[470], (0x3 << 2) << 8);
139
140                 /* phy_adrctl_sw_master_mode PHY_547/675/803 4bits offset_16 */
141                 clrbits_le32(&denali_phy[547], (0x3 << 2) << 16);
142                 clrbits_le32(&denali_phy[675], (0x3 << 2) << 16);
143                 clrbits_le32(&denali_phy[803], (0x3 << 2) << 16);
144         }
145 }
146
147 static void set_memory_map(const struct chan_info *chan, u32 channel,
148                            const struct rk3399_sdram_params *params)
149 {
150         const struct rk3399_sdram_channel *sdram_ch = &params->ch[channel];
151         u32 *denali_ctl = chan->pctl->denali_ctl;
152         u32 *denali_pi = chan->pi->denali_pi;
153         u32 cs_map;
154         u32 reduc;
155         u32 row;
156
157         /* Get row number from ddrconfig setting */
158         if (sdram_ch->cap_info.ddrconfig < 2 ||
159             sdram_ch->cap_info.ddrconfig == 4)
160                 row = 16;
161         else if (sdram_ch->cap_info.ddrconfig == 3)
162                 row = 14;
163         else
164                 row = 15;
165
166         cs_map = (sdram_ch->cap_info.rank > 1) ? 3 : 1;
167         reduc = (sdram_ch->cap_info.bw == 2) ? 0 : 1;
168
169         /* Set the dram configuration to ctrl */
170         clrsetbits_le32(&denali_ctl[191], 0xF, (12 - sdram_ch->cap_info.col));
171         clrsetbits_le32(&denali_ctl[190], (0x3 << 16) | (0x7 << 24),
172                         ((3 - sdram_ch->cap_info.bk) << 16) |
173                         ((16 - row) << 24));
174
175         clrsetbits_le32(&denali_ctl[196], 0x3 | (1 << 16),
176                         cs_map | (reduc << 16));
177
178         /* PI_199 PI_COL_DIFF:RW:0:4 */
179         clrsetbits_le32(&denali_pi[199], 0xF, (12 - sdram_ch->cap_info.col));
180
181         /* PI_155 PI_ROW_DIFF:RW:24:3 PI_BANK_DIFF:RW:16:2 */
182         clrsetbits_le32(&denali_pi[155], (0x3 << 16) | (0x7 << 24),
183                         ((3 - sdram_ch->cap_info.bk) << 16) |
184                         ((16 - row) << 24));
185         /* PI_41 PI_CS_MAP:RW:24:4 */
186         clrsetbits_le32(&denali_pi[41], 0xf << 24, cs_map << 24);
187         if (sdram_ch->cap_info.rank == 1 && params->base.dramtype == DDR3)
188                 writel(0x2EC7FFFF, &denali_pi[34]);
189 }
190
191 static void set_ds_odt(const struct chan_info *chan,
192                        const struct rk3399_sdram_params *params)
193 {
194         u32 *denali_phy = chan->publ->denali_phy;
195
196         u32 tsel_idle_en, tsel_wr_en, tsel_rd_en;
197         u32 tsel_idle_select_p, tsel_rd_select_p;
198         u32 tsel_idle_select_n, tsel_rd_select_n;
199         u32 tsel_wr_select_dq_p, tsel_wr_select_ca_p;
200         u32 tsel_wr_select_dq_n, tsel_wr_select_ca_n;
201         u32 reg_value;
202
203         if (params->base.dramtype == LPDDR4) {
204                 tsel_rd_select_p = PHY_DRV_ODT_HI_Z;
205                 tsel_rd_select_n = PHY_DRV_ODT_240;
206
207                 tsel_idle_select_p = PHY_DRV_ODT_HI_Z;
208                 tsel_idle_select_n = PHY_DRV_ODT_240;
209
210                 tsel_wr_select_dq_p = PHY_DRV_ODT_40;
211                 tsel_wr_select_dq_n = PHY_DRV_ODT_40;
212
213                 tsel_wr_select_ca_p = PHY_DRV_ODT_40;
214                 tsel_wr_select_ca_n = PHY_DRV_ODT_40;
215         } else if (params->base.dramtype == LPDDR3) {
216                 tsel_rd_select_p = PHY_DRV_ODT_240;
217                 tsel_rd_select_n = PHY_DRV_ODT_HI_Z;
218
219                 tsel_idle_select_p = PHY_DRV_ODT_240;
220                 tsel_idle_select_n = PHY_DRV_ODT_HI_Z;
221
222                 tsel_wr_select_dq_p = PHY_DRV_ODT_34_3;
223                 tsel_wr_select_dq_n = PHY_DRV_ODT_34_3;
224
225                 tsel_wr_select_ca_p = PHY_DRV_ODT_48;
226                 tsel_wr_select_ca_n = PHY_DRV_ODT_48;
227         } else {
228                 tsel_rd_select_p = PHY_DRV_ODT_240;
229                 tsel_rd_select_n = PHY_DRV_ODT_240;
230
231                 tsel_idle_select_p = PHY_DRV_ODT_240;
232                 tsel_idle_select_n = PHY_DRV_ODT_240;
233
234                 tsel_wr_select_dq_p = PHY_DRV_ODT_34_3;
235                 tsel_wr_select_dq_n = PHY_DRV_ODT_34_3;
236
237                 tsel_wr_select_ca_p = PHY_DRV_ODT_34_3;
238                 tsel_wr_select_ca_n = PHY_DRV_ODT_34_3;
239         }
240
241         if (params->base.odt == 1)
242                 tsel_rd_en = 1;
243         else
244                 tsel_rd_en = 0;
245
246         tsel_wr_en = 0;
247         tsel_idle_en = 0;
248
249         /*
250          * phy_dq_tsel_select_X 24bits DENALI_PHY_6/134/262/390 offset_0
251          * sets termination values for read/idle cycles and drive strength
252          * for write cycles for DQ/DM
253          */
254         reg_value = tsel_rd_select_n | (tsel_rd_select_p << 0x4) |
255                     (tsel_wr_select_dq_n << 8) | (tsel_wr_select_dq_p << 12) |
256                     (tsel_idle_select_n << 16) | (tsel_idle_select_p << 20);
257         clrsetbits_le32(&denali_phy[6], 0xffffff, reg_value);
258         clrsetbits_le32(&denali_phy[134], 0xffffff, reg_value);
259         clrsetbits_le32(&denali_phy[262], 0xffffff, reg_value);
260         clrsetbits_le32(&denali_phy[390], 0xffffff, reg_value);
261
262         /*
263          * phy_dqs_tsel_select_X 24bits DENALI_PHY_7/135/263/391 offset_0
264          * sets termination values for read/idle cycles and drive strength
265          * for write cycles for DQS
266          */
267         clrsetbits_le32(&denali_phy[7], 0xffffff, reg_value);
268         clrsetbits_le32(&denali_phy[135], 0xffffff, reg_value);
269         clrsetbits_le32(&denali_phy[263], 0xffffff, reg_value);
270         clrsetbits_le32(&denali_phy[391], 0xffffff, reg_value);
271
272         /* phy_adr_tsel_select_ 8bits DENALI_PHY_544/672/800 offset_0 */
273         reg_value = tsel_wr_select_ca_n | (tsel_wr_select_ca_p << 0x4);
274         clrsetbits_le32(&denali_phy[544], 0xff, reg_value);
275         clrsetbits_le32(&denali_phy[672], 0xff, reg_value);
276         clrsetbits_le32(&denali_phy[800], 0xff, reg_value);
277
278         /* phy_pad_addr_drive 8bits DENALI_PHY_928 offset_0 */
279         clrsetbits_le32(&denali_phy[928], 0xff, reg_value);
280
281         /* phy_pad_rst_drive 8bits DENALI_PHY_937 offset_0 */
282         clrsetbits_le32(&denali_phy[937], 0xff, reg_value);
283
284         /* phy_pad_cke_drive 8bits DENALI_PHY_935 offset_0 */
285         clrsetbits_le32(&denali_phy[935], 0xff, reg_value);
286
287         /* phy_pad_cs_drive 8bits DENALI_PHY_939 offset_0 */
288         clrsetbits_le32(&denali_phy[939], 0xff, reg_value);
289
290         /* phy_pad_clk_drive 8bits DENALI_PHY_929 offset_0 */
291         clrsetbits_le32(&denali_phy[929], 0xff, reg_value);
292
293         /* phy_pad_fdbk_drive 23bit DENALI_PHY_924/925 */
294         clrsetbits_le32(&denali_phy[924], 0xff,
295                         tsel_wr_select_dq_n | (tsel_wr_select_dq_p << 4));
296         clrsetbits_le32(&denali_phy[925], 0xff,
297                         tsel_rd_select_n | (tsel_rd_select_p << 4));
298
299         /* phy_dq_tsel_enable_X 3bits DENALI_PHY_5/133/261/389 offset_16 */
300         reg_value = (tsel_rd_en | (tsel_wr_en << 1) | (tsel_idle_en << 2))
301                 << 16;
302         clrsetbits_le32(&denali_phy[5], 0x7 << 16, reg_value);
303         clrsetbits_le32(&denali_phy[133], 0x7 << 16, reg_value);
304         clrsetbits_le32(&denali_phy[261], 0x7 << 16, reg_value);
305         clrsetbits_le32(&denali_phy[389], 0x7 << 16, reg_value);
306
307         /* phy_dqs_tsel_enable_X 3bits DENALI_PHY_6/134/262/390 offset_24 */
308         reg_value = (tsel_rd_en | (tsel_wr_en << 1) | (tsel_idle_en << 2))
309                 << 24;
310         clrsetbits_le32(&denali_phy[6], 0x7 << 24, reg_value);
311         clrsetbits_le32(&denali_phy[134], 0x7 << 24, reg_value);
312         clrsetbits_le32(&denali_phy[262], 0x7 << 24, reg_value);
313         clrsetbits_le32(&denali_phy[390], 0x7 << 24, reg_value);
314
315         /* phy_adr_tsel_enable_ 1bit DENALI_PHY_518/646/774 offset_8 */
316         reg_value = tsel_wr_en << 8;
317         clrsetbits_le32(&denali_phy[518], 0x1 << 8, reg_value);
318         clrsetbits_le32(&denali_phy[646], 0x1 << 8, reg_value);
319         clrsetbits_le32(&denali_phy[774], 0x1 << 8, reg_value);
320
321         /* phy_pad_addr_term tsel 1bit DENALI_PHY_933 offset_17 */
322         reg_value = tsel_wr_en << 17;
323         clrsetbits_le32(&denali_phy[933], 0x1 << 17, reg_value);
324         /*
325          * pad_rst/cke/cs/clk_term tsel 1bits
326          * DENALI_PHY_938/936/940/934 offset_17
327          */
328         clrsetbits_le32(&denali_phy[938], 0x1 << 17, reg_value);
329         clrsetbits_le32(&denali_phy[936], 0x1 << 17, reg_value);
330         clrsetbits_le32(&denali_phy[940], 0x1 << 17, reg_value);
331         clrsetbits_le32(&denali_phy[934], 0x1 << 17, reg_value);
332
333         /* phy_pad_fdbk_term 1bit DENALI_PHY_930 offset_17 */
334         clrsetbits_le32(&denali_phy[930], 0x1 << 17, reg_value);
335 }
336
337 static void pctl_start(struct dram_info *dram, u8 channel)
338 {
339         const struct chan_info *chan = &dram->chan[channel];
340         u32 *denali_ctl = chan->pctl->denali_ctl;
341         u32 *denali_phy = chan->publ->denali_phy;
342         u32 *ddrc0_con = get_ddrc0_con(dram, channel);
343         u32 count = 0;
344         u32 byte, tmp;
345
346         writel(0x01000000, &ddrc0_con);
347
348         clrsetbits_le32(&denali_phy[957], 0x3 << 24, 0x2 << 24);
349
350         while (!(readl(&denali_ctl[203]) & (1 << 3))) {
351                 if (count > 1000) {
352                         printf("%s: Failed to init pctl for channel %d\n",
353                                __func__, channel);
354                         while (1)
355                                 ;
356                 }
357
358                 udelay(1);
359                 count++;
360         }
361
362         writel(0x01000100, &ddrc0_con);
363
364         for (byte = 0; byte < 4; byte++) {
365                 tmp = 0x820;
366                 writel((tmp << 16) | tmp, &denali_phy[53 + (128 * byte)]);
367                 writel((tmp << 16) | tmp, &denali_phy[54 + (128 * byte)]);
368                 writel((tmp << 16) | tmp, &denali_phy[55 + (128 * byte)]);
369                 writel((tmp << 16) | tmp, &denali_phy[56 + (128 * byte)]);
370                 writel((tmp << 16) | tmp, &denali_phy[57 + (128 * byte)]);
371
372                 clrsetbits_le32(&denali_phy[58 + (128 * byte)], 0xffff, tmp);
373         }
374
375         clrsetbits_le32(&denali_ctl[68], PWRUP_SREFRESH_EXIT,
376                         dram->pwrup_srefresh_exit[channel]);
377 }
378
379 static int phy_io_config(const struct chan_info *chan,
380                          const struct rk3399_sdram_params *params)
381 {
382         u32 *denali_phy = chan->publ->denali_phy;
383         u32 vref_mode_dq, vref_value_dq, vref_mode_ac, vref_value_ac;
384         u32 mode_sel;
385         u32 reg_value;
386         u32 drv_value, odt_value;
387         u32 speed;
388
389         /* vref setting */
390         if (params->base.dramtype == LPDDR4) {
391                 /* LPDDR4 */
392                 vref_mode_dq = 0x6;
393                 vref_value_dq = 0x1f;
394                 vref_mode_ac = 0x6;
395                 vref_value_ac = 0x1f;
396         } else if (params->base.dramtype == LPDDR3) {
397                 if (params->base.odt == 1) {
398                         vref_mode_dq = 0x5;  /* LPDDR3 ODT */
399                         drv_value = (readl(&denali_phy[6]) >> 12) & 0xf;
400                         odt_value = (readl(&denali_phy[6]) >> 4) & 0xf;
401                         if (drv_value == PHY_DRV_ODT_48) {
402                                 switch (odt_value) {
403                                 case PHY_DRV_ODT_240:
404                                         vref_value_dq = 0x16;
405                                         break;
406                                 case PHY_DRV_ODT_120:
407                                         vref_value_dq = 0x26;
408                                         break;
409                                 case PHY_DRV_ODT_60:
410                                         vref_value_dq = 0x36;
411                                         break;
412                                 default:
413                                         debug("Invalid ODT value.\n");
414                                         return -EINVAL;
415                                 }
416                         } else if (drv_value == PHY_DRV_ODT_40) {
417                                 switch (odt_value) {
418                                 case PHY_DRV_ODT_240:
419                                         vref_value_dq = 0x19;
420                                         break;
421                                 case PHY_DRV_ODT_120:
422                                         vref_value_dq = 0x23;
423                                         break;
424                                 case PHY_DRV_ODT_60:
425                                         vref_value_dq = 0x31;
426                                         break;
427                                 default:
428                                         debug("Invalid ODT value.\n");
429                                         return -EINVAL;
430                                 }
431                         } else if (drv_value == PHY_DRV_ODT_34_3) {
432                                 switch (odt_value) {
433                                 case PHY_DRV_ODT_240:
434                                         vref_value_dq = 0x17;
435                                         break;
436                                 case PHY_DRV_ODT_120:
437                                         vref_value_dq = 0x20;
438                                         break;
439                                 case PHY_DRV_ODT_60:
440                                         vref_value_dq = 0x2e;
441                                         break;
442                                 default:
443                                         debug("Invalid ODT value.\n");
444                                         return -EINVAL;
445                                 }
446                         } else {
447                                 debug("Invalid DRV value.\n");
448                                 return -EINVAL;
449                         }
450                 } else {
451                         vref_mode_dq = 0x2;  /* LPDDR3 */
452                         vref_value_dq = 0x1f;
453                 }
454                 vref_mode_ac = 0x2;
455                 vref_value_ac = 0x1f;
456         } else if (params->base.dramtype == DDR3) {
457                 /* DDR3L */
458                 vref_mode_dq = 0x1;
459                 vref_value_dq = 0x1f;
460                 vref_mode_ac = 0x1;
461                 vref_value_ac = 0x1f;
462         } else {
463                 debug("Unknown DRAM type.\n");
464                 return -EINVAL;
465         }
466
467         reg_value = (vref_mode_dq << 9) | (0x1 << 8) | vref_value_dq;
468
469         /* PHY_913 PHY_PAD_VREF_CTRL_DQ_0 12bits offset_8 */
470         clrsetbits_le32(&denali_phy[913], 0xfff << 8, reg_value << 8);
471         /* PHY_914 PHY_PAD_VREF_CTRL_DQ_1 12bits offset_0 */
472         clrsetbits_le32(&denali_phy[914], 0xfff, reg_value);
473         /* PHY_914 PHY_PAD_VREF_CTRL_DQ_2 12bits offset_16 */
474         clrsetbits_le32(&denali_phy[914], 0xfff << 16, reg_value << 16);
475         /* PHY_915 PHY_PAD_VREF_CTRL_DQ_3 12bits offset_0 */
476         clrsetbits_le32(&denali_phy[915], 0xfff, reg_value);
477
478         reg_value = (vref_mode_ac << 9) | (0x1 << 8) | vref_value_ac;
479
480         /* PHY_915 PHY_PAD_VREF_CTRL_AC 12bits offset_16 */
481         clrsetbits_le32(&denali_phy[915], 0xfff << 16, reg_value << 16);
482
483         if (params->base.dramtype == LPDDR4)
484                 mode_sel = 0x6;
485         else if (params->base.dramtype == LPDDR3)
486                 mode_sel = 0x0;
487         else if (params->base.dramtype == DDR3)
488                 mode_sel = 0x1;
489         else
490                 return -EINVAL;
491
492         /* PHY_924 PHY_PAD_FDBK_DRIVE */
493         clrsetbits_le32(&denali_phy[924], 0x7 << 15, mode_sel << 15);
494         /* PHY_926 PHY_PAD_DATA_DRIVE */
495         clrsetbits_le32(&denali_phy[926], 0x7 << 6, mode_sel << 6);
496         /* PHY_927 PHY_PAD_DQS_DRIVE */
497         clrsetbits_le32(&denali_phy[927], 0x7 << 6, mode_sel << 6);
498         /* PHY_928 PHY_PAD_ADDR_DRIVE */
499         clrsetbits_le32(&denali_phy[928], 0x7 << 14, mode_sel << 14);
500         /* PHY_929 PHY_PAD_CLK_DRIVE */
501         clrsetbits_le32(&denali_phy[929], 0x7 << 14, mode_sel << 14);
502         /* PHY_935 PHY_PAD_CKE_DRIVE */
503         clrsetbits_le32(&denali_phy[935], 0x7 << 14, mode_sel << 14);
504         /* PHY_937 PHY_PAD_RST_DRIVE */
505         clrsetbits_le32(&denali_phy[937], 0x7 << 14, mode_sel << 14);
506         /* PHY_939 PHY_PAD_CS_DRIVE */
507         clrsetbits_le32(&denali_phy[939], 0x7 << 14, mode_sel << 14);
508
509         /* speed setting */
510         if (params->base.ddr_freq < 400)
511                 speed = 0x0;
512         else if (params->base.ddr_freq < 800)
513                 speed = 0x1;
514         else if (params->base.ddr_freq < 1200)
515                 speed = 0x2;
516         else
517                 speed = 0x3;
518
519         /* PHY_924 PHY_PAD_FDBK_DRIVE */
520         clrsetbits_le32(&denali_phy[924], 0x3 << 21, speed << 21);
521         /* PHY_926 PHY_PAD_DATA_DRIVE */
522         clrsetbits_le32(&denali_phy[926], 0x3 << 9, speed << 9);
523         /* PHY_927 PHY_PAD_DQS_DRIVE */
524         clrsetbits_le32(&denali_phy[927], 0x3 << 9, speed << 9);
525         /* PHY_928 PHY_PAD_ADDR_DRIVE */
526         clrsetbits_le32(&denali_phy[928], 0x3 << 17, speed << 17);
527         /* PHY_929 PHY_PAD_CLK_DRIVE */
528         clrsetbits_le32(&denali_phy[929], 0x3 << 17, speed << 17);
529         /* PHY_935 PHY_PAD_CKE_DRIVE */
530         clrsetbits_le32(&denali_phy[935], 0x3 << 17, speed << 17);
531         /* PHY_937 PHY_PAD_RST_DRIVE */
532         clrsetbits_le32(&denali_phy[937], 0x3 << 17, speed << 17);
533         /* PHY_939 PHY_PAD_CS_DRIVE */
534         clrsetbits_le32(&denali_phy[939], 0x3 << 17, speed << 17);
535
536         return 0;
537 }
538
539 static int pctl_cfg(struct dram_info *dram, const struct chan_info *chan,
540                     u32 channel, const struct rk3399_sdram_params *params)
541 {
542         u32 *denali_ctl = chan->pctl->denali_ctl;
543         u32 *denali_pi = chan->pi->denali_pi;
544         u32 *denali_phy = chan->publ->denali_phy;
545         const u32 *params_ctl = params->pctl_regs.denali_ctl;
546         const u32 *params_phy = params->phy_regs.denali_phy;
547         u32 tmp, tmp1, tmp2;
548         int ret;
549
550         /*
551          * work around controller bug:
552          * Do not program DRAM_CLASS until NO_PHY_IND_TRAIN_INT is programmed
553          */
554         copy_to_reg(&denali_ctl[1], &params_ctl[1],
555                     sizeof(struct rk3399_ddr_pctl_regs) - 4);
556         writel(params_ctl[0], &denali_ctl[0]);
557
558         copy_to_reg(denali_pi, &params->pi_regs.denali_pi[0],
559                     sizeof(struct rk3399_ddr_pi_regs));
560
561         /* rank count need to set for init */
562         set_memory_map(chan, channel, params);
563
564         writel(params->phy_regs.denali_phy[910], &denali_phy[910]);
565         writel(params->phy_regs.denali_phy[911], &denali_phy[911]);
566         writel(params->phy_regs.denali_phy[912], &denali_phy[912]);
567
568         dram->pwrup_srefresh_exit[channel] = readl(&denali_ctl[68]) &
569                                              PWRUP_SREFRESH_EXIT;
570         clrbits_le32(&denali_ctl[68], PWRUP_SREFRESH_EXIT);
571
572         /* PHY_DLL_RST_EN */
573         clrsetbits_le32(&denali_phy[957], 0x3 << 24, 1 << 24);
574
575         setbits_le32(&denali_pi[0], START);
576         setbits_le32(&denali_ctl[0], START);
577
578         /* Waiting for phy DLL lock */
579         while (1) {
580                 tmp = readl(&denali_phy[920]);
581                 tmp1 = readl(&denali_phy[921]);
582                 tmp2 = readl(&denali_phy[922]);
583                 if ((((tmp >> 16) & 0x1) == 0x1) &&
584                     (((tmp1 >> 16) & 0x1) == 0x1) &&
585                     (((tmp1 >> 0) & 0x1) == 0x1) &&
586                     (((tmp2 >> 0) & 0x1) == 0x1))
587                         break;
588         }
589
590         copy_to_reg(&denali_phy[896], &params_phy[896], (958 - 895) * 4);
591         copy_to_reg(&denali_phy[0], &params_phy[0], (90 - 0 + 1) * 4);
592         copy_to_reg(&denali_phy[128], &params_phy[128], (218 - 128 + 1) * 4);
593         copy_to_reg(&denali_phy[256], &params_phy[256], (346 - 256 + 1) * 4);
594         copy_to_reg(&denali_phy[384], &params_phy[384], (474 - 384 + 1) * 4);
595         copy_to_reg(&denali_phy[512], &params_phy[512], (549 - 512 + 1) * 4);
596         copy_to_reg(&denali_phy[640], &params_phy[640], (677 - 640 + 1) * 4);
597         copy_to_reg(&denali_phy[768], &params_phy[768], (805 - 768 + 1) * 4);
598         set_ds_odt(chan, params);
599
600         /*
601          * phy_dqs_tsel_wr_timing_X 8bits DENALI_PHY_84/212/340/468 offset_8
602          * dqs_tsel_wr_end[7:4] add Half cycle
603          */
604         tmp = (readl(&denali_phy[84]) >> 8) & 0xff;
605         clrsetbits_le32(&denali_phy[84], 0xff << 8, (tmp + 0x10) << 8);
606         tmp = (readl(&denali_phy[212]) >> 8) & 0xff;
607         clrsetbits_le32(&denali_phy[212], 0xff << 8, (tmp + 0x10) << 8);
608         tmp = (readl(&denali_phy[340]) >> 8) & 0xff;
609         clrsetbits_le32(&denali_phy[340], 0xff << 8, (tmp + 0x10) << 8);
610         tmp = (readl(&denali_phy[468]) >> 8) & 0xff;
611         clrsetbits_le32(&denali_phy[468], 0xff << 8, (tmp + 0x10) << 8);
612
613         /*
614          * phy_dqs_tsel_wr_timing_X 8bits DENALI_PHY_83/211/339/467 offset_8
615          * dq_tsel_wr_end[7:4] add Half cycle
616          */
617         tmp = (readl(&denali_phy[83]) >> 16) & 0xff;
618         clrsetbits_le32(&denali_phy[83], 0xff << 16, (tmp + 0x10) << 16);
619         tmp = (readl(&denali_phy[211]) >> 16) & 0xff;
620         clrsetbits_le32(&denali_phy[211], 0xff << 16, (tmp + 0x10) << 16);
621         tmp = (readl(&denali_phy[339]) >> 16) & 0xff;
622         clrsetbits_le32(&denali_phy[339], 0xff << 16, (tmp + 0x10) << 16);
623         tmp = (readl(&denali_phy[467]) >> 16) & 0xff;
624         clrsetbits_le32(&denali_phy[467], 0xff << 16, (tmp + 0x10) << 16);
625
626         ret = phy_io_config(chan, params);
627         if (ret)
628                 return ret;
629
630         return 0;
631 }
632
633 static void select_per_cs_training_index(const struct chan_info *chan,
634                                          u32 rank)
635 {
636         u32 *denali_phy = chan->publ->denali_phy;
637
638         /* PHY_84 PHY_PER_CS_TRAINING_EN_0 1bit offset_16 */
639         if ((readl(&denali_phy[84]) >> 16) & 1) {
640                 /*
641                  * PHY_8/136/264/392
642                  * phy_per_cs_training_index_X 1bit offset_24
643                  */
644                 clrsetbits_le32(&denali_phy[8], 0x1 << 24, rank << 24);
645                 clrsetbits_le32(&denali_phy[136], 0x1 << 24, rank << 24);
646                 clrsetbits_le32(&denali_phy[264], 0x1 << 24, rank << 24);
647                 clrsetbits_le32(&denali_phy[392], 0x1 << 24, rank << 24);
648         }
649 }
650
651 static void override_write_leveling_value(const struct chan_info *chan)
652 {
653         u32 *denali_ctl = chan->pctl->denali_ctl;
654         u32 *denali_phy = chan->publ->denali_phy;
655         u32 byte;
656
657         /* PHY_896 PHY_FREQ_SEL_MULTICAST_EN 1bit offset_0 */
658         setbits_le32(&denali_phy[896], 1);
659
660         /*
661          * PHY_8/136/264/392
662          * phy_per_cs_training_multicast_en_X 1bit offset_16
663          */
664         clrsetbits_le32(&denali_phy[8], 0x1 << 16, 1 << 16);
665         clrsetbits_le32(&denali_phy[136], 0x1 << 16, 1 << 16);
666         clrsetbits_le32(&denali_phy[264], 0x1 << 16, 1 << 16);
667         clrsetbits_le32(&denali_phy[392], 0x1 << 16, 1 << 16);
668
669         for (byte = 0; byte < 4; byte++)
670                 clrsetbits_le32(&denali_phy[63 + (128 * byte)], 0xffff << 16,
671                                 0x200 << 16);
672
673         /* PHY_896 PHY_FREQ_SEL_MULTICAST_EN 1bit offset_0 */
674         clrbits_le32(&denali_phy[896], 1);
675
676         /* CTL_200 ctrlupd_req 1bit offset_8 */
677         clrsetbits_le32(&denali_ctl[200], 0x1 << 8, 0x1 << 8);
678 }
679
680 static int data_training_ca(const struct chan_info *chan, u32 channel,
681                             const struct rk3399_sdram_params *params)
682 {
683         u32 *denali_pi = chan->pi->denali_pi;
684         u32 *denali_phy = chan->publ->denali_phy;
685         u32 i, tmp;
686         u32 obs_0, obs_1, obs_2, obs_err = 0;
687         u32 rank = params->ch[channel].cap_info.rank;
688         u32 rank_mask;
689
690         /* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
691         writel(0x00003f7c, (&denali_pi[175]));
692
693         rank_mask = (rank == 1) ? 0x1 : 0x3;
694
695         for (i = 0; i < 4; i++) {
696                 if (!(rank_mask & (1 << i)))
697                         continue;
698
699                 select_per_cs_training_index(chan, i);
700
701                 /* PI_100 PI_CALVL_EN:RW:8:2 */
702                 clrsetbits_le32(&denali_pi[100], 0x3 << 8, 0x2 << 8);
703
704                 /* PI_92 PI_CALVL_REQ:WR:16:1,PI_CALVL_CS:RW:24:2 */
705                 clrsetbits_le32(&denali_pi[92],
706                                 (0x1 << 16) | (0x3 << 24),
707                                 (0x1 << 16) | (i << 24));
708
709                 /* Waiting for training complete */
710                 while (1) {
711                         /* PI_174 PI_INT_STATUS:RD:8:18 */
712                         tmp = readl(&denali_pi[174]) >> 8;
713                         /*
714                          * check status obs
715                          * PHY_532/660/789 phy_adr_calvl_obs1_:0:32
716                          */
717                         obs_0 = readl(&denali_phy[532]);
718                         obs_1 = readl(&denali_phy[660]);
719                         obs_2 = readl(&denali_phy[788]);
720                         if (((obs_0 >> 30) & 0x3) ||
721                             ((obs_1 >> 30) & 0x3) ||
722                             ((obs_2 >> 30) & 0x3))
723                                 obs_err = 1;
724                         if ((((tmp >> 11) & 0x1) == 0x1) &&
725                             (((tmp >> 13) & 0x1) == 0x1) &&
726                             (((tmp >> 5) & 0x1) == 0x0) &&
727                             obs_err == 0)
728                                 break;
729                         else if ((((tmp >> 5) & 0x1) == 0x1) ||
730                                  (obs_err == 1))
731                                 return -EIO;
732                 }
733
734                 /* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
735                 writel(0x00003f7c, (&denali_pi[175]));
736         }
737
738         clrbits_le32(&denali_pi[100], 0x3 << 8);
739
740         return 0;
741 }
742
743 static int data_training_wl(const struct chan_info *chan, u32 channel,
744                             const struct rk3399_sdram_params *params)
745 {
746         u32 *denali_pi = chan->pi->denali_pi;
747         u32 *denali_phy = chan->publ->denali_phy;
748         u32 i, tmp;
749         u32 obs_0, obs_1, obs_2, obs_3, obs_err = 0;
750         u32 rank = params->ch[channel].cap_info.rank;
751
752         /* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
753         writel(0x00003f7c, (&denali_pi[175]));
754
755         for (i = 0; i < rank; i++) {
756                 select_per_cs_training_index(chan, i);
757
758                 /* PI_60 PI_WRLVL_EN:RW:8:2 */
759                 clrsetbits_le32(&denali_pi[60], 0x3 << 8, 0x2 << 8);
760
761                 /* PI_59 PI_WRLVL_REQ:WR:8:1,PI_WRLVL_CS:RW:16:2 */
762                 clrsetbits_le32(&denali_pi[59],
763                                 (0x1 << 8) | (0x3 << 16),
764                                 (0x1 << 8) | (i << 16));
765
766                 /* Waiting for training complete */
767                 while (1) {
768                         /* PI_174 PI_INT_STATUS:RD:8:18 */
769                         tmp = readl(&denali_pi[174]) >> 8;
770
771                         /*
772                          * check status obs, if error maybe can not
773                          * get leveling done PHY_40/168/296/424
774                          * phy_wrlvl_status_obs_X:0:13
775                          */
776                         obs_0 = readl(&denali_phy[40]);
777                         obs_1 = readl(&denali_phy[168]);
778                         obs_2 = readl(&denali_phy[296]);
779                         obs_3 = readl(&denali_phy[424]);
780                         if (((obs_0 >> 12) & 0x1) ||
781                             ((obs_1 >> 12) & 0x1) ||
782                             ((obs_2 >> 12) & 0x1) ||
783                             ((obs_3 >> 12) & 0x1))
784                                 obs_err = 1;
785                         if ((((tmp >> 10) & 0x1) == 0x1) &&
786                             (((tmp >> 13) & 0x1) == 0x1) &&
787                             (((tmp >> 4) & 0x1) == 0x0) &&
788                             obs_err == 0)
789                                 break;
790                         else if ((((tmp >> 4) & 0x1) == 0x1) ||
791                                  (obs_err == 1))
792                                 return -EIO;
793                 }
794
795                 /* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
796                 writel(0x00003f7c, (&denali_pi[175]));
797         }
798
799         override_write_leveling_value(chan);
800         clrbits_le32(&denali_pi[60], 0x3 << 8);
801
802         return 0;
803 }
804
805 static int data_training_rg(const struct chan_info *chan, u32 channel,
806                             const struct rk3399_sdram_params *params)
807 {
808         u32 *denali_pi = chan->pi->denali_pi;
809         u32 *denali_phy = chan->publ->denali_phy;
810         u32 i, tmp;
811         u32 obs_0, obs_1, obs_2, obs_3, obs_err = 0;
812         u32 rank = params->ch[channel].cap_info.rank;
813
814         /* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
815         writel(0x00003f7c, (&denali_pi[175]));
816
817         for (i = 0; i < rank; i++) {
818                 select_per_cs_training_index(chan, i);
819
820                 /* PI_80 PI_RDLVL_GATE_EN:RW:24:2 */
821                 clrsetbits_le32(&denali_pi[80], 0x3 << 24, 0x2 << 24);
822
823                 /*
824                  * PI_74 PI_RDLVL_GATE_REQ:WR:16:1
825                  * PI_RDLVL_CS:RW:24:2
826                  */
827                 clrsetbits_le32(&denali_pi[74],
828                                 (0x1 << 16) | (0x3 << 24),
829                                 (0x1 << 16) | (i << 24));
830
831                 /* Waiting for training complete */
832                 while (1) {
833                         /* PI_174 PI_INT_STATUS:RD:8:18 */
834                         tmp = readl(&denali_pi[174]) >> 8;
835
836                         /*
837                          * check status obs
838                          * PHY_43/171/299/427
839                          *     PHY_GTLVL_STATUS_OBS_x:16:8
840                          */
841                         obs_0 = readl(&denali_phy[43]);
842                         obs_1 = readl(&denali_phy[171]);
843                         obs_2 = readl(&denali_phy[299]);
844                         obs_3 = readl(&denali_phy[427]);
845                         if (((obs_0 >> (16 + 6)) & 0x3) ||
846                             ((obs_1 >> (16 + 6)) & 0x3) ||
847                             ((obs_2 >> (16 + 6)) & 0x3) ||
848                             ((obs_3 >> (16 + 6)) & 0x3))
849                                 obs_err = 1;
850                         if ((((tmp >> 9) & 0x1) == 0x1) &&
851                             (((tmp >> 13) & 0x1) == 0x1) &&
852                             (((tmp >> 3) & 0x1) == 0x0) &&
853                             obs_err == 0)
854                                 break;
855                         else if ((((tmp >> 3) & 0x1) == 0x1) ||
856                                  (obs_err == 1))
857                                 return -EIO;
858                 }
859
860                 /* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
861                 writel(0x00003f7c, (&denali_pi[175]));
862         }
863
864         clrbits_le32(&denali_pi[80], 0x3 << 24);
865
866         return 0;
867 }
868
869 static int data_training_rl(const struct chan_info *chan, u32 channel,
870                             const struct rk3399_sdram_params *params)
871 {
872         u32 *denali_pi = chan->pi->denali_pi;
873         u32 i, tmp;
874         u32 rank = params->ch[channel].cap_info.rank;
875
876         /* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
877         writel(0x00003f7c, (&denali_pi[175]));
878
879         for (i = 0; i < rank; i++) {
880                 select_per_cs_training_index(chan, i);
881
882                 /* PI_80 PI_RDLVL_EN:RW:16:2 */
883                 clrsetbits_le32(&denali_pi[80], 0x3 << 16, 0x2 << 16);
884
885                 /* PI_74 PI_RDLVL_REQ:WR:8:1,PI_RDLVL_CS:RW:24:2 */
886                 clrsetbits_le32(&denali_pi[74],
887                                 (0x1 << 8) | (0x3 << 24),
888                                 (0x1 << 8) | (i << 24));
889
890                 /* Waiting for training complete */
891                 while (1) {
892                         /* PI_174 PI_INT_STATUS:RD:8:18 */
893                         tmp = readl(&denali_pi[174]) >> 8;
894
895                         /*
896                          * make sure status obs not report error bit
897                          * PHY_46/174/302/430
898                          *     phy_rdlvl_status_obs_X:16:8
899                          */
900                         if ((((tmp >> 8) & 0x1) == 0x1) &&
901                             (((tmp >> 13) & 0x1) == 0x1) &&
902                             (((tmp >> 2) & 0x1) == 0x0))
903                                 break;
904                         else if (((tmp >> 2) & 0x1) == 0x1)
905                                 return -EIO;
906                 }
907
908                 /* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
909                 writel(0x00003f7c, (&denali_pi[175]));
910         }
911
912         clrbits_le32(&denali_pi[80], 0x3 << 16);
913
914         return 0;
915 }
916
917 static int data_training_wdql(const struct chan_info *chan, u32 channel,
918                               const struct rk3399_sdram_params *params)
919 {
920         u32 *denali_pi = chan->pi->denali_pi;
921         u32 i, tmp;
922         u32 rank = params->ch[channel].cap_info.rank;
923         u32 rank_mask;
924
925         /* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
926         writel(0x00003f7c, (&denali_pi[175]));
927
928         rank_mask = (rank == 1) ? 0x1 : 0x3;
929
930         for (i = 0; i < 4; i++) {
931                 if (!(rank_mask & (1 << i)))
932                         continue;
933
934                 select_per_cs_training_index(chan, i);
935
936                 /*
937                  * disable PI_WDQLVL_VREF_EN before wdq leveling?
938                  * PI_181 PI_WDQLVL_VREF_EN:RW:8:1
939                  */
940                 clrbits_le32(&denali_pi[181], 0x1 << 8);
941
942                 /* PI_124 PI_WDQLVL_EN:RW:16:2 */
943                 clrsetbits_le32(&denali_pi[124], 0x3 << 16, 0x2 << 16);
944
945                 /* PI_121 PI_WDQLVL_REQ:WR:8:1,PI_WDQLVL_CS:RW:16:2 */
946                 clrsetbits_le32(&denali_pi[121],
947                                 (0x1 << 8) | (0x3 << 16),
948                                 (0x1 << 8) | (i << 16));
949
950                 /* Waiting for training complete */
951                 while (1) {
952                         /* PI_174 PI_INT_STATUS:RD:8:18 */
953                         tmp = readl(&denali_pi[174]) >> 8;
954                         if ((((tmp >> 12) & 0x1) == 0x1) &&
955                             (((tmp >> 13) & 0x1) == 0x1) &&
956                             (((tmp >> 6) & 0x1) == 0x0))
957                                 break;
958                         else if (((tmp >> 6) & 0x1) == 0x1)
959                                 return -EIO;
960                 }
961
962                 /* clear interrupt,PI_175 PI_INT_ACK:WR:0:17 */
963                 writel(0x00003f7c, (&denali_pi[175]));
964         }
965
966         clrbits_le32(&denali_pi[124], 0x3 << 16);
967
968         return 0;
969 }
970
971 static int data_training(const struct chan_info *chan, u32 channel,
972                          const struct rk3399_sdram_params *params,
973                          u32 training_flag)
974 {
975         u32 *denali_phy = chan->publ->denali_phy;
976         int ret;
977
978         /* PHY_927 PHY_PAD_DQS_DRIVE  RPULL offset_22 */
979         setbits_le32(&denali_phy[927], (1 << 22));
980
981         if (training_flag == PI_FULL_TRAINING) {
982                 if (params->base.dramtype == LPDDR4) {
983                         training_flag = PI_CA_TRAINING | PI_WRITE_LEVELING |
984                                         PI_READ_GATE_TRAINING |
985                                         PI_READ_LEVELING | PI_WDQ_LEVELING;
986                 } else if (params->base.dramtype == LPDDR3) {
987                         training_flag = PI_CA_TRAINING | PI_WRITE_LEVELING |
988                                         PI_READ_GATE_TRAINING;
989                 } else if (params->base.dramtype == DDR3) {
990                         training_flag = PI_WRITE_LEVELING |
991                                         PI_READ_GATE_TRAINING |
992                                         PI_READ_LEVELING;
993                 }
994         }
995
996         /* ca training(LPDDR4,LPDDR3 support) */
997         if ((training_flag & PI_CA_TRAINING) == PI_CA_TRAINING) {
998                 ret = data_training_ca(chan, channel, params);
999                 if (ret < 0) {
1000                         debug("%s: data training ca failed\n", __func__);
1001                         return ret;
1002                 }
1003         }
1004
1005         /* write leveling(LPDDR4,LPDDR3,DDR3 support) */
1006         if ((training_flag & PI_WRITE_LEVELING) == PI_WRITE_LEVELING) {
1007                 ret = data_training_wl(chan, channel, params);
1008                 if (ret < 0) {
1009                         debug("%s: data training wl failed\n", __func__);
1010                         return ret;
1011                 }
1012         }
1013
1014         /* read gate training(LPDDR4,LPDDR3,DDR3 support) */
1015         if ((training_flag & PI_READ_GATE_TRAINING) == PI_READ_GATE_TRAINING) {
1016                 ret = data_training_rg(chan, channel, params);
1017                 if (ret < 0) {
1018                         debug("%s: data training rg failed\n", __func__);
1019                         return ret;
1020                 }
1021         }
1022
1023         /* read leveling(LPDDR4,LPDDR3,DDR3 support) */
1024         if ((training_flag & PI_READ_LEVELING) == PI_READ_LEVELING) {
1025                 ret = data_training_rl(chan, channel, params);
1026                 if (ret < 0) {
1027                         debug("%s: data training rl failed\n", __func__);
1028                         return ret;
1029                 }
1030         }
1031
1032         /* wdq leveling(LPDDR4 support) */
1033         if ((training_flag & PI_WDQ_LEVELING) == PI_WDQ_LEVELING) {
1034                 ret = data_training_wdql(chan, channel, params);
1035                 if (ret < 0) {
1036                         debug("%s: data training wdql failed\n", __func__);
1037                         return ret;
1038                 }
1039         }
1040
1041         /* PHY_927 PHY_PAD_DQS_DRIVE  RPULL offset_22 */
1042         clrbits_le32(&denali_phy[927], (1 << 22));
1043
1044         return 0;
1045 }
1046
1047 static void set_ddrconfig(const struct chan_info *chan,
1048                           const struct rk3399_sdram_params *params,
1049                           unsigned char channel, u32 ddrconfig)
1050 {
1051         /* only need to set ddrconfig */
1052         struct rk3399_msch_regs *ddr_msch_regs = chan->msch;
1053         unsigned int cs0_cap = 0;
1054         unsigned int cs1_cap = 0;
1055
1056         cs0_cap = (1 << (params->ch[channel].cap_info.cs0_row
1057                         + params->ch[channel].cap_info.col
1058                         + params->ch[channel].cap_info.bk
1059                         + params->ch[channel].cap_info.bw - 20));
1060         if (params->ch[channel].cap_info.rank > 1)
1061                 cs1_cap = cs0_cap >> (params->ch[channel].cap_info.cs0_row
1062                                 - params->ch[channel].cap_info.cs1_row);
1063         if (params->ch[channel].cap_info.row_3_4) {
1064                 cs0_cap = cs0_cap * 3 / 4;
1065                 cs1_cap = cs1_cap * 3 / 4;
1066         }
1067
1068         writel(ddrconfig | (ddrconfig << 8), &ddr_msch_regs->ddrconf);
1069         writel(((cs0_cap / 32) & 0xff) | (((cs1_cap / 32) & 0xff) << 8),
1070                &ddr_msch_regs->ddrsize);
1071 }
1072
1073 static void dram_all_config(struct dram_info *dram,
1074                             const struct rk3399_sdram_params *params)
1075 {
1076         u32 sys_reg = 0;
1077         unsigned int channel, idx;
1078
1079         sys_reg |= params->base.dramtype << SYS_REG_DDRTYPE_SHIFT;
1080         sys_reg |= (params->base.num_channels - 1) << SYS_REG_NUM_CH_SHIFT;
1081
1082         for (channel = 0, idx = 0;
1083              (idx < params->base.num_channels) && (channel < 2);
1084              channel++) {
1085                 const struct rk3399_sdram_channel *info = &params->ch[channel];
1086                 struct rk3399_msch_regs *ddr_msch_regs;
1087                 const struct rk3399_msch_timings *noc_timing;
1088
1089                 if (params->ch[channel].cap_info.col == 0)
1090                         continue;
1091                 idx++;
1092                 sys_reg |= info->cap_info.row_3_4 <<
1093                            SYS_REG_ROW_3_4_SHIFT(channel);
1094                 sys_reg |= 1 << SYS_REG_CHINFO_SHIFT(channel);
1095                 sys_reg |= (info->cap_info.rank - 1) <<
1096                            SYS_REG_RANK_SHIFT(channel);
1097                 sys_reg |= (info->cap_info.col - 9) <<
1098                            SYS_REG_COL_SHIFT(channel);
1099                 sys_reg |= info->cap_info.bk == 3 ? 0 : 1 <<
1100                            SYS_REG_BK_SHIFT(channel);
1101                 sys_reg |= (info->cap_info.cs0_row - 13) <<
1102                             SYS_REG_CS0_ROW_SHIFT(channel);
1103                 sys_reg |= (info->cap_info.cs1_row - 13) <<
1104                             SYS_REG_CS1_ROW_SHIFT(channel);
1105                 sys_reg |= (2 >> info->cap_info.bw) <<
1106                            SYS_REG_BW_SHIFT(channel);
1107                 sys_reg |= (2 >> info->cap_info.dbw) <<
1108                            SYS_REG_DBW_SHIFT(channel);
1109
1110                 ddr_msch_regs = dram->chan[channel].msch;
1111                 noc_timing = &params->ch[channel].noc_timings;
1112                 writel(noc_timing->ddrtiminga0,
1113                        &ddr_msch_regs->ddrtiminga0);
1114                 writel(noc_timing->ddrtimingb0,
1115                        &ddr_msch_regs->ddrtimingb0);
1116                 writel(noc_timing->ddrtimingc0,
1117                        &ddr_msch_regs->ddrtimingc0);
1118                 writel(noc_timing->devtodev0,
1119                        &ddr_msch_regs->devtodev0);
1120                 writel(noc_timing->ddrmode,
1121                        &ddr_msch_regs->ddrmode);
1122
1123                 /* rank 1 memory clock disable (dfi_dram_clk_disable = 1) */
1124                 if (params->ch[channel].cap_info.rank == 1)
1125                         setbits_le32(&dram->chan[channel].pctl->denali_ctl[276],
1126                                      1 << 17);
1127         }
1128
1129         writel(sys_reg, &dram->pmugrf->os_reg2);
1130         rk_clrsetreg(&dram->pmusgrf->soc_con4, 0x1f << 10,
1131                      params->base.stride << 10);
1132
1133         /* reboot hold register set */
1134         writel(PRESET_SGRF_HOLD(0) | PRESET_GPIO0_HOLD(1) |
1135                 PRESET_GPIO1_HOLD(1),
1136                 &dram->pmucru->pmucru_rstnhold_con[1]);
1137         clrsetbits_le32(&dram->cru->glb_rst_con, 0x3, 0x3);
1138 }
1139
1140 static int switch_to_phy_index1(struct dram_info *dram,
1141                                 const struct rk3399_sdram_params *params)
1142 {
1143         u32 channel;
1144         u32 *denali_phy;
1145         u32 ch_count = params->base.num_channels;
1146         int ret;
1147         int i = 0;
1148
1149         writel(RK_CLRSETBITS(0x03 << 4 | 1 << 2 | 1,
1150                              1 << 4 | 1 << 2 | 1),
1151                         &dram->cic->cic_ctrl0);
1152         while (!(readl(&dram->cic->cic_status0) & (1 << 2))) {
1153                 mdelay(10);
1154                 i++;
1155                 if (i > 10) {
1156                         debug("index1 frequency change overtime\n");
1157                         return -ETIME;
1158                 }
1159         }
1160
1161         i = 0;
1162         writel(RK_CLRSETBITS(1 << 1, 1 << 1), &dram->cic->cic_ctrl0);
1163         while (!(readl(&dram->cic->cic_status0) & (1 << 0))) {
1164                 mdelay(10);
1165                 i++;
1166                 if (i > 10) {
1167                         debug("index1 frequency done overtime\n");
1168                         return -ETIME;
1169                 }
1170         }
1171
1172         for (channel = 0; channel < ch_count; channel++) {
1173                 denali_phy = dram->chan[channel].publ->denali_phy;
1174                 clrsetbits_le32(&denali_phy[896], (0x3 << 8) | 1, 1 << 8);
1175                 ret = data_training(&dram->chan[channel], channel,
1176                                     params, PI_FULL_TRAINING);
1177                 if (ret < 0) {
1178                         debug("index1 training failed\n");
1179                         return ret;
1180                 }
1181         }
1182
1183         return 0;
1184 }
1185
1186 static int sdram_init(struct dram_info *dram,
1187                       const struct rk3399_sdram_params *params)
1188 {
1189         unsigned char dramtype = params->base.dramtype;
1190         unsigned int ddr_freq = params->base.ddr_freq;
1191         struct rk3399_cru *cru = dram->cru;
1192         int channel;
1193         int ret;
1194
1195         debug("Starting SDRAM initialization...\n");
1196
1197         if ((dramtype == DDR3 && ddr_freq > 933) ||
1198             (dramtype == LPDDR3 && ddr_freq > 933) ||
1199             (dramtype == LPDDR4 && ddr_freq > 800)) {
1200                 debug("SDRAM frequency is to high!");
1201                 return -E2BIG;
1202         }
1203
1204         for (channel = 0; channel < 2; channel++) {
1205                 const struct chan_info *chan = &dram->chan[channel];
1206                 struct rk3399_ddr_publ_regs *publ = chan->publ;
1207
1208                 phy_pctrl_reset(cru, channel);
1209                 phy_dll_bypass_set(publ, ddr_freq);
1210
1211                 if (channel >= params->base.num_channels)
1212                         continue;
1213
1214                 ret = pctl_cfg(dram, chan, channel, params);
1215                 if (ret < 0) {
1216                         printf("%s: pctl config failed\n", __func__);
1217                         return ret;
1218                 }
1219
1220                 /* start to trigger initialization */
1221                 pctl_start(dram, channel);
1222
1223                 /* LPDDR2/LPDDR3 need to wait DAI complete, max 10us */
1224                 if (dramtype == LPDDR3)
1225                         udelay(10);
1226
1227                 if (data_training(chan, channel, params, PI_FULL_TRAINING)) {
1228                         printf("%s: data training failed\n", __func__);
1229                         return -EIO;
1230                 }
1231
1232                 set_ddrconfig(chan, params, channel,
1233                               params->ch[channel].cap_info.ddrconfig);
1234         }
1235         dram_all_config(dram, params);
1236         switch_to_phy_index1(dram, params);
1237
1238         debug("Finish SDRAM initialization...\n");
1239         return 0;
1240 }
1241
1242 static int rk3399_dmc_ofdata_to_platdata(struct udevice *dev)
1243 {
1244 #if !CONFIG_IS_ENABLED(OF_PLATDATA)
1245         struct rockchip_dmc_plat *plat = dev_get_platdata(dev);
1246         int ret;
1247
1248         ret = dev_read_u32_array(dev, "rockchip,sdram-params",
1249                                  (u32 *)&plat->sdram_params,
1250                                  sizeof(plat->sdram_params) / sizeof(u32));
1251         if (ret) {
1252                 printf("%s: Cannot read rockchip,sdram-params %d\n",
1253                        __func__, ret);
1254                 return ret;
1255         }
1256         ret = regmap_init_mem(dev_ofnode(dev), &plat->map);
1257         if (ret)
1258                 printf("%s: regmap failed %d\n", __func__, ret);
1259
1260 #endif
1261         return 0;
1262 }
1263
1264 #if CONFIG_IS_ENABLED(OF_PLATDATA)
1265 static int conv_of_platdata(struct udevice *dev)
1266 {
1267         struct rockchip_dmc_plat *plat = dev_get_platdata(dev);
1268         struct dtd_rockchip_rk3399_dmc *dtplat = &plat->dtplat;
1269         int ret;
1270
1271         ret = regmap_init_mem_platdata(dev, dtplat->reg,
1272                                        ARRAY_SIZE(dtplat->reg) / 2,
1273                                        &plat->map);
1274         if (ret)
1275                 return ret;
1276
1277         return 0;
1278 }
1279 #endif
1280
1281 static int rk3399_dmc_init(struct udevice *dev)
1282 {
1283         struct dram_info *priv = dev_get_priv(dev);
1284         struct rockchip_dmc_plat *plat = dev_get_platdata(dev);
1285         int ret;
1286 #if !CONFIG_IS_ENABLED(OF_PLATDATA)
1287         struct rk3399_sdram_params *params = &plat->sdram_params;
1288 #else
1289         struct dtd_rockchip_rk3399_dmc *dtplat = &plat->dtplat;
1290         struct rk3399_sdram_params *params =
1291                                         (void *)dtplat->rockchip_sdram_params;
1292
1293         ret = conv_of_platdata(dev);
1294         if (ret)
1295                 return ret;
1296 #endif
1297
1298         priv->cic = syscon_get_first_range(ROCKCHIP_SYSCON_CIC);
1299         priv->grf = syscon_get_first_range(ROCKCHIP_SYSCON_GRF);
1300         priv->pmugrf = syscon_get_first_range(ROCKCHIP_SYSCON_PMUGRF);
1301         priv->pmusgrf = syscon_get_first_range(ROCKCHIP_SYSCON_PMUSGRF);
1302         priv->pmucru = rockchip_get_pmucru();
1303         priv->cru = rockchip_get_cru();
1304         priv->chan[0].pctl = regmap_get_range(plat->map, 0);
1305         priv->chan[0].pi = regmap_get_range(plat->map, 1);
1306         priv->chan[0].publ = regmap_get_range(plat->map, 2);
1307         priv->chan[0].msch = regmap_get_range(plat->map, 3);
1308         priv->chan[1].pctl = regmap_get_range(plat->map, 4);
1309         priv->chan[1].pi = regmap_get_range(plat->map, 5);
1310         priv->chan[1].publ = regmap_get_range(plat->map, 6);
1311         priv->chan[1].msch = regmap_get_range(plat->map, 7);
1312
1313         debug("con reg %p %p %p %p %p %p %p %p\n",
1314               priv->chan[0].pctl, priv->chan[0].pi,
1315               priv->chan[0].publ, priv->chan[0].msch,
1316               priv->chan[1].pctl, priv->chan[1].pi,
1317               priv->chan[1].publ, priv->chan[1].msch);
1318         debug("cru %p, cic %p, grf %p, sgrf %p, pmucru %p\n", priv->cru,
1319               priv->cic, priv->pmugrf, priv->pmusgrf, priv->pmucru);
1320
1321 #if CONFIG_IS_ENABLED(OF_PLATDATA)
1322         ret = clk_get_by_index_platdata(dev, 0, dtplat->clocks, &priv->ddr_clk);
1323 #else
1324         ret = clk_get_by_index(dev, 0, &priv->ddr_clk);
1325 #endif
1326         if (ret) {
1327                 printf("%s clk get failed %d\n", __func__, ret);
1328                 return ret;
1329         }
1330
1331         ret = clk_set_rate(&priv->ddr_clk, params->base.ddr_freq * MHz);
1332         if (ret < 0) {
1333                 printf("%s clk set failed %d\n", __func__, ret);
1334                 return ret;
1335         }
1336
1337         ret = sdram_init(priv, params);
1338         if (ret < 0) {
1339                 printf("%s DRAM init failed %d\n", __func__, ret);
1340                 return ret;
1341         }
1342
1343         return 0;
1344 }
1345 #endif
1346
1347 static int rk3399_dmc_probe(struct udevice *dev)
1348 {
1349 #if defined(CONFIG_TPL_BUILD) || \
1350         (!defined(CONFIG_TPL) && defined(CONFIG_SPL_BUILD))
1351         if (rk3399_dmc_init(dev))
1352                 return 0;
1353 #else
1354         struct dram_info *priv = dev_get_priv(dev);
1355
1356         priv->pmugrf = syscon_get_first_range(ROCKCHIP_SYSCON_PMUGRF);
1357         debug("%s: pmugrf = %p\n", __func__, priv->pmugrf);
1358         priv->info.base = CONFIG_SYS_SDRAM_BASE;
1359         priv->info.size =
1360                 rockchip_sdram_size((phys_addr_t)&priv->pmugrf->os_reg2);
1361 #endif
1362         return 0;
1363 }
1364
1365 static int rk3399_dmc_get_info(struct udevice *dev, struct ram_info *info)
1366 {
1367         struct dram_info *priv = dev_get_priv(dev);
1368
1369         *info = priv->info;
1370
1371         return 0;
1372 }
1373
/* RAM uclass operations; only get_info is provided by this driver. */
static struct ram_ops rk3399_dmc_ops = {
        .get_info = rk3399_dmc_get_info,
};
1377
/* Device-tree compatible strings this driver binds to; empty entry ends it. */
static const struct udevice_id rk3399_dmc_ids[] = {
        { .compatible = "rockchip,rk3399-dmc" },
        { }
};
1382
/*
 * Driver declaration for the RK3399 DMC (UCLASS_RAM).
 *
 * The ofdata_to_platdata hook and the platform-data allocation are only
 * compiled in for TPL, or for SPL when no TPL is configured - the same
 * condition under which rk3399_dmc_probe() runs the full DRAM init.
 */
U_BOOT_DRIVER(dmc_rk3399) = {
        .name = "rockchip_rk3399_dmc",
        .id = UCLASS_RAM,
        .of_match = rk3399_dmc_ids,
        .ops = &rk3399_dmc_ops,
#if defined(CONFIG_TPL_BUILD) || \
        (!defined(CONFIG_TPL) && defined(CONFIG_SPL_BUILD))
        .ofdata_to_platdata = rk3399_dmc_ofdata_to_platdata,
#endif
        .probe = rk3399_dmc_probe,
        .priv_auto_alloc_size = sizeof(struct dram_info),
#if defined(CONFIG_TPL_BUILD) || \
        (!defined(CONFIG_TPL) && defined(CONFIG_SPL_BUILD))
        .platdata_auto_alloc_size = sizeof(struct rockchip_dmc_plat),
#endif
};