/*
 * Copyright 2010 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: Alex Deucher
 */
#include <linux/firmware.h>
#include <linux/slab.h>
#include <drm/drmP.h>
#include "radeon.h"
#include "radeon_asic.h"
#include "radeon_audio.h"
#include <drm/radeon_drm.h>
#include "evergreend.h"
#include "atom.h"
#include "avivod.h"
#include "evergreen_reg.h"
#include "evergreen_blit_shaders.h"
#include "radeon_ucode.h"

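/*
 * The per-pin HPD register blocks are laid out back to back, 0xc bytes
 * apart, so a pin's control/status registers can be reached by indexing
 * off the DC_HPD1 block.
 */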
#define DC_HPDx_CONTROL(x) (DC_HPD1_CONTROL + (x * 0xc))
#define DC_HPDx_INT_CONTROL(x) (DC_HPD1_INT_CONTROL + (x * 0xc))
#define DC_HPDx_INT_STATUS_REG(x) (DC_HPD1_INT_STATUS + (x * 0xc))

/*
 * Indirect registers accessor
 */
u32 eg_cg_rreg(struct radeon_device *rdev, u32 reg)
{
	unsigned long flags;
	u32 r;

	spin_lock_irqsave(&rdev->cg_idx_lock, flags);
	WREG32(EVERGREEN_CG_IND_ADDR, ((reg) & 0xffff));
	r = RREG32(EVERGREEN_CG_IND_DATA);
	spin_unlock_irqrestore(&rdev->cg_idx_lock, flags);
	return r;
}

void eg_cg_wreg(struct radeon_device *rdev, u32 reg, u32 v)
{
	unsigned long flags;

	spin_lock_irqsave(&rdev->cg_idx_lock, flags);
	WREG32(EVERGREEN_CG_IND_ADDR, ((reg) & 0xffff));
	WREG32(EVERGREEN_CG_IND_DATA, (v));
	spin_unlock_irqrestore(&rdev->cg_idx_lock, flags);
}

u32 eg_pif_phy0_rreg(struct radeon_device *rdev, u32 reg)
{
	unsigned long flags;
	u32 r;

	spin_lock_irqsave(&rdev->pif_idx_lock, flags);
	WREG32(EVERGREEN_PIF_PHY0_INDEX, ((reg) & 0xffff));
	r = RREG32(EVERGREEN_PIF_PHY0_DATA);
	spin_unlock_irqrestore(&rdev->pif_idx_lock, flags);
	return r;
}

void eg_pif_phy0_wreg(struct radeon_device *rdev, u32 reg, u32 v)
{
	unsigned long flags;

	spin_lock_irqsave(&rdev->pif_idx_lock, flags);
	WREG32(EVERGREEN_PIF_PHY0_INDEX, ((reg) & 0xffff));
	WREG32(EVERGREEN_PIF_PHY0_DATA, (v));
	spin_unlock_irqrestore(&rdev->pif_idx_lock, flags);
}

u32 eg_pif_phy1_rreg(struct radeon_device *rdev, u32 reg)
{
	unsigned long flags;
	u32 r;

	spin_lock_irqsave(&rdev->pif_idx_lock, flags);
	WREG32(EVERGREEN_PIF_PHY1_INDEX, ((reg) & 0xffff));
	r = RREG32(EVERGREEN_PIF_PHY1_DATA);
	spin_unlock_irqrestore(&rdev->pif_idx_lock, flags);
	return r;
}

void eg_pif_phy1_wreg(struct radeon_device *rdev, u32 reg, u32 v)
{
	unsigned long flags;

	spin_lock_irqsave(&rdev->pif_idx_lock, flags);
	WREG32(EVERGREEN_PIF_PHY1_INDEX, ((reg) & 0xffff));
	WREG32(EVERGREEN_PIF_PHY1_DATA, (v));
	spin_unlock_irqrestore(&rdev->pif_idx_lock, flags);
}

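/*
 * MMIO offsets of the six display controller register blocks; add one of
 * these to a CRTC register address to select the CRTC instance.
 */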
static const u32 crtc_offsets[6] =
{
	EVERGREEN_CRTC0_REGISTER_OFFSET,
	EVERGREEN_CRTC1_REGISTER_OFFSET,
	EVERGREEN_CRTC2_REGISTER_OFFSET,
	EVERGREEN_CRTC3_REGISTER_OFFSET,
	EVERGREEN_CRTC4_REGISTER_OFFSET,
	EVERGREEN_CRTC5_REGISTER_OFFSET
};

#include "clearstate_evergreen.h"

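/* register offsets whose contents the RLC saves and restores */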
static const u32 sumo_rlc_save_restore_register_list[] =
{
	0x98fc,
	0x9830,
	0x9834,
	0x9838,
	0x9870,
	0x9874,
	0x8a14,
	0x8b24,
	0x8bcc,
	0x8b10,
	0x8d00,
	0x8d04,
	0x8c00,
	0x8c04,
	0x8c08,
	0x8c0c,
	0x8d8c,
	0x8c20,
	0x8c24,
	0x8c28,
	0x8c18,
	0x8c1c,
	0x8cf0,
	0x8e2c,
	0x8e38,
	0x8c30,
	0x9508,
	0x9688,
	0x9608,
	0x960c,
	0x9610,
	0x9614,
	0x88c4,
	0x88d4,
	0xa008,
	0x900c,
	0x9100,
	0x913c,
	0x98f8,
	0x98f4,
	0x9b7c,
	0x3f8c,
	0x8950,
	0x8954,
	0x8a18,
	0x8b28,
	0x9144,
	0x9148,
	0x914c,
	0x3f90,
	0x3f94,
	0x915c,
	0x9160,
	0x9178,
	0x917c,
	0x9180,
	0x918c,
	0x9190,
	0x9194,
	0x9198,
	0x919c,
	0x91a8,
	0x91ac,
	0x91b0,
	0x91b4,
	0x91b8,
	0x91c4,
	0x91c8,
	0x91cc,
	0x91d0,
	0x91d4,
	0x91e0,
	0x91e4,
	0x91ec,
	0x91f0,
	0x91f4,
	0x9200,
	0x9204,
	0x929c,
	0x9150,
	0x802c,
};

static void evergreen_gpu_init(struct radeon_device *rdev);
void evergreen_fini(struct radeon_device *rdev);
void evergreen_pcie_gen2_enable(struct radeon_device *rdev);
void evergreen_program_aspm(struct radeon_device *rdev);
extern void cayman_cp_int_cntl_setup(struct radeon_device *rdev,
				     int ring, u32 cp_int_cntl);
extern void cayman_vm_decode_fault(struct radeon_device *rdev,
				   u32 status, u32 addr);
void cik_init_cp_pg_table(struct radeon_device *rdev);

extern u32 si_get_csb_size(struct radeon_device *rdev);
extern void si_get_csb_buffer(struct radeon_device *rdev, volatile u32 *buffer);
extern u32 cik_get_csb_size(struct radeon_device *rdev);
extern void cik_get_csb_buffer(struct radeon_device *rdev, volatile u32 *buffer);
extern void rv770_set_clk_bypass_mode(struct radeon_device *rdev);

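/*
 * "Golden" register tables are {offset, and_mask, or_mask} triples
 * consumed by radeon_program_register_sequence(): the masked bits of
 * each register are cleared and the or_mask value is OR'ed in (an
 * all-ones mask writes the value outright).
 */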
static const u32 evergreen_golden_registers[] =
{
	0x3f90, 0xffff0000, 0xff000000,
	0x9148, 0xffff0000, 0xff000000,
	0x3f94, 0xffff0000, 0xff000000,
	0x914c, 0xffff0000, 0xff000000,
	0x9b7c, 0xffffffff, 0x00000000,
	0x8a14, 0xffffffff, 0x00000007,
	0x8b10, 0xffffffff, 0x00000000,
	0x960c, 0xffffffff, 0x54763210,
	0x88c4, 0xffffffff, 0x000000c2,
	0x88d4, 0xffffffff, 0x00000010,
	0x8974, 0xffffffff, 0x00000000,
	0xc78, 0x00000080, 0x00000080,
	0x5eb4, 0xffffffff, 0x00000002,
	0x5e78, 0xffffffff, 0x001000f0,
	0x6104, 0x01000300, 0x00000000,
	0x5bc0, 0x00300000, 0x00000000,
	0x7030, 0xffffffff, 0x00000011,
	0x7c30, 0xffffffff, 0x00000011,
	0x10830, 0xffffffff, 0x00000011,
	0x11430, 0xffffffff, 0x00000011,
	0x12030, 0xffffffff, 0x00000011,
	0x12c30, 0xffffffff, 0x00000011,
	0xd02c, 0xffffffff, 0x08421000,
	0x240c, 0xffffffff, 0x00000380,
	0x8b24, 0xffffffff, 0x00ff0fff,
	0x28a4c, 0x06000000, 0x06000000,
	0x10c, 0x00000001, 0x00000001,
	0x8d00, 0xffffffff, 0x100e4848,
	0x8d04, 0xffffffff, 0x00164745,
	0x8c00, 0xffffffff, 0xe4000003,
	0x8c04, 0xffffffff, 0x40600060,
	0x8c08, 0xffffffff, 0x001c001c,
	0x8cf0, 0xffffffff, 0x08e00620,
	0x8c20, 0xffffffff, 0x00800080,
	0x8c24, 0xffffffff, 0x00800080,
	0x8c18, 0xffffffff, 0x20202078,
	0x8c1c, 0xffffffff, 0x00001010,
	0x28350, 0xffffffff, 0x00000000,
	0xa008, 0xffffffff, 0x00010000,
	0x5c4, 0xffffffff, 0x00000001,
	0x9508, 0xffffffff, 0x00000002,
	0x913c, 0x0000000f, 0x0000000a
};

static const u32 evergreen_golden_registers2[] =
{
	0x2f4c, 0xffffffff, 0x00000000,
	0x54f4, 0xffffffff, 0x00000000,
	0x54f0, 0xffffffff, 0x00000000,
	0x5498, 0xffffffff, 0x00000000,
	0x549c, 0xffffffff, 0x00000000,
	0x5494, 0xffffffff, 0x00000000,
	0x53cc, 0xffffffff, 0x00000000,
	0x53c8, 0xffffffff, 0x00000000,
	0x53c4, 0xffffffff, 0x00000000,
	0x53c0, 0xffffffff, 0x00000000,
	0x53bc, 0xffffffff, 0x00000000,
	0x53b8, 0xffffffff, 0x00000000,
	0x53b4, 0xffffffff, 0x00000000,
	0x53b0, 0xffffffff, 0x00000000
};

static const u32 cypress_mgcg_init[] =
{
	0x802c, 0xffffffff, 0xc0000000,
	0x5448, 0xffffffff, 0x00000100,
	0x55e4, 0xffffffff, 0x00000100,
	0x160c, 0xffffffff, 0x00000100,
	0x5644, 0xffffffff, 0x00000100,
	0xc164, 0xffffffff, 0x00000100,
	0x8a18, 0xffffffff, 0x00000100,
	0x897c, 0xffffffff, 0x06000100,
	0x8b28, 0xffffffff, 0x00000100,
	0x9144, 0xffffffff, 0x00000100,
	0x9a60, 0xffffffff, 0x00000100,
	0x9868, 0xffffffff, 0x00000100,
	0x8d58, 0xffffffff, 0x00000100,
	0x9510, 0xffffffff, 0x00000100,
	0x949c, 0xffffffff, 0x00000100,
	0x9654, 0xffffffff, 0x00000100,
	0x9030, 0xffffffff, 0x00000100,
	0x9034, 0xffffffff, 0x00000100,
	0x9038, 0xffffffff, 0x00000100,
	0x903c, 0xffffffff, 0x00000100,
	0x9040, 0xffffffff, 0x00000100,
	0xa200, 0xffffffff, 0x00000100,
	0xa204, 0xffffffff, 0x00000100,
	0xa208, 0xffffffff, 0x00000100,
	0xa20c, 0xffffffff, 0x00000100,
	0x971c, 0xffffffff, 0x00000100,
	0x977c, 0xffffffff, 0x00000100,
	0x3f80, 0xffffffff, 0x00000100,
	0xa210, 0xffffffff, 0x00000100,
	0xa214, 0xffffffff, 0x00000100,
	0x4d8, 0xffffffff, 0x00000100,
	0x9784, 0xffffffff, 0x00000100,
	0x9698, 0xffffffff, 0x00000100,
	0x4d4, 0xffffffff, 0x00000200,
	0x30cc, 0xffffffff, 0x00000100,
	0xd0c0, 0xffffffff, 0xff000100,
	0x802c, 0xffffffff, 0x40000000,
	0x915c, 0xffffffff, 0x00010000,
	0x9160, 0xffffffff, 0x00030002,
	0x9178, 0xffffffff, 0x00070000,
	0x917c, 0xffffffff, 0x00030002,
	0x9180, 0xffffffff, 0x00050004,
	0x918c, 0xffffffff, 0x00010006,
	0x9190, 0xffffffff, 0x00090008,
	0x9194, 0xffffffff, 0x00070000,
	0x9198, 0xffffffff, 0x00030002,
	0x919c, 0xffffffff, 0x00050004,
	0x91a8, 0xffffffff, 0x00010006,
	0x91ac, 0xffffffff, 0x00090008,
	0x91b0, 0xffffffff, 0x00070000,
	0x91b4, 0xffffffff, 0x00030002,
	0x91b8, 0xffffffff, 0x00050004,
	0x91c4, 0xffffffff, 0x00010006,
	0x91c8, 0xffffffff, 0x00090008,
	0x91cc, 0xffffffff, 0x00070000,
	0x91d0, 0xffffffff, 0x00030002,
	0x91d4, 0xffffffff, 0x00050004,
	0x91e0, 0xffffffff, 0x00010006,
	0x91e4, 0xffffffff, 0x00090008,
	0x91e8, 0xffffffff, 0x00000000,
	0x91ec, 0xffffffff, 0x00070000,
	0x91f0, 0xffffffff, 0x00030002,
	0x91f4, 0xffffffff, 0x00050004,
	0x9200, 0xffffffff, 0x00010006,
	0x9204, 0xffffffff, 0x00090008,
	0x9208, 0xffffffff, 0x00070000,
	0x920c, 0xffffffff, 0x00030002,
	0x9210, 0xffffffff, 0x00050004,
	0x921c, 0xffffffff, 0x00010006,
	0x9220, 0xffffffff, 0x00090008,
	0x9224, 0xffffffff, 0x00070000,
	0x9228, 0xffffffff, 0x00030002,
	0x922c, 0xffffffff, 0x00050004,
	0x9238, 0xffffffff, 0x00010006,
	0x923c, 0xffffffff, 0x00090008,
	0x9240, 0xffffffff, 0x00070000,
	0x9244, 0xffffffff, 0x00030002,
	0x9248, 0xffffffff, 0x00050004,
	0x9254, 0xffffffff, 0x00010006,
	0x9258, 0xffffffff, 0x00090008,
	0x925c, 0xffffffff, 0x00070000,
	0x9260, 0xffffffff, 0x00030002,
	0x9264, 0xffffffff, 0x00050004,
	0x9270, 0xffffffff, 0x00010006,
	0x9274, 0xffffffff, 0x00090008,
	0x9278, 0xffffffff, 0x00070000,
	0x927c, 0xffffffff, 0x00030002,
	0x9280, 0xffffffff, 0x00050004,
	0x928c, 0xffffffff, 0x00010006,
	0x9290, 0xffffffff, 0x00090008,
	0x9294, 0xffffffff, 0x00000000,
	0x929c, 0xffffffff, 0x00000001,
	0x802c, 0xffffffff, 0x40010000,
	0x915c, 0xffffffff, 0x00010000,
	0x9160, 0xffffffff, 0x00030002,
	0x9178, 0xffffffff, 0x00070000,
	0x917c, 0xffffffff, 0x00030002,
	0x9180, 0xffffffff, 0x00050004,
	0x918c, 0xffffffff, 0x00010006,
	0x9190, 0xffffffff, 0x00090008,
	0x9194, 0xffffffff, 0x00070000,
	0x9198, 0xffffffff, 0x00030002,
	0x919c, 0xffffffff, 0x00050004,
	0x91a8, 0xffffffff, 0x00010006,
	0x91ac, 0xffffffff, 0x00090008,
	0x91b0, 0xffffffff, 0x00070000,
	0x91b4, 0xffffffff, 0x00030002,
	0x91b8, 0xffffffff, 0x00050004,
	0x91c4, 0xffffffff, 0x00010006,
	0x91c8, 0xffffffff, 0x00090008,
	0x91cc, 0xffffffff, 0x00070000,
	0x91d0, 0xffffffff, 0x00030002,
	0x91d4, 0xffffffff, 0x00050004,
	0x91e0, 0xffffffff, 0x00010006,
	0x91e4, 0xffffffff, 0x00090008,
	0x91e8, 0xffffffff, 0x00000000,
	0x91ec, 0xffffffff, 0x00070000,
	0x91f0, 0xffffffff, 0x00030002,
	0x91f4, 0xffffffff, 0x00050004,
	0x9200, 0xffffffff, 0x00010006,
	0x9204, 0xffffffff, 0x00090008,
	0x9208, 0xffffffff, 0x00070000,
	0x920c, 0xffffffff, 0x00030002,
	0x9210, 0xffffffff, 0x00050004,
	0x921c, 0xffffffff, 0x00010006,
	0x9220, 0xffffffff, 0x00090008,
	0x9224, 0xffffffff, 0x00070000,
	0x9228, 0xffffffff, 0x00030002,
	0x922c, 0xffffffff, 0x00050004,
	0x9238, 0xffffffff, 0x00010006,
	0x923c, 0xffffffff, 0x00090008,
	0x9240, 0xffffffff, 0x00070000,
	0x9244, 0xffffffff, 0x00030002,
	0x9248, 0xffffffff, 0x00050004,
	0x9254, 0xffffffff, 0x00010006,
	0x9258, 0xffffffff, 0x00090008,
	0x925c, 0xffffffff, 0x00070000,
	0x9260, 0xffffffff, 0x00030002,
	0x9264, 0xffffffff, 0x00050004,
	0x9270, 0xffffffff, 0x00010006,
	0x9274, 0xffffffff, 0x00090008,
	0x9278, 0xffffffff, 0x00070000,
	0x927c, 0xffffffff, 0x00030002,
	0x9280, 0xffffffff, 0x00050004,
	0x928c, 0xffffffff, 0x00010006,
	0x9290, 0xffffffff, 0x00090008,
	0x9294, 0xffffffff, 0x00000000,
	0x929c, 0xffffffff, 0x00000001,
	0x802c, 0xffffffff, 0xc0000000
};

static const u32 redwood_mgcg_init[] =
{
	0x802c, 0xffffffff, 0xc0000000,
	0x5448, 0xffffffff, 0x00000100,
	0x55e4, 0xffffffff, 0x00000100,
	0x160c, 0xffffffff, 0x00000100,
	0x5644, 0xffffffff, 0x00000100,
	0xc164, 0xffffffff, 0x00000100,
	0x8a18, 0xffffffff, 0x00000100,
	0x897c, 0xffffffff, 0x06000100,
	0x8b28, 0xffffffff, 0x00000100,
	0x9144, 0xffffffff, 0x00000100,
	0x9a60, 0xffffffff, 0x00000100,
	0x9868, 0xffffffff, 0x00000100,
	0x8d58, 0xffffffff, 0x00000100,
	0x9510, 0xffffffff, 0x00000100,
	0x949c, 0xffffffff, 0x00000100,
	0x9654, 0xffffffff, 0x00000100,
	0x9030, 0xffffffff, 0x00000100,
	0x9034, 0xffffffff, 0x00000100,
	0x9038, 0xffffffff, 0x00000100,
	0x903c, 0xffffffff, 0x00000100,
	0x9040, 0xffffffff, 0x00000100,
	0xa200, 0xffffffff, 0x00000100,
	0xa204, 0xffffffff, 0x00000100,
	0xa208, 0xffffffff, 0x00000100,
	0xa20c, 0xffffffff, 0x00000100,
	0x971c, 0xffffffff, 0x00000100,
	0x977c, 0xffffffff, 0x00000100,
	0x3f80, 0xffffffff, 0x00000100,
	0xa210, 0xffffffff, 0x00000100,
	0xa214, 0xffffffff, 0x00000100,
	0x4d8, 0xffffffff, 0x00000100,
	0x9784, 0xffffffff, 0x00000100,
	0x9698, 0xffffffff, 0x00000100,
	0x4d4, 0xffffffff, 0x00000200,
	0x30cc, 0xffffffff, 0x00000100,
	0xd0c0, 0xffffffff, 0xff000100,
	0x802c, 0xffffffff, 0x40000000,
	0x915c, 0xffffffff, 0x00010000,
	0x9160, 0xffffffff, 0x00030002,
	0x9178, 0xffffffff, 0x00070000,
	0x917c, 0xffffffff, 0x00030002,
	0x9180, 0xffffffff, 0x00050004,
	0x918c, 0xffffffff, 0x00010006,
	0x9190, 0xffffffff, 0x00090008,
	0x9194, 0xffffffff, 0x00070000,
	0x9198, 0xffffffff, 0x00030002,
	0x919c, 0xffffffff, 0x00050004,
	0x91a8, 0xffffffff, 0x00010006,
	0x91ac, 0xffffffff, 0x00090008,
	0x91b0, 0xffffffff, 0x00070000,
	0x91b4, 0xffffffff, 0x00030002,
	0x91b8, 0xffffffff, 0x00050004,
	0x91c4, 0xffffffff, 0x00010006,
	0x91c8, 0xffffffff, 0x00090008,
	0x91cc, 0xffffffff, 0x00070000,
	0x91d0, 0xffffffff, 0x00030002,
	0x91d4, 0xffffffff, 0x00050004,
	0x91e0, 0xffffffff, 0x00010006,
	0x91e4, 0xffffffff, 0x00090008,
	0x91e8, 0xffffffff, 0x00000000,
	0x91ec, 0xffffffff, 0x00070000,
	0x91f0, 0xffffffff, 0x00030002,
	0x91f4, 0xffffffff, 0x00050004,
	0x9200, 0xffffffff, 0x00010006,
	0x9204, 0xffffffff, 0x00090008,
	0x9294, 0xffffffff, 0x00000000,
	0x929c, 0xffffffff, 0x00000001,
	0x802c, 0xffffffff, 0xc0000000
};

static const u32 cedar_golden_registers[] =
{
	0x3f90, 0xffff0000, 0xff000000,
	0x9148, 0xffff0000, 0xff000000,
	0x3f94, 0xffff0000, 0xff000000,
	0x914c, 0xffff0000, 0xff000000,
	0x9b7c, 0xffffffff, 0x00000000,
	0x8a14, 0xffffffff, 0x00000007,
	0x8b10, 0xffffffff, 0x00000000,
	0x960c, 0xffffffff, 0x54763210,
	0x88c4, 0xffffffff, 0x000000c2,
	0x88d4, 0xffffffff, 0x00000000,
	0x8974, 0xffffffff, 0x00000000,
	0xc78, 0x00000080, 0x00000080,
	0x5eb4, 0xffffffff, 0x00000002,
	0x5e78, 0xffffffff, 0x001000f0,
	0x6104, 0x01000300, 0x00000000,
	0x5bc0, 0x00300000, 0x00000000,
	0x7030, 0xffffffff, 0x00000011,
	0x7c30, 0xffffffff, 0x00000011,
	0x10830, 0xffffffff, 0x00000011,
	0x11430, 0xffffffff, 0x00000011,
	0xd02c, 0xffffffff, 0x08421000,
	0x240c, 0xffffffff, 0x00000380,
	0x8b24, 0xffffffff, 0x00ff0fff,
	0x28a4c, 0x06000000, 0x06000000,
	0x10c, 0x00000001, 0x00000001,
	0x8d00, 0xffffffff, 0x100e4848,
	0x8d04, 0xffffffff, 0x00164745,
	0x8c00, 0xffffffff, 0xe4000003,
	0x8c04, 0xffffffff, 0x40600060,
	0x8c08, 0xffffffff, 0x001c001c,
	0x8cf0, 0xffffffff, 0x08e00410,
	0x8c20, 0xffffffff, 0x00800080,
	0x8c24, 0xffffffff, 0x00800080,
	0x8c18, 0xffffffff, 0x20202078,
	0x8c1c, 0xffffffff, 0x00001010,
	0x28350, 0xffffffff, 0x00000000,
	0xa008, 0xffffffff, 0x00010000,
	0x5c4, 0xffffffff, 0x00000001,
	0x9508, 0xffffffff, 0x00000002
};

static const u32 cedar_mgcg_init[] =
{
	0x802c, 0xffffffff, 0xc0000000,
	0x5448, 0xffffffff, 0x00000100,
	0x55e4, 0xffffffff, 0x00000100,
	0x160c, 0xffffffff, 0x00000100,
	0x5644, 0xffffffff, 0x00000100,
	0xc164, 0xffffffff, 0x00000100,
	0x8a18, 0xffffffff, 0x00000100,
	0x897c, 0xffffffff, 0x06000100,
	0x8b28, 0xffffffff, 0x00000100,
	0x9144, 0xffffffff, 0x00000100,
	0x9a60, 0xffffffff, 0x00000100,
	0x9868, 0xffffffff, 0x00000100,
	0x8d58, 0xffffffff, 0x00000100,
	0x9510, 0xffffffff, 0x00000100,
	0x949c, 0xffffffff, 0x00000100,
	0x9654, 0xffffffff, 0x00000100,
	0x9030, 0xffffffff, 0x00000100,
	0x9034, 0xffffffff, 0x00000100,
	0x9038, 0xffffffff, 0x00000100,
	0x903c, 0xffffffff, 0x00000100,
	0x9040, 0xffffffff, 0x00000100,
	0xa200, 0xffffffff, 0x00000100,
	0xa204, 0xffffffff, 0x00000100,
	0xa208, 0xffffffff, 0x00000100,
	0xa20c, 0xffffffff, 0x00000100,
	0x971c, 0xffffffff, 0x00000100,
	0x977c, 0xffffffff, 0x00000100,
	0x3f80, 0xffffffff, 0x00000100,
	0xa210, 0xffffffff, 0x00000100,
	0xa214, 0xffffffff, 0x00000100,
	0x4d8, 0xffffffff, 0x00000100,
	0x9784, 0xffffffff, 0x00000100,
	0x9698, 0xffffffff, 0x00000100,
	0x4d4, 0xffffffff, 0x00000200,
	0x30cc, 0xffffffff, 0x00000100,
	0xd0c0, 0xffffffff, 0xff000100,
	0x802c, 0xffffffff, 0x40000000,
	0x915c, 0xffffffff, 0x00010000,
	0x9178, 0xffffffff, 0x00050000,
	0x917c, 0xffffffff, 0x00030002,
	0x918c, 0xffffffff, 0x00010004,
	0x9190, 0xffffffff, 0x00070006,
	0x9194, 0xffffffff, 0x00050000,
	0x9198, 0xffffffff, 0x00030002,
	0x91a8, 0xffffffff, 0x00010004,
	0x91ac, 0xffffffff, 0x00070006,
	0x91e8, 0xffffffff, 0x00000000,
	0x9294, 0xffffffff, 0x00000000,
	0x929c, 0xffffffff, 0x00000001,
	0x802c, 0xffffffff, 0xc0000000
};

static const u32 juniper_mgcg_init[] =
{
	0x802c, 0xffffffff, 0xc0000000,
	0x5448, 0xffffffff, 0x00000100,
	0x55e4, 0xffffffff, 0x00000100,
	0x160c, 0xffffffff, 0x00000100,
	0x5644, 0xffffffff, 0x00000100,
	0xc164, 0xffffffff, 0x00000100,
	0x8a18, 0xffffffff, 0x00000100,
	0x897c, 0xffffffff, 0x06000100,
	0x8b28, 0xffffffff, 0x00000100,
	0x9144, 0xffffffff, 0x00000100,
	0x9a60, 0xffffffff, 0x00000100,
	0x9868, 0xffffffff, 0x00000100,
	0x8d58, 0xffffffff, 0x00000100,
	0x9510, 0xffffffff, 0x00000100,
	0x949c, 0xffffffff, 0x00000100,
	0x9654, 0xffffffff, 0x00000100,
	0x9030, 0xffffffff, 0x00000100,
	0x9034, 0xffffffff, 0x00000100,
	0x9038, 0xffffffff, 0x00000100,
	0x903c, 0xffffffff, 0x00000100,
	0x9040, 0xffffffff, 0x00000100,
	0xa200, 0xffffffff, 0x00000100,
	0xa204, 0xffffffff, 0x00000100,
	0xa208, 0xffffffff, 0x00000100,
	0xa20c, 0xffffffff, 0x00000100,
	0x971c, 0xffffffff, 0x00000100,
	0xd0c0, 0xffffffff, 0xff000100,
	0x802c, 0xffffffff, 0x40000000,
	0x915c, 0xffffffff, 0x00010000,
	0x9160, 0xffffffff, 0x00030002,
	0x9178, 0xffffffff, 0x00070000,
	0x917c, 0xffffffff, 0x00030002,
	0x9180, 0xffffffff, 0x00050004,
	0x918c, 0xffffffff, 0x00010006,
	0x9190, 0xffffffff, 0x00090008,
	0x9194, 0xffffffff, 0x00070000,
	0x9198, 0xffffffff, 0x00030002,
	0x919c, 0xffffffff, 0x00050004,
	0x91a8, 0xffffffff, 0x00010006,
	0x91ac, 0xffffffff, 0x00090008,
	0x91b0, 0xffffffff, 0x00070000,
	0x91b4, 0xffffffff, 0x00030002,
	0x91b8, 0xffffffff, 0x00050004,
	0x91c4, 0xffffffff, 0x00010006,
	0x91c8, 0xffffffff, 0x00090008,
	0x91cc, 0xffffffff, 0x00070000,
	0x91d0, 0xffffffff, 0x00030002,
	0x91d4, 0xffffffff, 0x00050004,
	0x91e0, 0xffffffff, 0x00010006,
	0x91e4, 0xffffffff, 0x00090008,
	0x91e8, 0xffffffff, 0x00000000,
	0x91ec, 0xffffffff, 0x00070000,
	0x91f0, 0xffffffff, 0x00030002,
	0x91f4, 0xffffffff, 0x00050004,
	0x9200, 0xffffffff, 0x00010006,
	0x9204, 0xffffffff, 0x00090008,
	0x9208, 0xffffffff, 0x00070000,
	0x920c, 0xffffffff, 0x00030002,
	0x9210, 0xffffffff, 0x00050004,
	0x921c, 0xffffffff, 0x00010006,
	0x9220, 0xffffffff, 0x00090008,
	0x9224, 0xffffffff, 0x00070000,
	0x9228, 0xffffffff, 0x00030002,
	0x922c, 0xffffffff, 0x00050004,
	0x9238, 0xffffffff, 0x00010006,
	0x923c, 0xffffffff, 0x00090008,
	0x9240, 0xffffffff, 0x00070000,
	0x9244, 0xffffffff, 0x00030002,
	0x9248, 0xffffffff, 0x00050004,
	0x9254, 0xffffffff, 0x00010006,
	0x9258, 0xffffffff, 0x00090008,
	0x925c, 0xffffffff, 0x00070000,
	0x9260, 0xffffffff, 0x00030002,
	0x9264, 0xffffffff, 0x00050004,
	0x9270, 0xffffffff, 0x00010006,
	0x9274, 0xffffffff, 0x00090008,
	0x9278, 0xffffffff, 0x00070000,
	0x927c, 0xffffffff, 0x00030002,
	0x9280, 0xffffffff, 0x00050004,
	0x928c, 0xffffffff, 0x00010006,
	0x9290, 0xffffffff, 0x00090008,
	0x9294, 0xffffffff, 0x00000000,
	0x929c, 0xffffffff, 0x00000001,
	0x802c, 0xffffffff, 0xc0000000,
	0x977c, 0xffffffff, 0x00000100,
	0x3f80, 0xffffffff, 0x00000100,
	0xa210, 0xffffffff, 0x00000100,
	0xa214, 0xffffffff, 0x00000100,
	0x4d8, 0xffffffff, 0x00000100,
	0x9784, 0xffffffff, 0x00000100,
	0x9698, 0xffffffff, 0x00000100,
	0x4d4, 0xffffffff, 0x00000200,
	0x30cc, 0xffffffff, 0x00000100,
	0x802c, 0xffffffff, 0xc0000000
};

static const u32 supersumo_golden_registers[] =
{
	0x5eb4, 0xffffffff, 0x00000002,
	0x5c4, 0xffffffff, 0x00000001,
	0x7030, 0xffffffff, 0x00000011,
	0x7c30, 0xffffffff, 0x00000011,
	0x6104, 0x01000300, 0x00000000,
	0x5bc0, 0x00300000, 0x00000000,
	0x8c04, 0xffffffff, 0x40600060,
	0x8c08, 0xffffffff, 0x001c001c,
	0x8c20, 0xffffffff, 0x00800080,
	0x8c24, 0xffffffff, 0x00800080,
	0x8c18, 0xffffffff, 0x20202078,
	0x8c1c, 0xffffffff, 0x00001010,
	0x918c, 0xffffffff, 0x00010006,
	0x91a8, 0xffffffff, 0x00010006,
	0x91c4, 0xffffffff, 0x00010006,
	0x91e0, 0xffffffff, 0x00010006,
	0x9200, 0xffffffff, 0x00010006,
	0x9150, 0xffffffff, 0x6e944040,
	0x917c, 0xffffffff, 0x00030002,
	0x9180, 0xffffffff, 0x00050004,
	0x9198, 0xffffffff, 0x00030002,
	0x919c, 0xffffffff, 0x00050004,
	0x91b4, 0xffffffff, 0x00030002,
	0x91b8, 0xffffffff, 0x00050004,
	0x91d0, 0xffffffff, 0x00030002,
	0x91d4, 0xffffffff, 0x00050004,
	0x91f0, 0xffffffff, 0x00030002,
	0x91f4, 0xffffffff, 0x00050004,
	0x915c, 0xffffffff, 0x00010000,
	0x9160, 0xffffffff, 0x00030002,
	0x3f90, 0xffff0000, 0xff000000,
	0x9178, 0xffffffff, 0x00070000,
	0x9194, 0xffffffff, 0x00070000,
	0x91b0, 0xffffffff, 0x00070000,
	0x91cc, 0xffffffff, 0x00070000,
	0x91ec, 0xffffffff, 0x00070000,
	0x9148, 0xffff0000, 0xff000000,
	0x9190, 0xffffffff, 0x00090008,
	0x91ac, 0xffffffff, 0x00090008,
	0x91c8, 0xffffffff, 0x00090008,
	0x91e4, 0xffffffff, 0x00090008,
	0x9204, 0xffffffff, 0x00090008,
	0x3f94, 0xffff0000, 0xff000000,
	0x914c, 0xffff0000, 0xff000000,
	0x929c, 0xffffffff, 0x00000001,
	0x8a18, 0xffffffff, 0x00000100,
	0x8b28, 0xffffffff, 0x00000100,
	0x9144, 0xffffffff, 0x00000100,
	0x5644, 0xffffffff, 0x00000100,
	0x9b7c, 0xffffffff, 0x00000000,
	0x8030, 0xffffffff, 0x0000100a,
	0x8a14, 0xffffffff, 0x00000007,
	0x8b24, 0xffffffff, 0x00ff0fff,
	0x8b10, 0xffffffff, 0x00000000,
	0x28a4c, 0x06000000, 0x06000000,
	0x4d8, 0xffffffff, 0x00000100,
	0x913c, 0xffff000f, 0x0100000a,
	0x960c, 0xffffffff, 0x54763210,
	0x88c4, 0xffffffff, 0x000000c2,
	0x88d4, 0xffffffff, 0x00000010,
	0x8974, 0xffffffff, 0x00000000,
	0xc78, 0x00000080, 0x00000080,
	0x5e78, 0xffffffff, 0x001000f0,
	0xd02c, 0xffffffff, 0x08421000,
	0xa008, 0xffffffff, 0x00010000,
	0x8d00, 0xffffffff, 0x100e4848,
	0x8d04, 0xffffffff, 0x00164745,
	0x8c00, 0xffffffff, 0xe4000003,
	0x8cf0, 0x1fffffff, 0x08e00620,
	0x28350, 0xffffffff, 0x00000000,
	0x9508, 0xffffffff, 0x00000002
};

static const u32 sumo_golden_registers[] =
{
	0x900c, 0x00ffffff, 0x0017071f,
	0x8c18, 0xffffffff, 0x10101060,
	0x8c1c, 0xffffffff, 0x00001010,
	0x8c30, 0x0000000f, 0x00000005,
	0x9688, 0x0000000f, 0x00000007
};

static const u32 wrestler_golden_registers[] =
{
	0x5eb4, 0xffffffff, 0x00000002,
	0x5c4, 0xffffffff, 0x00000001,
	0x7030, 0xffffffff, 0x00000011,
	0x7c30, 0xffffffff, 0x00000011,
	0x6104, 0x01000300, 0x00000000,
	0x5bc0, 0x00300000, 0x00000000,
	0x918c, 0xffffffff, 0x00010006,
	0x91a8, 0xffffffff, 0x00010006,
	0x9150, 0xffffffff, 0x6e944040,
	0x917c, 0xffffffff, 0x00030002,
	0x9198, 0xffffffff, 0x00030002,
	0x915c, 0xffffffff, 0x00010000,
	0x3f90, 0xffff0000, 0xff000000,
	0x9178, 0xffffffff, 0x00070000,
	0x9194, 0xffffffff, 0x00070000,
	0x9148, 0xffff0000, 0xff000000,
	0x9190, 0xffffffff, 0x00090008,
	0x91ac, 0xffffffff, 0x00090008,
	0x3f94, 0xffff0000, 0xff000000,
	0x914c, 0xffff0000, 0xff000000,
	0x929c, 0xffffffff, 0x00000001,
	0x8a18, 0xffffffff, 0x00000100,
	0x8b28, 0xffffffff, 0x00000100,
	0x9144, 0xffffffff, 0x00000100,
	0x9b7c, 0xffffffff, 0x00000000,
	0x8030, 0xffffffff, 0x0000100a,
	0x8a14, 0xffffffff, 0x00000001,
	0x8b24, 0xffffffff, 0x00ff0fff,
	0x8b10, 0xffffffff, 0x00000000,
	0x28a4c, 0x06000000, 0x06000000,
	0x4d8, 0xffffffff, 0x00000100,
	0x913c, 0xffff000f, 0x0100000a,
	0x960c, 0xffffffff, 0x54763210,
	0x88c4, 0xffffffff, 0x000000c2,
	0x88d4, 0xffffffff, 0x00000010,
	0x8974, 0xffffffff, 0x00000000,
	0xc78, 0x00000080, 0x00000080,
	0x5e78, 0xffffffff, 0x001000f0,
	0xd02c, 0xffffffff, 0x08421000,
	0xa008, 0xffffffff, 0x00010000,
	0x8d00, 0xffffffff, 0x100e4848,
	0x8d04, 0xffffffff, 0x00164745,
	0x8c00, 0xffffffff, 0xe4000003,
	0x8cf0, 0x1fffffff, 0x08e00410,
	0x28350, 0xffffffff, 0x00000000,
	0x9508, 0xffffffff, 0x00000002,
	0x900c, 0xffffffff, 0x0017071f,
	0x8c18, 0xffffffff, 0x10101060,
	0x8c1c, 0xffffffff, 0x00001010
};

static const u32 barts_golden_registers[] =
{
	0x5eb4, 0xffffffff, 0x00000002,
	0x5e78, 0x8f311ff1, 0x001000f0,
	0x3f90, 0xffff0000, 0xff000000,
	0x9148, 0xffff0000, 0xff000000,
	0x3f94, 0xffff0000, 0xff000000,
	0x914c, 0xffff0000, 0xff000000,
	0xc78, 0x00000080, 0x00000080,
	0xbd4, 0x70073777, 0x00010001,
	0xd02c, 0xbfffff1f, 0x08421000,
	0xd0b8, 0x03773777, 0x02011003,
	0x5bc0, 0x00200000, 0x50100000,
	0x98f8, 0x33773777, 0x02011003,
	0x98fc, 0xffffffff, 0x76543210,
	0x7030, 0x31000311, 0x00000011,
	0x2f48, 0x00000007, 0x02011003,
	0x6b28, 0x00000010, 0x00000012,
	0x7728, 0x00000010, 0x00000012,
	0x10328, 0x00000010, 0x00000012,
	0x10f28, 0x00000010, 0x00000012,
	0x11b28, 0x00000010, 0x00000012,
	0x12728, 0x00000010, 0x00000012,
	0x240c, 0x000007ff, 0x00000380,
	0x8a14, 0xf000001f, 0x00000007,
	0x8b24, 0x3fff3fff, 0x00ff0fff,
	0x8b10, 0x0000ff0f, 0x00000000,
	0x28a4c, 0x07ffffff, 0x06000000,
	0x10c, 0x00000001, 0x00010003,
	0xa02c, 0xffffffff, 0x0000009b,
	0x913c, 0x0000000f, 0x0100000a,
	0x8d00, 0xffff7f7f, 0x100e4848,
	0x8d04, 0x00ffffff, 0x00164745,
	0x8c00, 0xfffc0003, 0xe4000003,
	0x8c04, 0xf8ff00ff, 0x40600060,
	0x8c08, 0x00ff00ff, 0x001c001c,
	0x8cf0, 0x1fff1fff, 0x08e00620,
	0x8c20, 0x0fff0fff, 0x00800080,
	0x8c24, 0x0fff0fff, 0x00800080,
	0x8c18, 0xffffffff, 0x20202078,
	0x8c1c, 0x0000ffff, 0x00001010,
	0x28350, 0x00000f01, 0x00000000,
	0x9508, 0x3700001f, 0x00000002,
	0x960c, 0xffffffff, 0x54763210,
	0x88c4, 0x001f3ae3, 0x000000c2,
	0x88d4, 0x0000001f, 0x00000010,
	0x8974, 0xffffffff, 0x00000000
};

static const u32 turks_golden_registers[] =
{
	0x5eb4, 0xffffffff, 0x00000002,
	0x5e78, 0x8f311ff1, 0x001000f0,
	0x8c8, 0x00003000, 0x00001070,
	0x8cc, 0x000fffff, 0x00040035,
	0x3f90, 0xffff0000, 0xfff00000,
	0x9148, 0xffff0000, 0xfff00000,
	0x3f94, 0xffff0000, 0xfff00000,
	0x914c, 0xffff0000, 0xfff00000,
	0xc78, 0x00000080, 0x00000080,
	0xbd4, 0x00073007, 0x00010002,
	0xd02c, 0xbfffff1f, 0x08421000,
	0xd0b8, 0x03773777, 0x02010002,
	0x5bc0, 0x00200000, 0x50100000,
	0x98f8, 0x33773777, 0x00010002,
	0x98fc, 0xffffffff, 0x33221100,
	0x7030, 0x31000311, 0x00000011,
	0x2f48, 0x33773777, 0x00010002,
	0x6b28, 0x00000010, 0x00000012,
	0x7728, 0x00000010, 0x00000012,
	0x10328, 0x00000010, 0x00000012,
	0x10f28, 0x00000010, 0x00000012,
	0x11b28, 0x00000010, 0x00000012,
	0x12728, 0x00000010, 0x00000012,
	0x240c, 0x000007ff, 0x00000380,
	0x8a14, 0xf000001f, 0x00000007,
	0x8b24, 0x3fff3fff, 0x00ff0fff,
	0x8b10, 0x0000ff0f, 0x00000000,
	0x28a4c, 0x07ffffff, 0x06000000,
	0x10c, 0x00000001, 0x00010003,
	0xa02c, 0xffffffff, 0x0000009b,
	0x913c, 0x0000000f, 0x0100000a,
	0x8d00, 0xffff7f7f, 0x100e4848,
	0x8d04, 0x00ffffff, 0x00164745,
	0x8c00, 0xfffc0003, 0xe4000003,
	0x8c04, 0xf8ff00ff, 0x40600060,
	0x8c08, 0x00ff00ff, 0x001c001c,
	0x8cf0, 0x1fff1fff, 0x08e00410,
	0x8c20, 0x0fff0fff, 0x00800080,
	0x8c24, 0x0fff0fff, 0x00800080,
	0x8c18, 0xffffffff, 0x20202078,
	0x8c1c, 0x0000ffff, 0x00001010,
	0x28350, 0x00000f01, 0x00000000,
	0x9508, 0x3700001f, 0x00000002,
	0x960c, 0xffffffff, 0x54763210,
	0x88c4, 0x001f3ae3, 0x000000c2,
	0x88d4, 0x0000001f, 0x00000010,
	0x8974, 0xffffffff, 0x00000000
};

static const u32 caicos_golden_registers[] =
{
	0x5eb4, 0xffffffff, 0x00000002,
	0x5e78, 0x8f311ff1, 0x001000f0,
	0x8c8, 0x00003420, 0x00001450,
	0x8cc, 0x000fffff, 0x00040035,
	0x3f90, 0xffff0000, 0xfffc0000,
	0x9148, 0xffff0000, 0xfffc0000,
	0x3f94, 0xffff0000, 0xfffc0000,
	0x914c, 0xffff0000, 0xfffc0000,
	0xc78, 0x00000080, 0x00000080,
	0xbd4, 0x00073007, 0x00010001,
	0xd02c, 0xbfffff1f, 0x08421000,
	0xd0b8, 0x03773777, 0x02010001,
	0x5bc0, 0x00200000, 0x50100000,
	0x98f8, 0x33773777, 0x02010001,
	0x98fc, 0xffffffff, 0x33221100,
	0x7030, 0x31000311, 0x00000011,
	0x2f48, 0x33773777, 0x02010001,
	0x6b28, 0x00000010, 0x00000012,
	0x7728, 0x00000010, 0x00000012,
	0x10328, 0x00000010, 0x00000012,
	0x10f28, 0x00000010, 0x00000012,
	0x11b28, 0x00000010, 0x00000012,
	0x12728, 0x00000010, 0x00000012,
	0x240c, 0x000007ff, 0x00000380,
	0x8a14, 0xf000001f, 0x00000001,
	0x8b24, 0x3fff3fff, 0x00ff0fff,
	0x8b10, 0x0000ff0f, 0x00000000,
	0x28a4c, 0x07ffffff, 0x06000000,
	0x10c, 0x00000001, 0x00010003,
	0xa02c, 0xffffffff, 0x0000009b,
	0x913c, 0x0000000f, 0x0100000a,
	0x8d00, 0xffff7f7f, 0x100e4848,
	0x8d04, 0x00ffffff, 0x00164745,
	0x8c00, 0xfffc0003, 0xe4000003,
	0x8c04, 0xf8ff00ff, 0x40600060,
	0x8c08, 0x00ff00ff, 0x001c001c,
	0x8cf0, 0x1fff1fff, 0x08e00410,
	0x8c20, 0x0fff0fff, 0x00800080,
	0x8c24, 0x0fff0fff, 0x00800080,
	0x8c18, 0xffffffff, 0x20202078,
	0x8c1c, 0x0000ffff, 0x00001010,
	0x28350, 0x00000f01, 0x00000000,
	0x9508, 0x3700001f, 0x00000002,
	0x960c, 0xffffffff, 0x54763210,
	0x88c4, 0x001f3ae3, 0x000000c2,
	0x88d4, 0x0000001f, 0x00000010,
	0x8974, 0xffffffff, 0x00000000
};

static void evergreen_init_golden_registers(struct radeon_device *rdev)
{
	switch (rdev->family) {
	case CHIP_CYPRESS:
	case CHIP_HEMLOCK:
		radeon_program_register_sequence(rdev,
						 evergreen_golden_registers,
						 (const u32)ARRAY_SIZE(evergreen_golden_registers));
		radeon_program_register_sequence(rdev,
						 evergreen_golden_registers2,
						 (const u32)ARRAY_SIZE(evergreen_golden_registers2));
		radeon_program_register_sequence(rdev,
						 cypress_mgcg_init,
						 (const u32)ARRAY_SIZE(cypress_mgcg_init));
		break;
	case CHIP_JUNIPER:
		radeon_program_register_sequence(rdev,
						 evergreen_golden_registers,
						 (const u32)ARRAY_SIZE(evergreen_golden_registers));
		radeon_program_register_sequence(rdev,
						 evergreen_golden_registers2,
						 (const u32)ARRAY_SIZE(evergreen_golden_registers2));
		radeon_program_register_sequence(rdev,
						 juniper_mgcg_init,
						 (const u32)ARRAY_SIZE(juniper_mgcg_init));
		break;
	case CHIP_REDWOOD:
		radeon_program_register_sequence(rdev,
						 evergreen_golden_registers,
						 (const u32)ARRAY_SIZE(evergreen_golden_registers));
		radeon_program_register_sequence(rdev,
						 evergreen_golden_registers2,
						 (const u32)ARRAY_SIZE(evergreen_golden_registers2));
		radeon_program_register_sequence(rdev,
						 redwood_mgcg_init,
						 (const u32)ARRAY_SIZE(redwood_mgcg_init));
		break;
	case CHIP_CEDAR:
		radeon_program_register_sequence(rdev,
						 cedar_golden_registers,
						 (const u32)ARRAY_SIZE(cedar_golden_registers));
		radeon_program_register_sequence(rdev,
						 evergreen_golden_registers2,
						 (const u32)ARRAY_SIZE(evergreen_golden_registers2));
		radeon_program_register_sequence(rdev,
						 cedar_mgcg_init,
						 (const u32)ARRAY_SIZE(cedar_mgcg_init));
		break;
	case CHIP_PALM:
		radeon_program_register_sequence(rdev,
						 wrestler_golden_registers,
						 (const u32)ARRAY_SIZE(wrestler_golden_registers));
		break;
	case CHIP_SUMO:
		radeon_program_register_sequence(rdev,
						 supersumo_golden_registers,
						 (const u32)ARRAY_SIZE(supersumo_golden_registers));
		break;
	case CHIP_SUMO2:
		radeon_program_register_sequence(rdev,
						 supersumo_golden_registers,
						 (const u32)ARRAY_SIZE(supersumo_golden_registers));
		radeon_program_register_sequence(rdev,
						 sumo_golden_registers,
						 (const u32)ARRAY_SIZE(sumo_golden_registers));
		break;
	case CHIP_BARTS:
		radeon_program_register_sequence(rdev,
						 barts_golden_registers,
						 (const u32)ARRAY_SIZE(barts_golden_registers));
		break;
	case CHIP_TURKS:
		radeon_program_register_sequence(rdev,
						 turks_golden_registers,
						 (const u32)ARRAY_SIZE(turks_golden_registers));
		break;
	case CHIP_CAICOS:
		radeon_program_register_sequence(rdev,
						 caicos_golden_registers,
						 (const u32)ARRAY_SIZE(caicos_golden_registers));
		break;
	default:
		break;
	}
}

/**
 * evergreen_get_allowed_info_register - fetch the register for the info ioctl
 *
 * @rdev: radeon_device pointer
 * @reg: register offset in bytes
 * @val: register value
 *
 * Returns 0 for success or -EINVAL for an invalid register
 *
 */
int evergreen_get_allowed_info_register(struct radeon_device *rdev,
					u32 reg, u32 *val)
{
	switch (reg) {
	case GRBM_STATUS:
	case GRBM_STATUS_SE0:
	case GRBM_STATUS_SE1:
	case SRBM_STATUS:
	case SRBM_STATUS2:
	case DMA_STATUS_REG:
	case UVD_STATUS:
		*val = RREG32(reg);
		return 0;
	default:
		return -EINVAL;
	}
}

void evergreen_tiling_fields(unsigned tiling_flags, unsigned *bankw,
			     unsigned *bankh, unsigned *mtaspect,
			     unsigned *tile_split)
{
	*bankw = (tiling_flags >> RADEON_TILING_EG_BANKW_SHIFT) & RADEON_TILING_EG_BANKW_MASK;
	*bankh = (tiling_flags >> RADEON_TILING_EG_BANKH_SHIFT) & RADEON_TILING_EG_BANKH_MASK;
	*mtaspect = (tiling_flags >> RADEON_TILING_EG_MACRO_TILE_ASPECT_SHIFT) & RADEON_TILING_EG_MACRO_TILE_ASPECT_MASK;
	*tile_split = (tiling_flags >> RADEON_TILING_EG_TILE_SPLIT_SHIFT) & RADEON_TILING_EG_TILE_SPLIT_MASK;
	switch (*bankw) {
	default:
	case 1: *bankw = EVERGREEN_ADDR_SURF_BANK_WIDTH_1; break;
	case 2: *bankw = EVERGREEN_ADDR_SURF_BANK_WIDTH_2; break;
	case 4: *bankw = EVERGREEN_ADDR_SURF_BANK_WIDTH_4; break;
	case 8: *bankw = EVERGREEN_ADDR_SURF_BANK_WIDTH_8; break;
	}
	switch (*bankh) {
	default:
	case 1: *bankh = EVERGREEN_ADDR_SURF_BANK_HEIGHT_1; break;
	case 2: *bankh = EVERGREEN_ADDR_SURF_BANK_HEIGHT_2; break;
	case 4: *bankh = EVERGREEN_ADDR_SURF_BANK_HEIGHT_4; break;
	case 8: *bankh = EVERGREEN_ADDR_SURF_BANK_HEIGHT_8; break;
	}
	switch (*mtaspect) {
	default:
	case 1: *mtaspect = EVERGREEN_ADDR_SURF_MACRO_TILE_ASPECT_1; break;
	case 2: *mtaspect = EVERGREEN_ADDR_SURF_MACRO_TILE_ASPECT_2; break;
	case 4: *mtaspect = EVERGREEN_ADDR_SURF_MACRO_TILE_ASPECT_4; break;
	case 8: *mtaspect = EVERGREEN_ADDR_SURF_MACRO_TILE_ASPECT_8; break;
	}
}

static int sumo_set_uvd_clock(struct radeon_device *rdev, u32 clock,
			      u32 cntl_reg, u32 status_reg)
{
	int r, i;
	struct atom_clock_dividers dividers;

	r = radeon_atom_get_clock_dividers(rdev, COMPUTE_ENGINE_PLL_PARAM,
					   clock, false, &dividers);
	if (r)
		return r;

	WREG32_P(cntl_reg, dividers.post_div, ~(DCLK_DIR_CNTL_EN|DCLK_DIVIDER_MASK));

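	/* wait up to ~1 second (100 * 10 ms) for the new divider to take effect */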
	for (i = 0; i < 100; i++) {
		if (RREG32(status_reg) & DCLK_STATUS)
			break;
		mdelay(10);
	}
	if (i == 100)
		return -ETIMEDOUT;

	return 0;
}

int sumo_set_uvd_clocks(struct radeon_device *rdev, u32 vclk, u32 dclk)
{
	int r = 0;
	u32 cg_scratch = RREG32(CG_SCRATCH1);

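	/*
	 * Program VCLK first, then DCLK.  The frequencies that were set
	 * (in MHz) are cached in CG_SCRATCH1: VCLK in the low 16 bits,
	 * DCLK in the high 16 bits.
	 */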
	r = sumo_set_uvd_clock(rdev, vclk, CG_VCLK_CNTL, CG_VCLK_STATUS);
	if (r)
		goto done;
	cg_scratch &= 0xffff0000;
	cg_scratch |= vclk / 100; /* MHz */

	r = sumo_set_uvd_clock(rdev, dclk, CG_DCLK_CNTL, CG_DCLK_STATUS);
	if (r)
		goto done;
	cg_scratch &= 0x0000ffff;
	cg_scratch |= (dclk / 100) << 16; /* MHz */

done:
	WREG32(CG_SCRATCH1, cg_scratch);

	return r;
}

int evergreen_set_uvd_clocks(struct radeon_device *rdev, u32 vclk, u32 dclk)
{
	/* start off with something large */
	unsigned fb_div = 0, vclk_div = 0, dclk_div = 0;
	int r;

	/* bypass vclk and dclk with bclk */
	WREG32_P(CG_UPLL_FUNC_CNTL_2,
		 VCLK_SRC_SEL(1) | DCLK_SRC_SEL(1),
		 ~(VCLK_SRC_SEL_MASK | DCLK_SRC_SEL_MASK));

	/* put PLL in bypass mode */
	WREG32_P(CG_UPLL_FUNC_CNTL, UPLL_BYPASS_EN_MASK, ~UPLL_BYPASS_EN_MASK);

	if (!vclk || !dclk) {
		/* keep the Bypass mode, put PLL to sleep */
		WREG32_P(CG_UPLL_FUNC_CNTL, UPLL_SLEEP_MASK, ~UPLL_SLEEP_MASK);
		return 0;
	}

	r = radeon_uvd_calc_upll_dividers(rdev, vclk, dclk, 125000, 250000,
					  16384, 0x03FFFFFF, 0, 128, 5,
					  &fb_div, &vclk_div, &dclk_div);
	if (r)
		return r;

	/* set VCO_MODE to 1 */
	WREG32_P(CG_UPLL_FUNC_CNTL, UPLL_VCO_MODE_MASK, ~UPLL_VCO_MODE_MASK);

	/* toggle UPLL_SLEEP to 1 then back to 0 */
	WREG32_P(CG_UPLL_FUNC_CNTL, UPLL_SLEEP_MASK, ~UPLL_SLEEP_MASK);
	WREG32_P(CG_UPLL_FUNC_CNTL, 0, ~UPLL_SLEEP_MASK);

	/* deassert UPLL_RESET */
	WREG32_P(CG_UPLL_FUNC_CNTL, 0, ~UPLL_RESET_MASK);

	mdelay(1);

	r = radeon_uvd_send_upll_ctlreq(rdev, CG_UPLL_FUNC_CNTL);
	if (r)
		return r;

	/* assert UPLL_RESET again */
	WREG32_P(CG_UPLL_FUNC_CNTL, UPLL_RESET_MASK, ~UPLL_RESET_MASK);

	/* disable spread spectrum. */
	WREG32_P(CG_UPLL_SPREAD_SPECTRUM, 0, ~SSEN_MASK);

	/* set feedback divider */
	WREG32_P(CG_UPLL_FUNC_CNTL_3, UPLL_FB_DIV(fb_div), ~UPLL_FB_DIV_MASK);

	/* set ref divider to 0 */
	WREG32_P(CG_UPLL_FUNC_CNTL, 0, ~UPLL_REF_DIV_MASK);

	if (fb_div < 307200)
		WREG32_P(CG_UPLL_FUNC_CNTL_4, 0, ~UPLL_SPARE_ISPARE9);
	else
		WREG32_P(CG_UPLL_FUNC_CNTL_4, UPLL_SPARE_ISPARE9, ~UPLL_SPARE_ISPARE9);

	/* set PDIV_A and PDIV_B */
	WREG32_P(CG_UPLL_FUNC_CNTL_2,
		 UPLL_PDIV_A(vclk_div) | UPLL_PDIV_B(dclk_div),
		 ~(UPLL_PDIV_A_MASK | UPLL_PDIV_B_MASK));

	/* give the PLL some time to settle */
	mdelay(15);

	/* deassert PLL_RESET */
	WREG32_P(CG_UPLL_FUNC_CNTL, 0, ~UPLL_RESET_MASK);

	mdelay(15);

	/* switch from bypass mode to normal mode */
	WREG32_P(CG_UPLL_FUNC_CNTL, 0, ~UPLL_BYPASS_EN_MASK);

	r = radeon_uvd_send_upll_ctlreq(rdev, CG_UPLL_FUNC_CNTL);
	if (r)
		return r;

	/* switch VCLK and DCLK selection */
	WREG32_P(CG_UPLL_FUNC_CNTL_2,
		 VCLK_SRC_SEL(2) | DCLK_SRC_SEL(2),
		 ~(VCLK_SRC_SEL_MASK | DCLK_SRC_SEL_MASK));

	mdelay(100);

	return 0;
}

void evergreen_fix_pci_max_read_req_size(struct radeon_device *rdev)
{
	int readrq;
	u16 v;

	readrq = pcie_get_readrq(rdev->pdev);
	v = ffs(readrq) - 8;
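	/*
	 * MAX_READ_REQUEST_SIZE is encoded as a power of two:
	 * 128 bytes -> 0, 256 -> 1, ... 4096 -> 5; encodings 6 and 7
	 * are reserved by the PCIe spec.
	 */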
	/* if bios or OS sets MAX_READ_REQUEST_SIZE to an invalid value, fix it
	 * to avoid hangs or performance issues
	 */
	if ((v == 0) || (v == 6) || (v == 7))
		pcie_set_readrq(rdev->pdev, 512);
}

void dce4_program_fmt(struct drm_encoder *encoder)
{
	struct drm_device *dev = encoder->dev;
	struct radeon_device *rdev = dev->dev_private;
	struct radeon_encoder *radeon_encoder = to_radeon_encoder(encoder);
	struct radeon_crtc *radeon_crtc = to_radeon_crtc(encoder->crtc);
	struct drm_connector *connector = radeon_get_connector_for_encoder(encoder);
	int bpc = 0;
	u32 tmp = 0;
	enum radeon_connector_dither dither = RADEON_FMT_DITHER_DISABLE;

	if (connector) {
		struct radeon_connector *radeon_connector = to_radeon_connector(connector);
		bpc = radeon_get_monitor_bpc(connector);
		dither = radeon_connector->dither;
	}

	/* LVDS/eDP FMT is set up by atom */
	if (radeon_encoder->devices & ATOM_DEVICE_LCD_SUPPORT)
		return;

	/* not needed for analog */
	if ((radeon_encoder->encoder_id == ENCODER_OBJECT_ID_INTERNAL_KLDSCP_DAC1) ||
	    (radeon_encoder->encoder_id == ENCODER_OBJECT_ID_INTERNAL_KLDSCP_DAC2))
		return;

	if (bpc == 0)
		return;

	switch (bpc) {
	case 6:
		if (dither == RADEON_FMT_DITHER_ENABLE)
			/* XXX sort out optimal dither settings */
			tmp |= (FMT_FRAME_RANDOM_ENABLE | FMT_HIGHPASS_RANDOM_ENABLE |
				FMT_SPATIAL_DITHER_EN);
		else
			tmp |= FMT_TRUNCATE_EN;
		break;
	case 8:
		if (dither == RADEON_FMT_DITHER_ENABLE)
			/* XXX sort out optimal dither settings */
			tmp |= (FMT_FRAME_RANDOM_ENABLE | FMT_HIGHPASS_RANDOM_ENABLE |
				FMT_RGB_RANDOM_ENABLE |
				FMT_SPATIAL_DITHER_EN | FMT_SPATIAL_DITHER_DEPTH);
		else
			tmp |= (FMT_TRUNCATE_EN | FMT_TRUNCATE_DEPTH);
		break;
	case 10:
	default:
		/* not needed */
		break;
	}

	WREG32(FMT_BIT_DEPTH_CONTROL + radeon_crtc->crtc_offset, tmp);
}

static bool dce4_is_in_vblank(struct radeon_device *rdev, int crtc)
{
	if (RREG32(EVERGREEN_CRTC_STATUS + crtc_offsets[crtc]) & EVERGREEN_CRTC_V_BLANK)
		return true;
	else
		return false;
}

static bool dce4_is_counter_moving(struct radeon_device *rdev, int crtc)
{
	u32 pos1, pos2;

	pos1 = RREG32(EVERGREEN_CRTC_STATUS_POSITION + crtc_offsets[crtc]);
	pos2 = RREG32(EVERGREEN_CRTC_STATUS_POSITION + crtc_offsets[crtc]);

	if (pos1 != pos2)
		return true;
	else
		return false;
}

/**
 * dce4_wait_for_vblank - vblank wait asic callback.
 *
 * @rdev: radeon_device pointer
 * @crtc: crtc to wait for vblank on
 *
 * Wait for vblank on the requested crtc (evergreen+).
 */
void dce4_wait_for_vblank(struct radeon_device *rdev, int crtc)
{
	unsigned i = 0;

	if (crtc >= rdev->num_crtc)
		return;

	if (!(RREG32(EVERGREEN_CRTC_CONTROL + crtc_offsets[crtc]) & EVERGREEN_CRTC_MASTER_EN))
		return;

	/* depending on when we hit vblank, we may be close to active; if so,
	 * wait for another frame.
	 */
	while (dce4_is_in_vblank(rdev, crtc)) {
		if (i++ % 100 == 0) {
			if (!dce4_is_counter_moving(rdev, crtc))
				break;
		}
	}

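	/* now wait for the start of the next vblank period */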
	while (!dce4_is_in_vblank(rdev, crtc)) {
		if (i++ % 100 == 0) {
			if (!dce4_is_counter_moving(rdev, crtc))
				break;
		}
	}
}

/**
 * evergreen_page_flip - pageflip callback.
 *
 * @rdev: radeon_device pointer
 * @crtc_id: crtc to cleanup pageflip on
 * @crtc_base: new address of the crtc (GPU MC address)
 * @async: asynchronous flip
 *
 * Triggers the actual pageflip by updating the primary
 * surface base address (evergreen+).
 */
void evergreen_page_flip(struct radeon_device *rdev, int crtc_id, u64 crtc_base,
			 bool async)
{
	struct radeon_crtc *radeon_crtc = rdev->mode_info.crtcs[crtc_id];

	/* update the scanout addresses */
	WREG32(EVERGREEN_GRPH_FLIP_CONTROL + radeon_crtc->crtc_offset,
	       async ? EVERGREEN_GRPH_SURFACE_UPDATE_H_RETRACE_EN : 0);
	WREG32(EVERGREEN_GRPH_PRIMARY_SURFACE_ADDRESS_HIGH + radeon_crtc->crtc_offset,
	       upper_32_bits(crtc_base));
	WREG32(EVERGREEN_GRPH_PRIMARY_SURFACE_ADDRESS + radeon_crtc->crtc_offset,
	       (u32)crtc_base);
	/* post the write */
	RREG32(EVERGREEN_GRPH_PRIMARY_SURFACE_ADDRESS + radeon_crtc->crtc_offset);
}

/**
 * evergreen_page_flip_pending - check if page flip is still pending
 *
 * @rdev: radeon_device pointer
 * @crtc_id: crtc to check
 *
 * Returns the current update pending status.
 */
bool evergreen_page_flip_pending(struct radeon_device *rdev, int crtc_id)
{
	struct radeon_crtc *radeon_crtc = rdev->mode_info.crtcs[crtc_id];

	/* Return current update_pending status: */
	return !!(RREG32(EVERGREEN_GRPH_UPDATE + radeon_crtc->crtc_offset) &
		  EVERGREEN_GRPH_SURFACE_UPDATE_PENDING);
}

/* get temperature in millidegrees */
int evergreen_get_temp(struct radeon_device *rdev)
{
	u32 temp, toffset;
	int actual_temp = 0;

	if (rdev->family == CHIP_JUNIPER) {
		toffset = (RREG32(CG_THERMAL_CTRL) & TOFFSET_MASK) >>
			TOFFSET_SHIFT;
		temp = (RREG32(CG_TS0_STATUS) & TS0_ADC_DOUT_MASK) >>
			TS0_ADC_DOUT_SHIFT;

		if (toffset & 0x100)
			actual_temp = temp / 2 - (0x200 - toffset);
		else
			actual_temp = temp / 2 + toffset;

		actual_temp = actual_temp * 1000;

	} else {
		temp = (RREG32(CG_MULT_THERMAL_STATUS) & ASIC_T_MASK) >>
			ASIC_T_SHIFT;

		if (temp & 0x400)
			actual_temp = -256;
		else if (temp & 0x200)
			actual_temp = 255;
		else if (temp & 0x100) {
			actual_temp = temp & 0x1ff;
			actual_temp |= ~0x1ff;
		} else
			actual_temp = temp & 0xff;

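		/* the raw reading is in units of 0.5 degrees C */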
		actual_temp = (actual_temp * 1000) / 2;
	}

	return actual_temp;
}

int sumo_get_temp(struct radeon_device *rdev)
{
	u32 temp = RREG32(CG_THERMAL_STATUS) & 0xff;
	int actual_temp = temp - 49;

	return actual_temp * 1000;
}

/**
 * sumo_pm_init_profile - Initialize power profiles callback.
 *
 * @rdev: radeon_device pointer
 *
 * Initialize the power states used in profile mode
 * (sumo, trinity, SI).
 * Used for profile mode only.
 */
void sumo_pm_init_profile(struct radeon_device *rdev)
{
	int idx;

	/* default */
	rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_ps_idx = rdev->pm.default_power_state_index;
	rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_ps_idx = rdev->pm.default_power_state_index;
	rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_cm_idx = 0;
	rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_cm_idx = 0;

	/* low,mid sh/mh */
	if (rdev->flags & RADEON_IS_MOBILITY)
		idx = radeon_pm_get_type_index(rdev, POWER_STATE_TYPE_BATTERY, 0);
	else
		idx = radeon_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 0);

	rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_cm_idx = 0;
	rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_cm_idx = 0;

	rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_cm_idx = 0;
	rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_cm_idx = 0;

	rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_cm_idx = 0;
	rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_cm_idx = 0;

	rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_cm_idx = 0;
	rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_cm_idx = 0;

	/* high sh/mh */
	idx = radeon_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 0);
	rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_cm_idx = 0;
	rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_cm_idx =
		rdev->pm.power_state[idx].num_clock_modes - 1;

	rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_cm_idx = 0;
	rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_cm_idx =
		rdev->pm.power_state[idx].num_clock_modes - 1;
}

/**
 * btc_pm_init_profile - Initialize power profiles callback.
 *
 * @rdev: radeon_device pointer
 *
 * Initialize the power states used in profile mode
 * (BTC, cayman).
 * Used for profile mode only.
 */
void btc_pm_init_profile(struct radeon_device *rdev)
{
	int idx;

	/* default */
	rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_ps_idx = rdev->pm.default_power_state_index;
	rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_ps_idx = rdev->pm.default_power_state_index;
	rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_cm_idx = 0;
	rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_cm_idx = 2;
	/* starting with BTC, there is one state that is used for both
	 * MH and SH. Difference is that we always use the high clock index for
	 * mclk.
	 */
	if (rdev->flags & RADEON_IS_MOBILITY)
		idx = radeon_pm_get_type_index(rdev, POWER_STATE_TYPE_BATTERY, 0);
	else
		idx = radeon_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 0);
	/* low sh */
	rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_cm_idx = 0;
	rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_cm_idx = 0;
	/* mid sh */
	rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_cm_idx = 0;
	rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_cm_idx = 1;
	/* high sh */
	rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_cm_idx = 0;
	rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_cm_idx = 2;
	/* low mh */
	rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_cm_idx = 0;
	rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_cm_idx = 0;
	/* mid mh */
	rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_cm_idx = 0;
	rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_cm_idx = 1;
	/* high mh */
	rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_ps_idx = idx;
	rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_cm_idx = 0;
	rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_cm_idx = 2;
}

/**
 * evergreen_pm_misc - set additional pm hw parameters callback.
 *
 * @rdev: radeon_device pointer
 *
 * Set non-clock parameters associated with a power state
 * (voltage, etc.) (evergreen+).
 */
void evergreen_pm_misc(struct radeon_device *rdev)
{
	int req_ps_idx = rdev->pm.requested_power_state_index;
	int req_cm_idx = rdev->pm.requested_clock_mode_index;
	struct radeon_power_state *ps = &rdev->pm.power_state[req_ps_idx];
	struct radeon_voltage *voltage = &ps->clock_info[req_cm_idx].voltage;

	if (voltage->type == VOLTAGE_SW) {
		/* 0xff0x are flags rather than an actual voltage */
		if ((voltage->voltage & 0xff00) == 0xff00)
			return;
		if (voltage->voltage && (voltage->voltage != rdev->pm.current_vddc)) {
			radeon_atom_set_voltage(rdev, voltage->voltage, SET_VOLTAGE_TYPE_ASIC_VDDC);
			rdev->pm.current_vddc = voltage->voltage;
			DRM_DEBUG("Setting: vddc: %d\n", voltage->voltage);
		}

		/* starting with BTC, there is one state that is used for both
		 * MH and SH. Difference is that we always use the high clock index for
		 * mclk and vddci.
		 */
		if ((rdev->pm.pm_method == PM_METHOD_PROFILE) &&
		    (rdev->family >= CHIP_BARTS) &&
		    rdev->pm.active_crtc_count &&
		    ((rdev->pm.profile_index == PM_PROFILE_MID_MH_IDX) ||
		     (rdev->pm.profile_index == PM_PROFILE_LOW_MH_IDX)))
			voltage = &rdev->pm.power_state[req_ps_idx].
				clock_info[rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_cm_idx].voltage;

		/* 0xff0x are flags rather than an actual voltage */
		if ((voltage->vddci & 0xff00) == 0xff00)
			return;
		if (voltage->vddci && (voltage->vddci != rdev->pm.current_vddci)) {
			radeon_atom_set_voltage(rdev, voltage->vddci, SET_VOLTAGE_TYPE_ASIC_VDDCI);
			rdev->pm.current_vddci = voltage->vddci;
			DRM_DEBUG("Setting: vddci: %d\n", voltage->vddci);
		}
	}
}
1659
1660 /**
1661 * evergreen_pm_prepare - pre-power state change callback.
1662 *
1663 * @rdev: radeon_device pointer
1664 *
1665 * Prepare for a power state change (evergreen+).
1666 */
1667 void evergreen_pm_prepare(struct radeon_device *rdev)
1668 {
1669 struct drm_device *ddev = rdev->ddev;
1670 struct drm_crtc *crtc;
1671 struct radeon_crtc *radeon_crtc;
1672 u32 tmp;
1673
1674 /* disable any active CRTCs */
1675 list_for_each_entry(crtc, &ddev->mode_config.crtc_list, head) {
1676 radeon_crtc = to_radeon_crtc(crtc);
1677 if (radeon_crtc->enabled) {
1678 tmp = RREG32(EVERGREEN_CRTC_CONTROL + radeon_crtc->crtc_offset);
1679 tmp |= EVERGREEN_CRTC_DISP_READ_REQUEST_DISABLE;
1680 WREG32(EVERGREEN_CRTC_CONTROL + radeon_crtc->crtc_offset, tmp);
1681 }
1682 }
1683 }
1684
1685 /**
1686 * evergreen_pm_finish - post-power state change callback.
1687 *
1688 * @rdev: radeon_device pointer
1689 *
1690 * Clean up after a power state change (evergreen+).
1691 */
1692 void evergreen_pm_finish(struct radeon_device *rdev)
1693 {
1694 struct drm_device *ddev = rdev->ddev;
1695 struct drm_crtc *crtc;
1696 struct radeon_crtc *radeon_crtc;
1697 u32 tmp;
1698
1699 /* enable any active CRTCs */
1700 list_for_each_entry(crtc, &ddev->mode_config.crtc_list, head) {
1701 radeon_crtc = to_radeon_crtc(crtc);
1702 if (radeon_crtc->enabled) {
1703 tmp = RREG32(EVERGREEN_CRTC_CONTROL + radeon_crtc->crtc_offset);
1704 tmp &= ~EVERGREEN_CRTC_DISP_READ_REQUEST_DISABLE;
1705 WREG32(EVERGREEN_CRTC_CONTROL + radeon_crtc->crtc_offset, tmp);
1706 }
1707 }
1708 }
1709
1710 /**
1711 * evergreen_hpd_sense - hpd sense callback.
1712 *
1713 * @rdev: radeon_device pointer
1714 * @hpd: hpd (hotplug detect) pin
1715 *
1716 * Checks if a digital monitor is connected (evergreen+).
1717 * Returns true if connected, false if not connected.
1718 */
1719 bool evergreen_hpd_sense(struct radeon_device *rdev, enum radeon_hpd_id hpd)
1720 {
1721 if (hpd == RADEON_HPD_NONE)
1722 return false;
1723
1724 return !!(RREG32(DC_HPDx_INT_STATUS_REG(hpd)) & DC_HPDx_SENSE);
1725 }
1726
1727 /**
1728 * evergreen_hpd_set_polarity - hpd set polarity callback.
1729 *
1730 * @rdev: radeon_device pointer
1731 * @hpd: hpd (hotplug detect) pin
1732 *
1733 * Set the polarity of the hpd pin (evergreen+).
1734 */
1735 void evergreen_hpd_set_polarity(struct radeon_device *rdev,
1736 enum radeon_hpd_id hpd)
1737 {
1738 bool connected = evergreen_hpd_sense(rdev, hpd);
1739
1740 if (hpd == RADEON_HPD_NONE)
1741 return;
1742
1743 if (connected)
1744 WREG32_AND(DC_HPDx_INT_CONTROL(hpd), ~DC_HPDx_INT_POLARITY);
1745 else
1746 WREG32_OR(DC_HPDx_INT_CONTROL(hpd), DC_HPDx_INT_POLARITY);
1747 }
1748
1749 /**
1750 * evergreen_hpd_init - hpd setup callback.
1751 *
1752 * @rdev: radeon_device pointer
1753 *
1754 * Setup the hpd pins used by the card (evergreen+).
1755 * Enable the pin, set the polarity, and enable the hpd interrupts.
1756 */
1757 void evergreen_hpd_init(struct radeon_device *rdev)
1758 {
1759 struct drm_device *dev = rdev->ddev;
1760 struct drm_connector *connector;
1761 unsigned enabled = 0;
1762 u32 tmp = DC_HPDx_CONNECTION_TIMER(0x9c4) |
1763 DC_HPDx_RX_INT_TIMER(0xfa) | DC_HPDx_EN;
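/* for reference: 0x9c4 = 2500 and 0xfa = 250 decimal;
 * the timer units are hw-specific
 */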
1764
1765 list_for_each_entry(connector, &dev->mode_config.connector_list, head) {
1766 enum radeon_hpd_id hpd =
1767 to_radeon_connector(connector)->hpd.hpd;
1768
1769 if (connector->connector_type == DRM_MODE_CONNECTOR_eDP ||
1770 connector->connector_type == DRM_MODE_CONNECTOR_LVDS) {
1771 /* don't try to enable hpd on eDP or LVDS to avoid breaking the
1772 * aux dp channel on imac and to help (but not completely fix)
1773 * https://bugzilla.redhat.com/show_bug.cgi?id=726143
1774 * also avoid interrupt storms during dpms.
1775 */
1776 continue;
1777 }
1778
1779 if (hpd == RADEON_HPD_NONE)
1780 continue;
1781
1782 WREG32(DC_HPDx_CONTROL(hpd), tmp);
1783 enabled |= 1 << hpd;
1784
1785 radeon_hpd_set_polarity(rdev, hpd);
1786 }
1787 radeon_irq_kms_enable_hpd(rdev, enabled);
1788 }
1789
1790 /**
1791 * evergreen_hpd_fini - hpd tear down callback.
1792 *
1793 * @rdev: radeon_device pointer
1794 *
1795 * Tear down the hpd pins used by the card (evergreen+).
1796 * Disable the hpd interrupts.
1797 */
1798 void evergreen_hpd_fini(struct radeon_device *rdev)
1799 {
1800 struct drm_device *dev = rdev->ddev;
1801 struct drm_connector *connector;
1802 unsigned disabled = 0;
1803
1804 list_for_each_entry(connector, &dev->mode_config.connector_list, head) {
1805 enum radeon_hpd_id hpd =
1806 to_radeon_connector(connector)->hpd.hpd;
1807
1808 if (hpd == RADEON_HPD_NONE)
1809 continue;
1810
1811 WREG32(DC_HPDx_CONTROL(hpd), 0);
1812 disabled |= 1 << hpd;
1813 }
1814 radeon_irq_kms_disable_hpd(rdev, disabled);
1815 }
1816
1817 /* watermark setup */
1818
1819 static u32 evergreen_line_buffer_adjust(struct radeon_device *rdev,
1820 struct radeon_crtc *radeon_crtc,
1821 struct drm_display_mode *mode,
1822 struct drm_display_mode *other_mode)
1823 {
1824 u32 tmp, buffer_alloc, i;
1825 u32 pipe_offset = radeon_crtc->crtc_id * 0x20;
1826 /*
1827 * Line Buffer Setup
1828 * There are 3 line buffers, each one shared by 2 display controllers.
1829 * DC_LB_MEMORY_SPLIT controls how that line buffer is shared between
1830 * the display controllers. The partitioning is done via one of four
1831 * preset allocations specified in bits 2:0:
1832 * first display controller
1833 * 0 - first half of lb (3840 * 2)
1834 * 1 - first 3/4 of lb (5760 * 2)
1835 * 2 - whole lb (7680 * 2), other crtc must be disabled
1836 * 3 - first 1/4 of lb (1920 * 2)
1837 * second display controller
1838 * 4 - second half of lb (3840 * 2)
1839 * 5 - second 3/4 of lb (5760 * 2)
1840 * 6 - whole lb (7680 * 2), other crtc must be disabled
1841 * 7 - last 1/4 of lb (1920 * 2)
1842 */
1843 /* this can get tricky if we have two large displays on a paired group
1844 * of crtcs. Ideally for multiple large displays we'd assign them to
1845 * non-linked crtcs for maximum line buffer allocation.
1846 */
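/* Illustrative example (DCE4 sizes): if both crtcs of a pair drive
 * displays, each gets allocation 0/4, i.e. half the lb (3840 * 2);
 * if the partner crtc is disabled, the active one takes the whole
 * lb (7680 * 2), matching the tmp/buffer_alloc choices below.
 */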
1847 if (radeon_crtc->base.enabled && mode) {
1848 if (other_mode) {
1849 tmp = 0; /* 1/2 */
1850 buffer_alloc = 1;
1851 } else {
1852 tmp = 2; /* whole */
1853 buffer_alloc = 2;
1854 }
1855 } else {
1856 tmp = 0;
1857 buffer_alloc = 0;
1858 }
1859
1860 /* second controller of the pair uses second half of the lb */
1861 if (radeon_crtc->crtc_id % 2)
1862 tmp += 4;
1863 WREG32(DC_LB_MEMORY_SPLIT + radeon_crtc->crtc_offset, tmp);
1864
1865 if (ASIC_IS_DCE41(rdev) || ASIC_IS_DCE5(rdev)) {
1866 WREG32(PIPE0_DMIF_BUFFER_CONTROL + pipe_offset,
1867 DMIF_BUFFERS_ALLOCATED(buffer_alloc));
1868 for (i = 0; i < rdev->usec_timeout; i++) {
1869 if (RREG32(PIPE0_DMIF_BUFFER_CONTROL + pipe_offset) &
1870 DMIF_BUFFERS_ALLOCATED_COMPLETED)
1871 break;
1872 udelay(1);
1873 }
1874 }
1875
1876 if (radeon_crtc->base.enabled && mode) {
1877 switch (tmp) {
1878 case 0:
1879 case 4:
1880 default:
1881 if (ASIC_IS_DCE5(rdev))
1882 return 4096 * 2;
1883 else
1884 return 3840 * 2;
1885 case 1:
1886 case 5:
1887 if (ASIC_IS_DCE5(rdev))
1888 return 6144 * 2;
1889 else
1890 return 5760 * 2;
1891 case 2:
1892 case 6:
1893 if (ASIC_IS_DCE5(rdev))
1894 return 8192 * 2;
1895 else
1896 return 7680 * 2;
1897 case 3:
1898 case 7:
1899 if (ASIC_IS_DCE5(rdev))
1900 return 2048 * 2;
1901 else
1902 return 1920 * 2;
1903 }
1904 }
1905
1906 /* controller not enabled, so no lb used */
1907 return 0;
1908 }
1909
1910 u32 evergreen_get_number_of_dram_channels(struct radeon_device *rdev)
1911 {
1912 u32 tmp = RREG32(MC_SHARED_CHMAP);
1913
1914 switch ((tmp & NOOFCHAN_MASK) >> NOOFCHAN_SHIFT) {
1915 case 0:
1916 default:
1917 return 1;
1918 case 1:
1919 return 2;
1920 case 2:
1921 return 4;
1922 case 3:
1923 return 8;
1924 }
1925 }
1926
1927 struct evergreen_wm_params {
1928 u32 dram_channels; /* number of dram channels */
1929 u32 yclk; /* bandwidth per dram data pin in kHz */
1930 u32 sclk; /* engine clock in kHz */
1931 u32 disp_clk; /* display clock in kHz */
1932 u32 src_width; /* viewport width */
1933 u32 active_time; /* active display time in ns */
1934 u32 blank_time; /* blank time in ns */
1935 bool interlaced; /* mode is interlaced */
1936 fixed20_12 vsc; /* vertical scale ratio */
1937 u32 num_heads; /* number of active crtcs */
1938 u32 bytes_per_pixel; /* bytes per pixel display + overlay */
1939 u32 lb_size; /* line buffer allocated to pipe */
1940 u32 vtaps; /* vertical scaler taps */
1941 };
1942
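/* Rough formula implemented below (illustrative numbers):
 * dram bw [MB/s] = yclk[MHz] * dram_channels * 4 bytes * 0.7 efficiency,
 * e.g. a 1 GHz yclk on 2 channels gives 1000 * 8 * 0.7 = 5600 MB/s.
 */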
1943 static u32 evergreen_dram_bandwidth(struct evergreen_wm_params *wm)
1944 {
1945 /* Calculate DRAM Bandwidth and the part allocated to display. */
1946 fixed20_12 dram_efficiency; /* 0.7 */
1947 fixed20_12 yclk, dram_channels, bandwidth;
1948 fixed20_12 a;
1949
1950 a.full = dfixed_const(1000);
1951 yclk.full = dfixed_const(wm->yclk);
1952 yclk.full = dfixed_div(yclk, a);
1953 dram_channels.full = dfixed_const(wm->dram_channels * 4);
1954 a.full = dfixed_const(10);
1955 dram_efficiency.full = dfixed_const(7);
1956 dram_efficiency.full = dfixed_div(dram_efficiency, a);
1957 bandwidth.full = dfixed_mul(dram_channels, yclk);
1958 bandwidth.full = dfixed_mul(bandwidth, dram_efficiency);
1959
1960 return dfixed_trunc(bandwidth);
1961 }
1962
1963 static u32 evergreen_dram_bandwidth_for_display(struct evergreen_wm_params *wm)
1964 {
1965 /* Calculate DRAM Bandwidth and the part allocated to display. */
1966 fixed20_12 disp_dram_allocation; /* 0.3 to 0.7 */
1967 fixed20_12 yclk, dram_channels, bandwidth;
1968 fixed20_12 a;
1969
1970 a.full = dfixed_const(1000);
1971 yclk.full = dfixed_const(wm->yclk);
1972 yclk.full = dfixed_div(yclk, a);
1973 dram_channels.full = dfixed_const(wm->dram_channels * 4);
1974 a.full = dfixed_const(10);
1975 disp_dram_allocation.full = dfixed_const(3); /* XXX worst-case value 0.3 */
1976 disp_dram_allocation.full = dfixed_div(disp_dram_allocation, a);
1977 bandwidth.full = dfixed_mul(dram_channels, yclk);
1978 bandwidth.full = dfixed_mul(bandwidth, disp_dram_allocation);
1979
1980 return dfixed_trunc(bandwidth);
1981 }
1982
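/* Data return bw [MB/s] = sclk[MHz] * 32 bytes * 0.8 efficiency,
 * e.g. a 700 MHz sclk gives 700 * 32 * 0.8 = 17920 MB/s (illustrative).
 */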
1983 static u32 evergreen_data_return_bandwidth(struct evergreen_wm_params *wm)
1984 {
1985 /* Calculate the display Data return Bandwidth */
1986 fixed20_12 return_efficiency; /* 0.8 */
1987 fixed20_12 sclk, bandwidth;
1988 fixed20_12 a;
1989
1990 a.full = dfixed_const(1000);
1991 sclk.full = dfixed_const(wm->sclk);
1992 sclk.full = dfixed_div(sclk, a);
1993 a.full = dfixed_const(10);
1994 return_efficiency.full = dfixed_const(8);
1995 return_efficiency.full = dfixed_div(return_efficiency, a);
1996 a.full = dfixed_const(32);
1997 bandwidth.full = dfixed_mul(a, sclk);
1998 bandwidth.full = dfixed_mul(bandwidth, return_efficiency);
1999
2000 return dfixed_trunc(bandwidth);
2001 }
2002
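/* Same shape as the data return path:
 * dmif request bw [MB/s] = disp_clk[MHz] * 32 bytes * 0.8 efficiency.
 */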
2003 static u32 evergreen_dmif_request_bandwidth(struct evergreen_wm_params *wm)
2004 {
2005 /* Calculate the DMIF Request Bandwidth */
2006 fixed20_12 disp_clk_request_efficiency; /* 0.8 */
2007 fixed20_12 disp_clk, bandwidth;
2008 fixed20_12 a;
2009
2010 a.full = dfixed_const(1000);
2011 disp_clk.full = dfixed_const(wm->disp_clk);
2012 disp_clk.full = dfixed_div(disp_clk, a);
2013 a.full = dfixed_const(10);
2014 disp_clk_request_efficiency.full = dfixed_const(8);
2015 disp_clk_request_efficiency.full = dfixed_div(disp_clk_request_efficiency, a);
2016 a.full = dfixed_const(32);
2017 bandwidth.full = dfixed_mul(a, disp_clk);
2018 bandwidth.full = dfixed_mul(bandwidth, disp_clk_request_efficiency);
2019
2020 return dfixed_trunc(bandwidth);
2021 }
2022
2023 static u32 evergreen_available_bandwidth(struct evergreen_wm_params *wm)
2024 {
2025 /* Calculate the available bandwidth. The display can use this temporarily, but not on average. */
2026 u32 dram_bandwidth = evergreen_dram_bandwidth(wm);
2027 u32 data_return_bandwidth = evergreen_data_return_bandwidth(wm);
2028 u32 dmif_req_bandwidth = evergreen_dmif_request_bandwidth(wm);
2029
2030 return min(dram_bandwidth, min(data_return_bandwidth, dmif_req_bandwidth));
2031 }
2032
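/* Average bw [MB/s] = src_width * bytes_per_pixel * vsc / line_time[us],
 * e.g. a 1080p head with a 14.8 us line time needs about
 * 1920 * 4 / 14.8 = 519 MB/s (illustrative).
 */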
2033 static u32 evergreen_average_bandwidth(struct evergreen_wm_params *wm)
2034 {
2035 /* Calculate the display mode Average Bandwidth
2036 * DisplayMode should contain the source and destination dimensions,
2037 * timing, etc.
2038 */
2039 fixed20_12 bpp;
2040 fixed20_12 line_time;
2041 fixed20_12 src_width;
2042 fixed20_12 bandwidth;
2043 fixed20_12 a;
2044
2045 a.full = dfixed_const(1000);
2046 line_time.full = dfixed_const(wm->active_time + wm->blank_time);
2047 line_time.full = dfixed_div(line_time, a);
2048 bpp.full = dfixed_const(wm->bytes_per_pixel);
2049 src_width.full = dfixed_const(wm->src_width);
2050 bandwidth.full = dfixed_mul(src_width, bpp);
2051 bandwidth.full = dfixed_mul(bandwidth, wm->vsc);
2052 bandwidth.full = dfixed_div(bandwidth, line_time);
2053
2054 return dfixed_trunc(bandwidth);
2055 }
2056
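/* The watermark is the total latency the lb must cover: mc latency,
 * data return time for the other heads and dc pipe latency, extended
 * by any shortfall in line fill time. Illustrative numbers: at
 * 5600 MB/s available, a worst-case chunk returns in
 * 512 * 8 * 1000 / 5600 = 731 ns.
 */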
2057 static u32 evergreen_latency_watermark(struct evergreen_wm_params *wm)
2058 {
2059 /* First calculate the latency in ns */
2060 u32 mc_latency = 2000; /* 2000 ns. */
2061 u32 available_bandwidth = evergreen_available_bandwidth(wm);
2062 u32 worst_chunk_return_time = (512 * 8 * 1000) / available_bandwidth;
2063 u32 cursor_line_pair_return_time = (128 * 4 * 1000) / available_bandwidth;
2064 u32 dc_latency = 40000000 / wm->disp_clk; /* dc pipe latency */
2065 u32 other_heads_data_return_time = ((wm->num_heads + 1) * worst_chunk_return_time) +
2066 (wm->num_heads * cursor_line_pair_return_time);
2067 u32 latency = mc_latency + other_heads_data_return_time + dc_latency;
2068 u32 max_src_lines_per_dst_line, lb_fill_bw, line_fill_time;
2069 fixed20_12 a, b, c;
2070
2071 if (wm->num_heads == 0)
2072 return 0;
2073
2074 a.full = dfixed_const(2);
2075 b.full = dfixed_const(1);
2076 if ((wm->vsc.full > a.full) ||
2077 ((wm->vsc.full > b.full) && (wm->vtaps >= 3)) ||
2078 (wm->vtaps >= 5) ||
2079 ((wm->vsc.full >= a.full) && wm->interlaced))
2080 max_src_lines_per_dst_line = 4;
2081 else
2082 max_src_lines_per_dst_line = 2;
2083
2084 a.full = dfixed_const(available_bandwidth);
2085 b.full = dfixed_const(wm->num_heads);
2086 a.full = dfixed_div(a, b);
2087
2088 lb_fill_bw = min(dfixed_trunc(a), wm->disp_clk * wm->bytes_per_pixel / 1000);
2089
2090 a.full = dfixed_const(max_src_lines_per_dst_line * wm->src_width * wm->bytes_per_pixel);
2091 b.full = dfixed_const(1000);
2092 c.full = dfixed_const(lb_fill_bw);
2093 b.full = dfixed_div(c, b);
2094 a.full = dfixed_div(a, b);
2095 line_fill_time = dfixed_trunc(a);
2096
2097 if (line_fill_time < wm->active_time)
2098 return latency;
2099 else
2100 return latency + (line_fill_time - wm->active_time);
2101
2102 }
2103
2104 static bool evergreen_average_bandwidth_vs_dram_bandwidth_for_display(struct evergreen_wm_params *wm)
2105 {
2106 if (evergreen_average_bandwidth(wm) <=
2107 (evergreen_dram_bandwidth_for_display(wm) / wm->num_heads))
2108 return true;
2109 else
2110 return false;
2111 }
2112
2113 static bool evergreen_average_bandwidth_vs_available_bandwidth(struct evergreen_wm_params *wm)
2114 {
2115 if (evergreen_average_bandwidth(wm) <=
2116 (evergreen_available_bandwidth(wm) / wm->num_heads))
2117 return true;
2118 else
2119 return false;
2120 }
2121
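/* Heuristic: the lb holds lb_size / src_width lines; downscaling or a
 * small number of lb partitions tolerates only one line of latency,
 * otherwise two. That many line times plus the blank time must cover
 * the latency watermark computed above.
 */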
2122 static bool evergreen_check_latency_hiding(struct evergreen_wm_params *wm)
2123 {
2124 u32 lb_partitions = wm->lb_size / wm->src_width;
2125 u32 line_time = wm->active_time + wm->blank_time;
2126 u32 latency_tolerant_lines;
2127 u32 latency_hiding;
2128 fixed20_12 a;
2129
2130 a.full = dfixed_const(1);
2131 if (wm->vsc.full > a.full)
2132 latency_tolerant_lines = 1;
2133 else {
2134 if (lb_partitions <= (wm->vtaps + 1))
2135 latency_tolerant_lines = 1;
2136 else
2137 latency_tolerant_lines = 2;
2138 }
2139
2140 latency_hiding = (latency_tolerant_lines * line_time + wm->blank_time);
2141
2142 if (evergreen_latency_watermark(wm) <= latency_hiding)
2143 return true;
2144 else
2145 return false;
2146 }
2147
2148 static void evergreen_program_watermarks(struct radeon_device *rdev,
2149 struct radeon_crtc *radeon_crtc,
2150 u32 lb_size, u32 num_heads)
2151 {
2152 struct drm_display_mode *mode = &radeon_crtc->base.mode;
2153 struct evergreen_wm_params wm_low, wm_high;
2154 u32 dram_channels;
2155 u32 active_time;
2156 u32 line_time = 0;
2157 u32 latency_watermark_a = 0, latency_watermark_b = 0;
2158 u32 priority_a_mark = 0, priority_b_mark = 0;
2159 u32 priority_a_cnt = PRIORITY_OFF;
2160 u32 priority_b_cnt = PRIORITY_OFF;
2161 u32 pipe_offset = radeon_crtc->crtc_id * 16;
2162 u32 tmp, arb_control3;
2163 fixed20_12 a, b, c;
2164
2165 if (radeon_crtc->base.enabled && num_heads && mode) {
2166 active_time = (u32) div_u64((u64)mode->crtc_hdisplay * 1000000,
2167 (u32)mode->clock);
2168 line_time = (u32) div_u64((u64)mode->crtc_htotal * 1000000,
2169 (u32)mode->clock);
2170 line_time = min(line_time, (u32)65535);
2171 priority_a_cnt = 0;
2172 priority_b_cnt = 0;
2173 dram_channels = evergreen_get_number_of_dram_channels(rdev);
2174
2175 /* watermark for high clocks */
2176 if ((rdev->pm.pm_method == PM_METHOD_DPM) && rdev->pm.dpm_enabled) {
2177 wm_high.yclk =
2178 radeon_dpm_get_mclk(rdev, false) * 10;
2179 wm_high.sclk =
2180 radeon_dpm_get_sclk(rdev, false) * 10;
2181 } else {
2182 wm_high.yclk = rdev->pm.current_mclk * 10;
2183 wm_high.sclk = rdev->pm.current_sclk * 10;
2184 }
2185
2186 wm_high.disp_clk = mode->clock;
2187 wm_high.src_width = mode->crtc_hdisplay;
2188 wm_high.active_time = active_time;
2189 wm_high.blank_time = line_time - wm_high.active_time;
2190 wm_high.interlaced = false;
2191 if (mode->flags & DRM_MODE_FLAG_INTERLACE)
2192 wm_high.interlaced = true;
2193 wm_high.vsc = radeon_crtc->vsc;
2194 wm_high.vtaps = 1;
2195 if (radeon_crtc->rmx_type != RMX_OFF)
2196 wm_high.vtaps = 2;
2197 wm_high.bytes_per_pixel = 4; /* XXX: get this from fb config */
2198 wm_high.lb_size = lb_size;
2199 wm_high.dram_channels = dram_channels;
2200 wm_high.num_heads = num_heads;
2201
2202 /* watermark for low clocks */
2203 if ((rdev->pm.pm_method == PM_METHOD_DPM) && rdev->pm.dpm_enabled) {
2204 wm_low.yclk =
2205 radeon_dpm_get_mclk(rdev, true) * 10;
2206 wm_low.sclk =
2207 radeon_dpm_get_sclk(rdev, true) * 10;
2208 } else {
2209 wm_low.yclk = rdev->pm.current_mclk * 10;
2210 wm_low.sclk = rdev->pm.current_sclk * 10;
2211 }
2212
2213 wm_low.disp_clk = mode->clock;
2214 wm_low.src_width = mode->crtc_hdisplay;
2215 wm_low.active_time = active_time;
2216 wm_low.blank_time = line_time - wm_low.active_time;
2217 wm_low.interlaced = false;
2218 if (mode->flags & DRM_MODE_FLAG_INTERLACE)
2219 wm_low.interlaced = true;
2220 wm_low.vsc = radeon_crtc->vsc;
2221 wm_low.vtaps = 1;
2222 if (radeon_crtc->rmx_type != RMX_OFF)
2223 wm_low.vtaps = 2;
2224 wm_low.bytes_per_pixel = 4; /* XXX: get this from fb config */
2225 wm_low.lb_size = lb_size;
2226 wm_low.dram_channels = dram_channels;
2227 wm_low.num_heads = num_heads;
2228
2229 /* set for high clocks */
2230 latency_watermark_a = min(evergreen_latency_watermark(&wm_high), (u32)65535);
2231 /* set for low clocks */
2232 latency_watermark_b = min(evergreen_latency_watermark(&wm_low), (u32)65535);
2233
2234 /* possibly force display priority to high */
2235 /* should really do this at mode validation time... */
2236 if (!evergreen_average_bandwidth_vs_dram_bandwidth_for_display(&wm_high) ||
2237 !evergreen_average_bandwidth_vs_available_bandwidth(&wm_high) ||
2238 !evergreen_check_latency_hiding(&wm_high) ||
2239 (rdev->disp_priority == 2)) {
2240 DRM_DEBUG_KMS("force priority a to high\n");
2241 priority_a_cnt |= PRIORITY_ALWAYS_ON;
2242 }
2243 if (!evergreen_average_bandwidth_vs_dram_bandwidth_for_display(&wm_low) ||
2244 !evergreen_average_bandwidth_vs_available_bandwidth(&wm_low) ||
2245 !evergreen_check_latency_hiding(&wm_low) ||
2246 (rdev->disp_priority == 2)) {
2247 DRM_DEBUG_KMS("force priority b to high\n");
2248 priority_b_cnt |= PRIORITY_ALWAYS_ON;
2249 }
2250
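/* The priority mark is the latency watermark converted to pixels:
 * latency[ns] * pixel clock[MHz] / 1000 is the number of pixels
 * scanned out during the latency, scaled by hsc and expressed in
 * units of 16 pixels.
 */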
2251 a.full = dfixed_const(1000);
2252 b.full = dfixed_const(mode->clock);
2253 b.full = dfixed_div(b, a);
2254 c.full = dfixed_const(latency_watermark_a);
2255 c.full = dfixed_mul(c, b);
2256 c.full = dfixed_mul(c, radeon_crtc->hsc);
2257 c.full = dfixed_div(c, a);
2258 a.full = dfixed_const(16);
2259 c.full = dfixed_div(c, a);
2260 priority_a_mark = dfixed_trunc(c);
2261 priority_a_cnt |= priority_a_mark & PRIORITY_MARK_MASK;
2262
2263 a.full = dfixed_const(1000);
2264 b.full = dfixed_const(mode->clock);
2265 b.full = dfixed_div(b, a);
2266 c.full = dfixed_const(latency_watermark_b);
2267 c.full = dfixed_mul(c, b);
2268 c.full = dfixed_mul(c, radeon_crtc->hsc);
2269 c.full = dfixed_div(c, a);
2270 a.full = dfixed_const(16);
2271 c.full = dfixed_div(c, a);
2272 priority_b_mark = dfixed_trunc(c);
2273 priority_b_cnt |= priority_b_mark & PRIORITY_MARK_MASK;
2274
2275 /* Save number of lines the linebuffer leads before the scanout */
2276 radeon_crtc->lb_vblank_lead_lines = DIV_ROUND_UP(lb_size, mode->crtc_hdisplay);
2277 }
2278
2279 /* select wm A */
2280 arb_control3 = RREG32(PIPE0_ARBITRATION_CONTROL3 + pipe_offset);
2281 tmp = arb_control3;
2282 tmp &= ~LATENCY_WATERMARK_MASK(3);
2283 tmp |= LATENCY_WATERMARK_MASK(1);
2284 WREG32(PIPE0_ARBITRATION_CONTROL3 + pipe_offset, tmp);
2285 WREG32(PIPE0_LATENCY_CONTROL + pipe_offset,
2286 (LATENCY_LOW_WATERMARK(latency_watermark_a) |
2287 LATENCY_HIGH_WATERMARK(line_time)));
2288 /* select wm B */
2289 tmp = RREG32(PIPE0_ARBITRATION_CONTROL3 + pipe_offset);
2290 tmp &= ~LATENCY_WATERMARK_MASK(3);
2291 tmp |= LATENCY_WATERMARK_MASK(2);
2292 WREG32(PIPE0_ARBITRATION_CONTROL3 + pipe_offset, tmp);
2293 WREG32(PIPE0_LATENCY_CONTROL + pipe_offset,
2294 (LATENCY_LOW_WATERMARK(latency_watermark_b) |
2295 LATENCY_HIGH_WATERMARK(line_time)));
2296 /* restore original selection */
2297 WREG32(PIPE0_ARBITRATION_CONTROL3 + pipe_offset, arb_control3);
2298
2299 /* write the priority marks */
2300 WREG32(PRIORITY_A_CNT + radeon_crtc->crtc_offset, priority_a_cnt);
2301 WREG32(PRIORITY_B_CNT + radeon_crtc->crtc_offset, priority_b_cnt);
2302
2303 /* save values for DPM */
2304 radeon_crtc->line_time = line_time;
2305 radeon_crtc->wm_high = latency_watermark_a;
2306 radeon_crtc->wm_low = latency_watermark_b;
2307 }
2308
2309 /**
2310 * evergreen_bandwidth_update - update display watermarks callback.
2311 *
2312 * @rdev: radeon_device pointer
2313 *
2314 * Update the display watermarks based on the requested mode(s)
2315 * (evergreen+).
2316 */
2317 void evergreen_bandwidth_update(struct radeon_device *rdev)
2318 {
2319 struct drm_display_mode *mode0 = NULL;
2320 struct drm_display_mode *mode1 = NULL;
2321 u32 num_heads = 0, lb_size;
2322 int i;
2323
2324 if (!rdev->mode_info.mode_config_initialized)
2325 return;
2326
2327 radeon_update_display_priority(rdev);
2328
2329 for (i = 0; i < rdev->num_crtc; i++) {
2330 if (rdev->mode_info.crtcs[i]->base.enabled)
2331 num_heads++;
2332 }
2333 for (i = 0; i < rdev->num_crtc; i += 2) {
2334 mode0 = &rdev->mode_info.crtcs[i]->base.mode;
2335 mode1 = &rdev->mode_info.crtcs[i+1]->base.mode;
2336 lb_size = evergreen_line_buffer_adjust(rdev, rdev->mode_info.crtcs[i], mode0, mode1);
2337 evergreen_program_watermarks(rdev, rdev->mode_info.crtcs[i], lb_size, num_heads);
2338 lb_size = evergreen_line_buffer_adjust(rdev, rdev->mode_info.crtcs[i+1], mode1, mode0);
2339 evergreen_program_watermarks(rdev, rdev->mode_info.crtcs[i+1], lb_size, num_heads);
2340 }
2341 }
2342
2343 /**
2344 * evergreen_mc_wait_for_idle - wait for MC idle callback.
2345 *
2346 * @rdev: radeon_device pointer
2347 *
2348 * Wait for the MC (memory controller) to be idle.
2349 * (evergreen+).
2350 * Returns 0 if the MC is idle, -1 if not.
2351 */
2352 int evergreen_mc_wait_for_idle(struct radeon_device *rdev)
2353 {
2354 unsigned i;
2355 u32 tmp;
2356
2357 for (i = 0; i < rdev->usec_timeout; i++) {
2358 /* check the MC busy bits in SRBM_STATUS */
2359 tmp = RREG32(SRBM_STATUS) & 0x1F00;
2360 if (!tmp)
2361 return 0;
2362 udelay(1);
2363 }
2364 return -1;
2365 }
2366
2367 /*
2368 * GART
2369 */
2370 void evergreen_pcie_gart_tlb_flush(struct radeon_device *rdev)
2371 {
2372 unsigned i;
2373 u32 tmp;
2374
2375 WREG32(HDP_MEM_COHERENCY_FLUSH_CNTL, 0x1);
2376
2377 WREG32(VM_CONTEXT0_REQUEST_RESPONSE, REQUEST_TYPE(1));
2378 for (i = 0; i < rdev->usec_timeout; i++) {
2379 /* read the VM context0 request response */
2380 tmp = RREG32(VM_CONTEXT0_REQUEST_RESPONSE);
2381 tmp = (tmp & RESPONSE_TYPE_MASK) >> RESPONSE_TYPE_SHIFT;
2382 if (tmp == 2) {
2383 pr_warn("[drm] r600 flush TLB failed\n");
2384 return;
2385 }
2386 if (tmp) {
2387 return;
2388 }
2389 udelay(1);
2390 }
2391 }
2392
2393 static int evergreen_pcie_gart_enable(struct radeon_device *rdev)
2394 {
2395 u32 tmp;
2396 int r;
2397
2398 if (rdev->gart.robj == NULL) {
2399 dev_err(rdev->dev, "No VRAM object for PCIE GART.\n");
2400 return -EINVAL;
2401 }
2402 r = radeon_gart_table_vram_pin(rdev);
2403 if (r)
2404 return r;
2405 /* Setup L2 cache */
2406 WREG32(VM_L2_CNTL, ENABLE_L2_CACHE | ENABLE_L2_FRAGMENT_PROCESSING |
2407 ENABLE_L2_PTE_CACHE_LRU_UPDATE_BY_WRITE |
2408 EFFECTIVE_L2_QUEUE_SIZE(7));
2409 WREG32(VM_L2_CNTL2, 0);
2410 WREG32(VM_L2_CNTL3, BANK_SELECT(0) | CACHE_UPDATE_MODE(2));
2411 /* Setup TLB control */
2412 tmp = ENABLE_L1_TLB | ENABLE_L1_FRAGMENT_PROCESSING |
2413 SYSTEM_ACCESS_MODE_NOT_IN_SYS |
2414 SYSTEM_APERTURE_UNMAPPED_ACCESS_PASS_THRU |
2415 EFFECTIVE_L1_TLB_SIZE(5) | EFFECTIVE_L1_QUEUE_SIZE(5);
2416 if (rdev->flags & RADEON_IS_IGP) {
2417 WREG32(FUS_MC_VM_MD_L1_TLB0_CNTL, tmp);
2418 WREG32(FUS_MC_VM_MD_L1_TLB1_CNTL, tmp);
2419 WREG32(FUS_MC_VM_MD_L1_TLB2_CNTL, tmp);
2420 } else {
2421 WREG32(MC_VM_MD_L1_TLB0_CNTL, tmp);
2422 WREG32(MC_VM_MD_L1_TLB1_CNTL, tmp);
2423 WREG32(MC_VM_MD_L1_TLB2_CNTL, tmp);
2424 if ((rdev->family == CHIP_JUNIPER) ||
2425 (rdev->family == CHIP_CYPRESS) ||
2426 (rdev->family == CHIP_HEMLOCK) ||
2427 (rdev->family == CHIP_BARTS))
2428 WREG32(MC_VM_MD_L1_TLB3_CNTL, tmp);
2429 }
2430 WREG32(MC_VM_MB_L1_TLB0_CNTL, tmp);
2431 WREG32(MC_VM_MB_L1_TLB1_CNTL, tmp);
2432 WREG32(MC_VM_MB_L1_TLB2_CNTL, tmp);
2433 WREG32(MC_VM_MB_L1_TLB3_CNTL, tmp);
2434 WREG32(VM_CONTEXT0_PAGE_TABLE_START_ADDR, rdev->mc.gtt_start >> 12);
2435 WREG32(VM_CONTEXT0_PAGE_TABLE_END_ADDR, rdev->mc.gtt_end >> 12);
2436 WREG32(VM_CONTEXT0_PAGE_TABLE_BASE_ADDR, rdev->gart.table_addr >> 12);
2437 WREG32(VM_CONTEXT0_CNTL, ENABLE_CONTEXT | PAGE_TABLE_DEPTH(0) |
2438 RANGE_PROTECTION_FAULT_ENABLE_DEFAULT);
2439 WREG32(VM_CONTEXT0_PROTECTION_FAULT_DEFAULT_ADDR,
2440 (u32)(rdev->dummy_page.addr >> 12));
2441 WREG32(VM_CONTEXT1_CNTL, 0);
2442
2443 evergreen_pcie_gart_tlb_flush(rdev);
2444 DRM_INFO("PCIE GART of %uM enabled (table at 0x%016llX).\n",
2445 (unsigned)(rdev->mc.gtt_size >> 20),
2446 (unsigned long long)rdev->gart.table_addr);
2447 rdev->gart.ready = true;
2448 return 0;
2449 }
2450
2451 static void evergreen_pcie_gart_disable(struct radeon_device *rdev)
2452 {
2453 u32 tmp;
2454
2455 /* Disable all tables */
2456 WREG32(VM_CONTEXT0_CNTL, 0);
2457 WREG32(VM_CONTEXT1_CNTL, 0);
2458
2459 /* Setup L2 cache */
2460 WREG32(VM_L2_CNTL, ENABLE_L2_FRAGMENT_PROCESSING |
2461 EFFECTIVE_L2_QUEUE_SIZE(7));
2462 WREG32(VM_L2_CNTL2, 0);
2463 WREG32(VM_L2_CNTL3, BANK_SELECT(0) | CACHE_UPDATE_MODE(2));
2464 /* Setup TLB control */
2465 tmp = EFFECTIVE_L1_TLB_SIZE(5) | EFFECTIVE_L1_QUEUE_SIZE(5);
2466 WREG32(MC_VM_MD_L1_TLB0_CNTL, tmp);
2467 WREG32(MC_VM_MD_L1_TLB1_CNTL, tmp);
2468 WREG32(MC_VM_MD_L1_TLB2_CNTL, tmp);
2469 WREG32(MC_VM_MB_L1_TLB0_CNTL, tmp);
2470 WREG32(MC_VM_MB_L1_TLB1_CNTL, tmp);
2471 WREG32(MC_VM_MB_L1_TLB2_CNTL, tmp);
2472 WREG32(MC_VM_MB_L1_TLB3_CNTL, tmp);
2473 radeon_gart_table_vram_unpin(rdev);
2474 }
2475
2476 static void evergreen_pcie_gart_fini(struct radeon_device *rdev)
2477 {
2478 evergreen_pcie_gart_disable(rdev);
2479 radeon_gart_table_vram_free(rdev);
2480 radeon_gart_fini(rdev);
2481 }
2482
2483
2484 static void evergreen_agp_enable(struct radeon_device *rdev)
2485 {
2486 u32 tmp;
2487
2488 /* Setup L2 cache */
2489 WREG32(VM_L2_CNTL, ENABLE_L2_CACHE | ENABLE_L2_FRAGMENT_PROCESSING |
2490 ENABLE_L2_PTE_CACHE_LRU_UPDATE_BY_WRITE |
2491 EFFECTIVE_L2_QUEUE_SIZE(7));
2492 WREG32(VM_L2_CNTL2, 0);
2493 WREG32(VM_L2_CNTL3, BANK_SELECT(0) | CACHE_UPDATE_MODE(2));
2494 /* Setup TLB control */
2495 tmp = ENABLE_L1_TLB | ENABLE_L1_FRAGMENT_PROCESSING |
2496 SYSTEM_ACCESS_MODE_NOT_IN_SYS |
2497 SYSTEM_APERTURE_UNMAPPED_ACCESS_PASS_THRU |
2498 EFFECTIVE_L1_TLB_SIZE(5) | EFFECTIVE_L1_QUEUE_SIZE(5);
2499 WREG32(MC_VM_MD_L1_TLB0_CNTL, tmp);
2500 WREG32(MC_VM_MD_L1_TLB1_CNTL, tmp);
2501 WREG32(MC_VM_MD_L1_TLB2_CNTL, tmp);
2502 WREG32(MC_VM_MB_L1_TLB0_CNTL, tmp);
2503 WREG32(MC_VM_MB_L1_TLB1_CNTL, tmp);
2504 WREG32(MC_VM_MB_L1_TLB2_CNTL, tmp);
2505 WREG32(MC_VM_MB_L1_TLB3_CNTL, tmp);
2506 WREG32(VM_CONTEXT0_CNTL, 0);
2507 WREG32(VM_CONTEXT1_CNTL, 0);
2508 }
2509
2510 static const unsigned ni_dig_offsets[] =
2511 {
2512 NI_DIG0_REGISTER_OFFSET,
2513 NI_DIG1_REGISTER_OFFSET,
2514 NI_DIG2_REGISTER_OFFSET,
2515 NI_DIG3_REGISTER_OFFSET,
2516 NI_DIG4_REGISTER_OFFSET,
2517 NI_DIG5_REGISTER_OFFSET
2518 };
2519
2520 static const unsigned ni_tx_offsets[] =
2521 {
2522 NI_DCIO_UNIPHY0_UNIPHY_TX_CONTROL1,
2523 NI_DCIO_UNIPHY1_UNIPHY_TX_CONTROL1,
2524 NI_DCIO_UNIPHY2_UNIPHY_TX_CONTROL1,
2525 NI_DCIO_UNIPHY3_UNIPHY_TX_CONTROL1,
2526 NI_DCIO_UNIPHY4_UNIPHY_TX_CONTROL1,
2527 NI_DCIO_UNIPHY5_UNIPHY_TX_CONTROL1
2528 };
2529
2530 static const unsigned evergreen_dp_offsets[] =
2531 {
2532 EVERGREEN_DP0_REGISTER_OFFSET,
2533 EVERGREEN_DP1_REGISTER_OFFSET,
2534 EVERGREEN_DP2_REGISTER_OFFSET,
2535 EVERGREEN_DP3_REGISTER_OFFSET,
2536 EVERGREEN_DP4_REGISTER_OFFSET,
2537 EVERGREEN_DP5_REGISTER_OFFSET
2538 };
2539
2540 static const unsigned evergreen_disp_int_status[] =
2541 {
2542 DISP_INTERRUPT_STATUS,
2543 DISP_INTERRUPT_STATUS_CONTINUE,
2544 DISP_INTERRUPT_STATUS_CONTINUE2,
2545 DISP_INTERRUPT_STATUS_CONTINUE3,
2546 DISP_INTERRUPT_STATUS_CONTINUE4,
2547 DISP_INTERRUPT_STATUS_CONTINUE5
2548 };
2549
2550 /*
2551 * Assumption is that EVERGREEN_CRTC_MASTER_EN is enabled for the requested crtc.
2552 * We go from crtc to connector, which is not reliable since it should
2553 * really be the opposite direction. If the crtc is enabled, then
2554 * find the dig_fe which selects this crtc and ensure that it is enabled.
2555 * If such a dig_fe is found, then find the dig_be which selects the found
2556 * dig_fe and ensure that it is enabled and in DP_SST mode.
2557 * If UNIPHY_PLL_CONTROL1 is enabled, then we should disconnect the timing
2558 * from the dp symbol clocks.
2559 */
2560 static bool evergreen_is_dp_sst_stream_enabled(struct radeon_device *rdev,
2561 unsigned crtc_id, unsigned *ret_dig_fe)
2562 {
2563 unsigned i;
2564 unsigned dig_fe;
2565 unsigned dig_be;
2566 unsigned dig_en_be;
2567 unsigned uniphy_pll;
2568 unsigned digs_fe_selected;
2569 unsigned dig_be_mode;
2570 unsigned dig_fe_mask;
2571 bool is_enabled = false;
2572 bool found_crtc = false;
2573
2574 /* loop through all running dig_fe to find selected crtc */
2575 for (i = 0; i < ARRAY_SIZE(ni_dig_offsets); i++) {
2576 dig_fe = RREG32(NI_DIG_FE_CNTL + ni_dig_offsets[i]);
2577 if (dig_fe & NI_DIG_FE_CNTL_SYMCLK_FE_ON &&
2578 crtc_id == NI_DIG_FE_CNTL_SOURCE_SELECT(dig_fe)) {
2579 /* found running pipe */
2580 found_crtc = true;
2581 dig_fe_mask = 1 << i;
2582 dig_fe = i;
2583 break;
2584 }
2585 }
2586
2587 if (found_crtc) {
2588 /* loop through all running dig_be to find selected dig_fe */
2589 for (i = 0; i < ARRAY_SIZE(ni_dig_offsets); i++) {
2590 dig_be = RREG32(NI_DIG_BE_CNTL + ni_dig_offsets[i]);
2591 /* is dig_fe selected by this dig_be? */
2592 digs_fe_selected = NI_DIG_BE_CNTL_FE_SOURCE_SELECT(dig_be);
2593 dig_be_mode = NI_DIG_FE_CNTL_MODE(dig_be);
2594 if (dig_fe_mask & digs_fe_selected &&
2595 /* is dig_be in sst mode? */
2596 dig_be_mode == NI_DIG_BE_DPSST) {
2597 dig_en_be = RREG32(NI_DIG_BE_EN_CNTL +
2598 ni_dig_offsets[i]);
2599 uniphy_pll = RREG32(NI_DCIO_UNIPHY0_PLL_CONTROL1 +
2600 ni_tx_offsets[i]);
2601 /* dig_be enabled and tx is running */
2602 if (dig_en_be & NI_DIG_BE_EN_CNTL_ENABLE &&
2603 dig_en_be & NI_DIG_BE_EN_CNTL_SYMBCLK_ON &&
2604 uniphy_pll & NI_DCIO_UNIPHY0_PLL_CONTROL1_ENABLE) {
2605 is_enabled = true;
2606 *ret_dig_fe = dig_fe;
2607 break;
2608 }
2609 }
2610 }
2611 }
2612
2613 return is_enabled;
2614 }
2615
2616 /*
2617 * Blank dig when in dp sst mode
2618 * Dig ignores crtc timing
2619 */
2620 static void evergreen_blank_dp_output(struct radeon_device *rdev,
2621 unsigned dig_fe)
2622 {
2623 unsigned stream_ctrl;
2624 unsigned fifo_ctrl;
2625 unsigned counter = 0;
2626
2627 if (dig_fe >= ARRAY_SIZE(evergreen_dp_offsets)) {
2628 DRM_ERROR("invalid dig_fe %d\n", dig_fe);
2629 return;
2630 }
2631
2632 stream_ctrl = RREG32(EVERGREEN_DP_VID_STREAM_CNTL +
2633 evergreen_dp_offsets[dig_fe]);
2634 if (!(stream_ctrl & EVERGREEN_DP_VID_STREAM_CNTL_ENABLE)) {
2635 DRM_ERROR("dig %d , should be enable\n", dig_fe);
2636 return;
2637 }
2638
2639 stream_ctrl &=~EVERGREEN_DP_VID_STREAM_CNTL_ENABLE;
2640 WREG32(EVERGREEN_DP_VID_STREAM_CNTL +
2641 evergreen_dp_offsets[dig_fe], stream_ctrl);
2642
2643 stream_ctrl = RREG32(EVERGREEN_DP_VID_STREAM_CNTL +
2644 evergreen_dp_offsets[dig_fe]);
2645 while (counter < 32 && stream_ctrl & EVERGREEN_DP_VID_STREAM_STATUS) {
2646 msleep(1);
2647 counter++;
2648 stream_ctrl = RREG32(EVERGREEN_DP_VID_STREAM_CNTL +
2649 evergreen_dp_offsets[dig_fe]);
2650 }
2651 if (counter >= 32)
2652 DRM_ERROR("counter exceeds %d\n", counter);
2653
2654 fifo_ctrl = RREG32(EVERGREEN_DP_STEER_FIFO + evergreen_dp_offsets[dig_fe]);
2655 fifo_ctrl |= EVERGREEN_DP_STEER_FIFO_RESET;
2656 WREG32(EVERGREEN_DP_STEER_FIFO + evergreen_dp_offsets[dig_fe], fifo_ctrl);
2657
2658 }
2659
2660 void evergreen_mc_stop(struct radeon_device *rdev, struct evergreen_mc_save *save)
2661 {
2662 u32 crtc_enabled, tmp, frame_count, blackout;
2663 int i, j;
2664 unsigned dig_fe;
2665
2666 if (!ASIC_IS_NODCE(rdev)) {
2667 save->vga_render_control = RREG32(VGA_RENDER_CONTROL);
2668 save->vga_hdp_control = RREG32(VGA_HDP_CONTROL);
2669
2670 /* disable VGA render */
2671 WREG32(VGA_RENDER_CONTROL, 0);
2672 }
2673 /* blank the display controllers */
2674 for (i = 0; i < rdev->num_crtc; i++) {
2675 crtc_enabled = RREG32(EVERGREEN_CRTC_CONTROL + crtc_offsets[i]) & EVERGREEN_CRTC_MASTER_EN;
2676 if (crtc_enabled) {
2677 save->crtc_enabled[i] = true;
2678 if (ASIC_IS_DCE6(rdev)) {
2679 tmp = RREG32(EVERGREEN_CRTC_BLANK_CONTROL + crtc_offsets[i]);
2680 if (!(tmp & EVERGREEN_CRTC_BLANK_DATA_EN)) {
2681 radeon_wait_for_vblank(rdev, i);
2682 WREG32(EVERGREEN_CRTC_UPDATE_LOCK + crtc_offsets[i], 1);
2683 tmp |= EVERGREEN_CRTC_BLANK_DATA_EN;
2684 WREG32(EVERGREEN_CRTC_BLANK_CONTROL + crtc_offsets[i], tmp);
2685 WREG32(EVERGREEN_CRTC_UPDATE_LOCK + crtc_offsets[i], 0);
2686 }
2687 } else {
2688 tmp = RREG32(EVERGREEN_CRTC_CONTROL + crtc_offsets[i]);
2689 if (!(tmp & EVERGREEN_CRTC_DISP_READ_REQUEST_DISABLE)) {
2690 radeon_wait_for_vblank(rdev, i);
2691 WREG32(EVERGREEN_CRTC_UPDATE_LOCK + crtc_offsets[i], 1);
2692 tmp |= EVERGREEN_CRTC_DISP_READ_REQUEST_DISABLE;
2693 WREG32(EVERGREEN_CRTC_CONTROL + crtc_offsets[i], tmp);
2694 WREG32(EVERGREEN_CRTC_UPDATE_LOCK + crtc_offsets[i], 0);
2695 }
2696 }
2697 /* wait for the next frame */
2698 frame_count = radeon_get_vblank_counter(rdev, i);
2699 for (j = 0; j < rdev->usec_timeout; j++) {
2700 if (radeon_get_vblank_counter(rdev, i) != frame_count)
2701 break;
2702 udelay(1);
2703 }
2704 /* We should disable the dig if it drives a dp sst stream,
2705 * but we are in radeon_device_init and the topology is unknown;
2706 * it only becomes available after radeon_modeset_init.
2707 * The method radeon_atom_encoder_dpms_dig would do the job
2708 * if we initialized it properly;
2709 * for now we do it manually here.
2710 */
2711 if (ASIC_IS_DCE5(rdev) &&
2712 evergreen_is_dp_sst_stream_enabled(rdev, i ,&dig_fe))
2713 evergreen_blank_dp_output(rdev, dig_fe);
2714 /* we could remove the 6 lines below */
2715 /* XXX this is a hack to avoid strange behavior with EFI on certain systems */
2716 WREG32(EVERGREEN_CRTC_UPDATE_LOCK + crtc_offsets[i], 1);
2717 tmp = RREG32(EVERGREEN_CRTC_CONTROL + crtc_offsets[i]);
2718 tmp &= ~EVERGREEN_CRTC_MASTER_EN;
2719 WREG32(EVERGREEN_CRTC_CONTROL + crtc_offsets[i], tmp);
2720 WREG32(EVERGREEN_CRTC_UPDATE_LOCK + crtc_offsets[i], 0);
2721 save->crtc_enabled[i] = false;
2722 /* ***** */
2723 } else {
2724 save->crtc_enabled[i] = false;
2725 }
2726 }
2727
2728 radeon_mc_wait_for_idle(rdev);
2729
2730 blackout = RREG32(MC_SHARED_BLACKOUT_CNTL);
2731 if ((blackout & BLACKOUT_MODE_MASK) != 1) {
2732 /* Block CPU access */
2733 WREG32(BIF_FB_EN, 0);
2734 /* blackout the MC */
2735 blackout &= ~BLACKOUT_MODE_MASK;
2736 WREG32(MC_SHARED_BLACKOUT_CNTL, blackout | 1);
2737 }
2738 /* wait for the MC to settle */
2739 udelay(100);
2740
2741 /* lock double buffered regs */
2742 for (i = 0; i < rdev->num_crtc; i++) {
2743 if (save->crtc_enabled[i]) {
2744 tmp = RREG32(EVERGREEN_GRPH_UPDATE + crtc_offsets[i]);
2745 if (!(tmp & EVERGREEN_GRPH_UPDATE_LOCK)) {
2746 tmp |= EVERGREEN_GRPH_UPDATE_LOCK;
2747 WREG32(EVERGREEN_GRPH_UPDATE + crtc_offsets[i], tmp);
2748 }
2749 tmp = RREG32(EVERGREEN_MASTER_UPDATE_LOCK + crtc_offsets[i]);
2750 if (!(tmp & 1)) {
2751 tmp |= 1;
2752 WREG32(EVERGREEN_MASTER_UPDATE_LOCK + crtc_offsets[i], tmp);
2753 }
2754 }
2755 }
2756 }
2757
2758 void evergreen_mc_resume(struct radeon_device *rdev, struct evergreen_mc_save *save)
2759 {
2760 u32 tmp, frame_count;
2761 int i, j;
2762
2763 /* update crtc base addresses */
2764 for (i = 0; i < rdev->num_crtc; i++) {
2765 WREG32(EVERGREEN_GRPH_PRIMARY_SURFACE_ADDRESS_HIGH + crtc_offsets[i],
2766 upper_32_bits(rdev->mc.vram_start));
2767 WREG32(EVERGREEN_GRPH_SECONDARY_SURFACE_ADDRESS_HIGH + crtc_offsets[i],
2768 upper_32_bits(rdev->mc.vram_start));
2769 WREG32(EVERGREEN_GRPH_PRIMARY_SURFACE_ADDRESS + crtc_offsets[i],
2770 (u32)rdev->mc.vram_start);
2771 WREG32(EVERGREEN_GRPH_SECONDARY_SURFACE_ADDRESS + crtc_offsets[i],
2772 (u32)rdev->mc.vram_start);
2773 }
2774
2775 if (!ASIC_IS_NODCE(rdev)) {
2776 WREG32(EVERGREEN_VGA_MEMORY_BASE_ADDRESS_HIGH, upper_32_bits(rdev->mc.vram_start));
2777 WREG32(EVERGREEN_VGA_MEMORY_BASE_ADDRESS, (u32)rdev->mc.vram_start);
2778 }
2779
2780 /* unlock regs and wait for update */
2781 for (i = 0; i < rdev->num_crtc; i++) {
2782 if (save->crtc_enabled[i]) {
2783 tmp = RREG32(EVERGREEN_MASTER_UPDATE_MODE + crtc_offsets[i]);
2784 if ((tmp & 0x7) != 0) {
2785 tmp &= ~0x7;
2786 WREG32(EVERGREEN_MASTER_UPDATE_MODE + crtc_offsets[i], tmp);
2787 }
2788 tmp = RREG32(EVERGREEN_GRPH_UPDATE + crtc_offsets[i]);
2789 if (tmp & EVERGREEN_GRPH_UPDATE_LOCK) {
2790 tmp &= ~EVERGREEN_GRPH_UPDATE_LOCK;
2791 WREG32(EVERGREEN_GRPH_UPDATE + crtc_offsets[i], tmp);
2792 }
2793 tmp = RREG32(EVERGREEN_MASTER_UPDATE_LOCK + crtc_offsets[i]);
2794 if (tmp & 1) {
2795 tmp &= ~1;
2796 WREG32(EVERGREEN_MASTER_UPDATE_LOCK + crtc_offsets[i], tmp);
2797 }
2798 for (j = 0; j < rdev->usec_timeout; j++) {
2799 tmp = RREG32(EVERGREEN_GRPH_UPDATE + crtc_offsets[i]);
2800 if ((tmp & EVERGREEN_GRPH_SURFACE_UPDATE_PENDING) == 0)
2801 break;
2802 udelay(1);
2803 }
2804 }
2805 }
2806
2807 /* unblackout the MC */
2808 tmp = RREG32(MC_SHARED_BLACKOUT_CNTL);
2809 tmp &= ~BLACKOUT_MODE_MASK;
2810 WREG32(MC_SHARED_BLACKOUT_CNTL, tmp);
2811 /* allow CPU access */
2812 WREG32(BIF_FB_EN, FB_READ_EN | FB_WRITE_EN);
2813
2814 for (i = 0; i < rdev->num_crtc; i++) {
2815 if (save->crtc_enabled[i]) {
2816 if (ASIC_IS_DCE6(rdev)) {
2817 tmp = RREG32(EVERGREEN_CRTC_BLANK_CONTROL + crtc_offsets[i]);
2818 tmp &= ~EVERGREEN_CRTC_BLANK_DATA_EN;
2819 WREG32(EVERGREEN_CRTC_UPDATE_LOCK + crtc_offsets[i], 1);
2820 WREG32(EVERGREEN_CRTC_BLANK_CONTROL + crtc_offsets[i], tmp);
2821 WREG32(EVERGREEN_CRTC_UPDATE_LOCK + crtc_offsets[i], 0);
2822 } else {
2823 tmp = RREG32(EVERGREEN_CRTC_CONTROL + crtc_offsets[i]);
2824 tmp &= ~EVERGREEN_CRTC_DISP_READ_REQUEST_DISABLE;
2825 WREG32(EVERGREEN_CRTC_UPDATE_LOCK + crtc_offsets[i], 1);
2826 WREG32(EVERGREEN_CRTC_CONTROL + crtc_offsets[i], tmp);
2827 WREG32(EVERGREEN_CRTC_UPDATE_LOCK + crtc_offsets[i], 0);
2828 }
2829 /* wait for the next frame */
2830 frame_count = radeon_get_vblank_counter(rdev, i);
2831 for (j = 0; j < rdev->usec_timeout; j++) {
2832 if (radeon_get_vblank_counter(rdev, i) != frame_count)
2833 break;
2834 udelay(1);
2835 }
2836 }
2837 }
2838 if (!ASIC_IS_NODCE(rdev)) {
2839 /* Unlock vga access */
2840 WREG32(VGA_HDP_CONTROL, save->vga_hdp_control);
2841 mdelay(1);
2842 WREG32(VGA_RENDER_CONTROL, save->vga_render_control);
2843 }
2844 }
2845
2846 void evergreen_mc_program(struct radeon_device *rdev)
2847 {
2848 struct evergreen_mc_save save;
2849 u32 tmp;
2850 int i, j;
2851
2852 /* Initialize HDP */
2853 for (i = 0, j = 0; i < 32; i++, j += 0x18) {
2854 WREG32((0x2c14 + j), 0x00000000);
2855 WREG32((0x2c18 + j), 0x00000000);
2856 WREG32((0x2c1c + j), 0x00000000);
2857 WREG32((0x2c20 + j), 0x00000000);
2858 WREG32((0x2c24 + j), 0x00000000);
2859 }
2860 WREG32(HDP_REG_COHERENCY_FLUSH_CNTL, 0);
2861
2862 evergreen_mc_stop(rdev, &save);
2863 if (evergreen_mc_wait_for_idle(rdev)) {
2864 dev_warn(rdev->dev, "Wait for MC idle timed out!\n");
2865 }
2866 /* Lockout access through VGA aperture*/
2867 WREG32(VGA_HDP_CONTROL, VGA_MEMORY_DISABLE);
2868 /* Update configuration */
2869 if (rdev->flags & RADEON_IS_AGP) {
2870 if (rdev->mc.vram_start < rdev->mc.gtt_start) {
2871 /* VRAM before AGP */
2872 WREG32(MC_VM_SYSTEM_APERTURE_LOW_ADDR,
2873 rdev->mc.vram_start >> 12);
2874 WREG32(MC_VM_SYSTEM_APERTURE_HIGH_ADDR,
2875 rdev->mc.gtt_end >> 12);
2876 } else {
2877 /* VRAM after AGP */
2878 WREG32(MC_VM_SYSTEM_APERTURE_LOW_ADDR,
2879 rdev->mc.gtt_start >> 12);
2880 WREG32(MC_VM_SYSTEM_APERTURE_HIGH_ADDR,
2881 rdev->mc.vram_end >> 12);
2882 }
2883 } else {
2884 WREG32(MC_VM_SYSTEM_APERTURE_LOW_ADDR,
2885 rdev->mc.vram_start >> 12);
2886 WREG32(MC_VM_SYSTEM_APERTURE_HIGH_ADDR,
2887 rdev->mc.vram_end >> 12);
2888 }
2889 WREG32(MC_VM_SYSTEM_APERTURE_DEFAULT_ADDR, rdev->vram_scratch.gpu_addr >> 12);
2890 /* llano/ontario only */
2891 if ((rdev->family == CHIP_PALM) ||
2892 (rdev->family == CHIP_SUMO) ||
2893 (rdev->family == CHIP_SUMO2)) {
2894 tmp = RREG32(MC_FUS_VM_FB_OFFSET) & 0x000FFFFF;
2895 tmp |= ((rdev->mc.vram_end >> 20) & 0xF) << 24;
2896 tmp |= ((rdev->mc.vram_start >> 20) & 0xF) << 20;
2897 WREG32(MC_FUS_VM_FB_OFFSET, tmp);
2898 }
2899 tmp = ((rdev->mc.vram_end >> 24) & 0xFFFF) << 16;
2900 tmp |= ((rdev->mc.vram_start >> 24) & 0xFFFF);
2901 WREG32(MC_VM_FB_LOCATION, tmp);
2902 WREG32(HDP_NONSURFACE_BASE, (rdev->mc.vram_start >> 8));
2903 WREG32(HDP_NONSURFACE_INFO, (2 << 7) | (1 << 30));
2904 WREG32(HDP_NONSURFACE_SIZE, 0x3FFFFFFF);
2905 if (rdev->flags & RADEON_IS_AGP) {
2906 WREG32(MC_VM_AGP_TOP, rdev->mc.gtt_end >> 16);
2907 WREG32(MC_VM_AGP_BOT, rdev->mc.gtt_start >> 16);
2908 WREG32(MC_VM_AGP_BASE, rdev->mc.agp_base >> 22);
2909 } else {
2910 WREG32(MC_VM_AGP_BASE, 0);
2911 WREG32(MC_VM_AGP_TOP, 0x0FFFFFFF);
2912 WREG32(MC_VM_AGP_BOT, 0x0FFFFFFF);
2913 }
2914 if (evergreen_mc_wait_for_idle(rdev)) {
2915 dev_warn(rdev->dev, "Wait for MC idle timed out!\n");
2916 }
2917 evergreen_mc_resume(rdev, &save);
2918 /* we need to own VRAM, so turn off the VGA renderer here
2919 * to stop it overwriting our objects */
2920 rv515_vga_render_disable(rdev);
2921 }
2922
2923 /*
2924 * CP.
2925 */
2926 void evergreen_ring_ib_execute(struct radeon_device *rdev, struct radeon_ib *ib)
2927 {
2928 struct radeon_ring *ring = &rdev->ring[ib->ring];
2929 u32 next_rptr;
2930
2931 /* set to DX10/11 mode */
2932 radeon_ring_write(ring, PACKET3(PACKET3_MODE_CONTROL, 0));
2933 radeon_ring_write(ring, 1);
2934
2935 if (ring->rptr_save_reg) {
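/* 3 dwords for this SET_CONFIG_REG write plus 4 for the
 * INDIRECT_BUFFER packet that follows
 */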
2936 next_rptr = ring->wptr + 3 + 4;
2937 radeon_ring_write(ring, PACKET3(PACKET3_SET_CONFIG_REG, 1));
2938 radeon_ring_write(ring, ((ring->rptr_save_reg -
2939 PACKET3_SET_CONFIG_REG_START) >> 2));
2940 radeon_ring_write(ring, next_rptr);
2941 } else if (rdev->wb.enabled) {
2942 next_rptr = ring->wptr + 5 + 4;
2943 radeon_ring_write(ring, PACKET3(PACKET3_MEM_WRITE, 3));
2944 radeon_ring_write(ring, ring->next_rptr_gpu_addr & 0xfffffffc);
2945 radeon_ring_write(ring, (upper_32_bits(ring->next_rptr_gpu_addr) & 0xff) | (1 << 18));
2946 radeon_ring_write(ring, next_rptr);
2947 radeon_ring_write(ring, 0);
2948 }
2949
2950 radeon_ring_write(ring, PACKET3(PACKET3_INDIRECT_BUFFER, 2));
2951 radeon_ring_write(ring,
2952 #ifdef __BIG_ENDIAN
2953 (2 << 0) |
2954 #endif
2955 (ib->gpu_addr & 0xFFFFFFFC));
2956 radeon_ring_write(ring, upper_32_bits(ib->gpu_addr) & 0xFF);
2957 radeon_ring_write(ring, ib->length_dw);
2958 }
2959
2960
2961 static int evergreen_cp_load_microcode(struct radeon_device *rdev)
2962 {
2963 const __be32 *fw_data;
2964 int i;
2965
2966 if (!rdev->me_fw || !rdev->pfp_fw)
2967 return -EINVAL;
2968
2969 r700_cp_stop(rdev);
2970 WREG32(CP_RB_CNTL,
2971 #ifdef __BIG_ENDIAN
2972 BUF_SWAP_32BIT |
2973 #endif
2974 RB_NO_UPDATE | RB_BLKSZ(15) | RB_BUFSZ(3));
2975
2976 fw_data = (const __be32 *)rdev->pfp_fw->data;
2977 WREG32(CP_PFP_UCODE_ADDR, 0);
2978 for (i = 0; i < EVERGREEN_PFP_UCODE_SIZE; i++)
2979 WREG32(CP_PFP_UCODE_DATA, be32_to_cpup(fw_data++));
2980 WREG32(CP_PFP_UCODE_ADDR, 0);
2981
2982 fw_data = (const __be32 *)rdev->me_fw->data;
2983 WREG32(CP_ME_RAM_WADDR, 0);
2984 for (i = 0; i < EVERGREEN_PM4_UCODE_SIZE; i++)
2985 WREG32(CP_ME_RAM_DATA, be32_to_cpup(fw_data++));
2986
2987 WREG32(CP_PFP_UCODE_ADDR, 0);
2988 WREG32(CP_ME_RAM_WADDR, 0);
2989 WREG32(CP_ME_RAM_RADDR, 0);
2990 return 0;
2991 }
2992
2993 static int evergreen_cp_start(struct radeon_device *rdev)
2994 {
2995 struct radeon_ring *ring = &rdev->ring[RADEON_RING_TYPE_GFX_INDEX];
2996 int r, i;
2997 uint32_t cp_me;
2998
2999 r = radeon_ring_lock(rdev, ring, 7);
3000 if (r) {
3001 DRM_ERROR("radeon: cp failed to lock ring (%d).\n", r);
3002 return r;
3003 }
3004 radeon_ring_write(ring, PACKET3(PACKET3_ME_INITIALIZE, 5));
3005 radeon_ring_write(ring, 0x1);
3006 radeon_ring_write(ring, 0x0);
3007 radeon_ring_write(ring, rdev->config.evergreen.max_hw_contexts - 1);
3008 radeon_ring_write(ring, PACKET3_ME_INITIALIZE_DEVICE_ID(1));
3009 radeon_ring_write(ring, 0);
3010 radeon_ring_write(ring, 0);
3011 radeon_ring_unlock_commit(rdev, ring, false);
3012
3013 cp_me = 0xff;
3014 WREG32(CP_ME_CNTL, cp_me);
3015
3016 r = radeon_ring_lock(rdev, ring, evergreen_default_size + 19);
3017 if (r) {
3018 DRM_ERROR("radeon: cp failed to lock ring (%d).\n", r);
3019 return r;
3020 }
3021
3022 /* setup clear context state */
3023 radeon_ring_write(ring, PACKET3(PACKET3_PREAMBLE_CNTL, 0));
3024 radeon_ring_write(ring, PACKET3_PREAMBLE_BEGIN_CLEAR_STATE);
3025
3026 for (i = 0; i < evergreen_default_size; i++)
3027 radeon_ring_write(ring, evergreen_default_state[i]);
3028
3029 radeon_ring_write(ring, PACKET3(PACKET3_PREAMBLE_CNTL, 0));
3030 radeon_ring_write(ring, PACKET3_PREAMBLE_END_CLEAR_STATE);
3031
3032 /* set clear context state */
3033 radeon_ring_write(ring, PACKET3(PACKET3_CLEAR_STATE, 0));
3034 radeon_ring_write(ring, 0);
3035
3036 /* SQ_VTX_BASE_VTX_LOC */
3037 radeon_ring_write(ring, 0xc0026f00);
3038 radeon_ring_write(ring, 0x00000000);
3039 radeon_ring_write(ring, 0x00000000);
3040 radeon_ring_write(ring, 0x00000000);
3041
3042 /* Clear consts */
3043 radeon_ring_write(ring, 0xc0036f00);
3044 radeon_ring_write(ring, 0x00000bc4);
3045 radeon_ring_write(ring, 0xffffffff);
3046 radeon_ring_write(ring, 0xffffffff);
3047 radeon_ring_write(ring, 0xffffffff);
3048
3049 radeon_ring_write(ring, 0xc0026900);
3050 radeon_ring_write(ring, 0x00000316);
3051 radeon_ring_write(ring, 0x0000000e); /* VGT_VERTEX_REUSE_BLOCK_CNTL */
3052 radeon_ring_write(ring, 0x00000010); /* VGT_OUT_DEALLOC_CNTL */
3053
3054 radeon_ring_unlock_commit(rdev, ring, false);
3055
3056 return 0;
3057 }
3058
3059 static int evergreen_cp_resume(struct radeon_device *rdev)
3060 {
3061 struct radeon_ring *ring = &rdev->ring[RADEON_RING_TYPE_GFX_INDEX];
3062 u32 tmp;
3063 u32 rb_bufsz;
3064 int r;
3065
3066 /* Reset cp; if cp is reset, then PA, SH, VGT also need to be reset */
3067 WREG32(GRBM_SOFT_RESET, (SOFT_RESET_CP |
3068 SOFT_RESET_PA |
3069 SOFT_RESET_SH |
3070 SOFT_RESET_VGT |
3071 SOFT_RESET_SPI |
3072 SOFT_RESET_SX));
3073 RREG32(GRBM_SOFT_RESET);
3074 mdelay(15);
3075 WREG32(GRBM_SOFT_RESET, 0);
3076 RREG32(GRBM_SOFT_RESET);
3077
3078 /* Set ring buffer size */
3079 rb_bufsz = order_base_2(ring->ring_size / 8);
3080 tmp = (order_base_2(RADEON_GPU_PAGE_SIZE/8) << 8) | rb_bufsz;
3081 #ifdef __BIG_ENDIAN
3082 tmp |= BUF_SWAP_32BIT;
3083 #endif
3084 WREG32(CP_RB_CNTL, tmp);
3085 WREG32(CP_SEM_WAIT_TIMER, 0x0);
3086 WREG32(CP_SEM_INCOMPLETE_TIMER_CNTL, 0x0);
3087
3088 /* Set the write pointer delay */
3089 WREG32(CP_RB_WPTR_DELAY, 0);
3090
3091 /* Initialize the ring buffer's read and write pointers */
3092 WREG32(CP_RB_CNTL, tmp | RB_RPTR_WR_ENA);
3093 WREG32(CP_RB_RPTR_WR, 0);
3094 ring->wptr = 0;
3095 WREG32(CP_RB_WPTR, ring->wptr);
3096
3097 /* set the wb address whether it's enabled or not */
3098 WREG32(CP_RB_RPTR_ADDR,
3099 ((rdev->wb.gpu_addr + RADEON_WB_CP_RPTR_OFFSET) & 0xFFFFFFFC));
3100 WREG32(CP_RB_RPTR_ADDR_HI, upper_32_bits(rdev->wb.gpu_addr + RADEON_WB_CP_RPTR_OFFSET) & 0xFF);
3101 WREG32(SCRATCH_ADDR, ((rdev->wb.gpu_addr + RADEON_WB_SCRATCH_OFFSET) >> 8) & 0xFFFFFFFF);
3102
3103 if (rdev->wb.enabled)
3104 WREG32(SCRATCH_UMSK, 0xff);
3105 else {
3106 tmp |= RB_NO_UPDATE;
3107 WREG32(SCRATCH_UMSK, 0);
3108 }
3109
3110 mdelay(1);
3111 WREG32(CP_RB_CNTL, tmp);
3112
3113 WREG32(CP_RB_BASE, ring->gpu_addr >> 8);
3114 WREG32(CP_DEBUG, (1 << 27) | (1 << 28));
3115
3116 evergreen_cp_start(rdev);
3117 ring->ready = true;
3118 r = radeon_ring_test(rdev, RADEON_RING_TYPE_GFX_INDEX, ring);
3119 if (r) {
3120 ring->ready = false;
3121 return r;
3122 }
3123 return 0;
3124 }
3125
3126 /*
3127 * Core functions
3128 */
3129 static void evergreen_gpu_init(struct radeon_device *rdev)
3130 {
3131 u32 gb_addr_config;
3132 u32 mc_shared_chmap, mc_arb_ramcfg;
3133 u32 sx_debug_1;
3134 u32 smx_dc_ctl0;
3135 u32 sq_config;
3136 u32 sq_lds_resource_mgmt;
3137 u32 sq_gpr_resource_mgmt_1;
3138 u32 sq_gpr_resource_mgmt_2;
3139 u32 sq_gpr_resource_mgmt_3;
3140 u32 sq_thread_resource_mgmt;
3141 u32 sq_thread_resource_mgmt_2;
3142 u32 sq_stack_resource_mgmt_1;
3143 u32 sq_stack_resource_mgmt_2;
3144 u32 sq_stack_resource_mgmt_3;
3145 u32 vgt_cache_invalidation;
3146 u32 hdp_host_path_cntl, tmp;
3147 u32 disabled_rb_mask;
3148 int i, j, ps_thread_count;
3149
3150 switch (rdev->family) {
3151 case CHIP_CYPRESS:
3152 case CHIP_HEMLOCK:
3153 rdev->config.evergreen.num_ses = 2;
3154 rdev->config.evergreen.max_pipes = 4;
3155 rdev->config.evergreen.max_tile_pipes = 8;
3156 rdev->config.evergreen.max_simds = 10;
3157 rdev->config.evergreen.max_backends = 4 * rdev->config.evergreen.num_ses;
3158 rdev->config.evergreen.max_gprs = 256;
3159 rdev->config.evergreen.max_threads = 248;
3160 rdev->config.evergreen.max_gs_threads = 32;
3161 rdev->config.evergreen.max_stack_entries = 512;
3162 rdev->config.evergreen.sx_num_of_sets = 4;
3163 rdev->config.evergreen.sx_max_export_size = 256;
3164 rdev->config.evergreen.sx_max_export_pos_size = 64;
3165 rdev->config.evergreen.sx_max_export_smx_size = 192;
3166 rdev->config.evergreen.max_hw_contexts = 8;
3167 rdev->config.evergreen.sq_num_cf_insts = 2;
3168
3169 rdev->config.evergreen.sc_prim_fifo_size = 0x100;
3170 rdev->config.evergreen.sc_hiz_tile_fifo_size = 0x30;
3171 rdev->config.evergreen.sc_earlyz_tile_fifo_size = 0x130;
3172 gb_addr_config = CYPRESS_GB_ADDR_CONFIG_GOLDEN;
3173 break;
3174 case CHIP_JUNIPER:
3175 rdev->config.evergreen.num_ses = 1;
3176 rdev->config.evergreen.max_pipes = 4;
3177 rdev->config.evergreen.max_tile_pipes = 4;
3178 rdev->config.evergreen.max_simds = 10;
3179 rdev->config.evergreen.max_backends = 4 * rdev->config.evergreen.num_ses;
3180 rdev->config.evergreen.max_gprs = 256;
3181 rdev->config.evergreen.max_threads = 248;
3182 rdev->config.evergreen.max_gs_threads = 32;
3183 rdev->config.evergreen.max_stack_entries = 512;
3184 rdev->config.evergreen.sx_num_of_sets = 4;
3185 rdev->config.evergreen.sx_max_export_size = 256;
3186 rdev->config.evergreen.sx_max_export_pos_size = 64;
3187 rdev->config.evergreen.sx_max_export_smx_size = 192;
3188 rdev->config.evergreen.max_hw_contexts = 8;
3189 rdev->config.evergreen.sq_num_cf_insts = 2;
3190
3191 rdev->config.evergreen.sc_prim_fifo_size = 0x100;
3192 rdev->config.evergreen.sc_hiz_tile_fifo_size = 0x30;
3193 rdev->config.evergreen.sc_earlyz_tile_fifo_size = 0x130;
3194 gb_addr_config = JUNIPER_GB_ADDR_CONFIG_GOLDEN;
3195 break;
3196 case CHIP_REDWOOD:
3197 rdev->config.evergreen.num_ses = 1;
3198 rdev->config.evergreen.max_pipes = 4;
3199 rdev->config.evergreen.max_tile_pipes = 4;
3200 rdev->config.evergreen.max_simds = 5;
3201 rdev->config.evergreen.max_backends = 2 * rdev->config.evergreen.num_ses;
3202 rdev->config.evergreen.max_gprs = 256;
3203 rdev->config.evergreen.max_threads = 248;
3204 rdev->config.evergreen.max_gs_threads = 32;
3205 rdev->config.evergreen.max_stack_entries = 256;
3206 rdev->config.evergreen.sx_num_of_sets = 4;
3207 rdev->config.evergreen.sx_max_export_size = 256;
3208 rdev->config.evergreen.sx_max_export_pos_size = 64;
3209 rdev->config.evergreen.sx_max_export_smx_size = 192;
3210 rdev->config.evergreen.max_hw_contexts = 8;
3211 rdev->config.evergreen.sq_num_cf_insts = 2;
3212
3213 rdev->config.evergreen.sc_prim_fifo_size = 0x100;
3214 rdev->config.evergreen.sc_hiz_tile_fifo_size = 0x30;
3215 rdev->config.evergreen.sc_earlyz_tile_fifo_size = 0x130;
3216 gb_addr_config = REDWOOD_GB_ADDR_CONFIG_GOLDEN;
3217 break;
3218 case CHIP_CEDAR:
3219 default:
3220 rdev->config.evergreen.num_ses = 1;
3221 rdev->config.evergreen.max_pipes = 2;
3222 rdev->config.evergreen.max_tile_pipes = 2;
3223 rdev->config.evergreen.max_simds = 2;
3224 rdev->config.evergreen.max_backends = 1 * rdev->config.evergreen.num_ses;
3225 rdev->config.evergreen.max_gprs = 256;
3226 rdev->config.evergreen.max_threads = 192;
3227 rdev->config.evergreen.max_gs_threads = 16;
3228 rdev->config.evergreen.max_stack_entries = 256;
3229 rdev->config.evergreen.sx_num_of_sets = 4;
3230 rdev->config.evergreen.sx_max_export_size = 128;
3231 rdev->config.evergreen.sx_max_export_pos_size = 32;
3232 rdev->config.evergreen.sx_max_export_smx_size = 96;
3233 rdev->config.evergreen.max_hw_contexts = 4;
3234 rdev->config.evergreen.sq_num_cf_insts = 1;
3235
3236 rdev->config.evergreen.sc_prim_fifo_size = 0x40;
3237 rdev->config.evergreen.sc_hiz_tile_fifo_size = 0x30;
3238 rdev->config.evergreen.sc_earlyz_tile_fifo_size = 0x130;
3239 gb_addr_config = CEDAR_GB_ADDR_CONFIG_GOLDEN;
3240 break;
3241 case CHIP_PALM:
3242 rdev->config.evergreen.num_ses = 1;
3243 rdev->config.evergreen.max_pipes = 2;
3244 rdev->config.evergreen.max_tile_pipes = 2;
3245 rdev->config.evergreen.max_simds = 2;
3246 rdev->config.evergreen.max_backends = 1 * rdev->config.evergreen.num_ses;
3247 rdev->config.evergreen.max_gprs = 256;
3248 rdev->config.evergreen.max_threads = 192;
3249 rdev->config.evergreen.max_gs_threads = 16;
3250 rdev->config.evergreen.max_stack_entries = 256;
3251 rdev->config.evergreen.sx_num_of_sets = 4;
3252 rdev->config.evergreen.sx_max_export_size = 128;
3253 rdev->config.evergreen.sx_max_export_pos_size = 32;
3254 rdev->config.evergreen.sx_max_export_smx_size = 96;
3255 rdev->config.evergreen.max_hw_contexts = 4;
3256 rdev->config.evergreen.sq_num_cf_insts = 1;
3257
3258 rdev->config.evergreen.sc_prim_fifo_size = 0x40;
3259 rdev->config.evergreen.sc_hiz_tile_fifo_size = 0x30;
3260 rdev->config.evergreen.sc_earlyz_tile_fifo_size = 0x130;
3261 gb_addr_config = CEDAR_GB_ADDR_CONFIG_GOLDEN;
3262 break;
3263 case CHIP_SUMO:
3264 rdev->config.evergreen.num_ses = 1;
3265 rdev->config.evergreen.max_pipes = 4;
3266 rdev->config.evergreen.max_tile_pipes = 4;
3267 if (rdev->pdev->device == 0x9648)
3268 rdev->config.evergreen.max_simds = 3;
3269 else if ((rdev->pdev->device == 0x9647) ||
3270 (rdev->pdev->device == 0x964a))
3271 rdev->config.evergreen.max_simds = 4;
3272 else
3273 rdev->config.evergreen.max_simds = 5;
3274 rdev->config.evergreen.max_backends = 2 * rdev->config.evergreen.num_ses;
3275 rdev->config.evergreen.max_gprs = 256;
3276 rdev->config.evergreen.max_threads = 248;
3277 rdev->config.evergreen.max_gs_threads = 32;
3278 rdev->config.evergreen.max_stack_entries = 256;
3279 rdev->config.evergreen.sx_num_of_sets = 4;
3280 rdev->config.evergreen.sx_max_export_size = 256;
3281 rdev->config.evergreen.sx_max_export_pos_size = 64;
3282 rdev->config.evergreen.sx_max_export_smx_size = 192;
3283 rdev->config.evergreen.max_hw_contexts = 8;
3284 rdev->config.evergreen.sq_num_cf_insts = 2;
3285
3286 rdev->config.evergreen.sc_prim_fifo_size = 0x40;
3287 rdev->config.evergreen.sc_hiz_tile_fifo_size = 0x30;
3288 rdev->config.evergreen.sc_earlyz_tile_fifo_size = 0x130;
3289 gb_addr_config = SUMO_GB_ADDR_CONFIG_GOLDEN;
3290 break;
3291 case CHIP_SUMO2:
3292 rdev->config.evergreen.num_ses = 1;
3293 rdev->config.evergreen.max_pipes = 4;
3294 rdev->config.evergreen.max_tile_pipes = 4;
3295 rdev->config.evergreen.max_simds = 2;
3296 rdev->config.evergreen.max_backends = 1 * rdev->config.evergreen.num_ses;
3297 rdev->config.evergreen.max_gprs = 256;
3298 rdev->config.evergreen.max_threads = 248;
3299 rdev->config.evergreen.max_gs_threads = 32;
3300 rdev->config.evergreen.max_stack_entries = 512;
3301 rdev->config.evergreen.sx_num_of_sets = 4;
3302 rdev->config.evergreen.sx_max_export_size = 256;
3303 rdev->config.evergreen.sx_max_export_pos_size = 64;
3304 rdev->config.evergreen.sx_max_export_smx_size = 192;
3305 rdev->config.evergreen.max_hw_contexts = 4;
3306 rdev->config.evergreen.sq_num_cf_insts = 2;
3307
3308 rdev->config.evergreen.sc_prim_fifo_size = 0x40;
3309 rdev->config.evergreen.sc_hiz_tile_fifo_size = 0x30;
3310 rdev->config.evergreen.sc_earlyz_tile_fifo_size = 0x130;
3311 gb_addr_config = SUMO2_GB_ADDR_CONFIG_GOLDEN;
3312 break;
3313 case CHIP_BARTS:
3314 rdev->config.evergreen.num_ses = 2;
3315 rdev->config.evergreen.max_pipes = 4;
3316 rdev->config.evergreen.max_tile_pipes = 8;
3317 rdev->config.evergreen.max_simds = 7;
3318 rdev->config.evergreen.max_backends = 4 * rdev->config.evergreen.num_ses;
3319 rdev->config.evergreen.max_gprs = 256;
3320 rdev->config.evergreen.max_threads = 248;
3321 rdev->config.evergreen.max_gs_threads = 32;
3322 rdev->config.evergreen.max_stack_entries = 512;
3323 rdev->config.evergreen.sx_num_of_sets = 4;
3324 rdev->config.evergreen.sx_max_export_size = 256;
3325 rdev->config.evergreen.sx_max_export_pos_size = 64;
3326 rdev->config.evergreen.sx_max_export_smx_size = 192;
3327 rdev->config.evergreen.max_hw_contexts = 8;
3328 rdev->config.evergreen.sq_num_cf_insts = 2;
3329
3330 rdev->config.evergreen.sc_prim_fifo_size = 0x100;
3331 rdev->config.evergreen.sc_hiz_tile_fifo_size = 0x30;
3332 rdev->config.evergreen.sc_earlyz_tile_fifo_size = 0x130;
3333 gb_addr_config = BARTS_GB_ADDR_CONFIG_GOLDEN;
3334 break;
3335 case CHIP_TURKS:
3336 rdev->config.evergreen.num_ses = 1;
3337 rdev->config.evergreen.max_pipes = 4;
3338 rdev->config.evergreen.max_tile_pipes = 4;
3339 rdev->config.evergreen.max_simds = 6;
3340 rdev->config.evergreen.max_backends = 2 * rdev->config.evergreen.num_ses;
3341 rdev->config.evergreen.max_gprs = 256;
3342 rdev->config.evergreen.max_threads = 248;
3343 rdev->config.evergreen.max_gs_threads = 32;
3344 rdev->config.evergreen.max_stack_entries = 256;
3345 rdev->config.evergreen.sx_num_of_sets = 4;
3346 rdev->config.evergreen.sx_max_export_size = 256;
3347 rdev->config.evergreen.sx_max_export_pos_size = 64;
3348 rdev->config.evergreen.sx_max_export_smx_size = 192;
3349 rdev->config.evergreen.max_hw_contexts = 8;
3350 rdev->config.evergreen.sq_num_cf_insts = 2;
3351
3352 rdev->config.evergreen.sc_prim_fifo_size = 0x100;
3353 rdev->config.evergreen.sc_hiz_tile_fifo_size = 0x30;
3354 rdev->config.evergreen.sc_earlyz_tile_fifo_size = 0x130;
3355 gb_addr_config = TURKS_GB_ADDR_CONFIG_GOLDEN;
3356 break;
3357 case CHIP_CAICOS:
3358 rdev->config.evergreen.num_ses = 1;
3359 rdev->config.evergreen.max_pipes = 2;
3360 rdev->config.evergreen.max_tile_pipes = 2;
3361 rdev->config.evergreen.max_simds = 2;
3362 rdev->config.evergreen.max_backends = 1 * rdev->config.evergreen.num_ses;
3363 rdev->config.evergreen.max_gprs = 256;
3364 rdev->config.evergreen.max_threads = 192;
3365 rdev->config.evergreen.max_gs_threads = 16;
3366 rdev->config.evergreen.max_stack_entries = 256;
3367 rdev->config.evergreen.sx_num_of_sets = 4;
3368 rdev->config.evergreen.sx_max_export_size = 128;
3369 rdev->config.evergreen.sx_max_export_pos_size = 32;
3370 rdev->config.evergreen.sx_max_export_smx_size = 96;
3371 rdev->config.evergreen.max_hw_contexts = 4;
3372 rdev->config.evergreen.sq_num_cf_insts = 1;
3373
3374 rdev->config.evergreen.sc_prim_fifo_size = 0x40;
3375 rdev->config.evergreen.sc_hiz_tile_fifo_size = 0x30;
3376 rdev->config.evergreen.sc_earlyz_tile_fifo_size = 0x130;
3377 gb_addr_config = CAICOS_GB_ADDR_CONFIG_GOLDEN;
3378 break;
3379 }
3380
3381 /* Initialize HDP */
3382 for (i = 0, j = 0; i < 32; i++, j += 0x18) {
3383 WREG32((0x2c14 + j), 0x00000000);
3384 WREG32((0x2c18 + j), 0x00000000);
3385 WREG32((0x2c1c + j), 0x00000000);
3386 WREG32((0x2c20 + j), 0x00000000);
3387 WREG32((0x2c24 + j), 0x00000000);
3388 }
3389
3390 WREG32(GRBM_CNTL, GRBM_READ_TIMEOUT(0xff));
3391 WREG32(SRBM_INT_CNTL, 0x1);
3392 WREG32(SRBM_INT_ACK, 0x1);
3393
3394 evergreen_fix_pci_max_read_req_size(rdev);
3395
3396 mc_shared_chmap = RREG32(MC_SHARED_CHMAP);
3397 if ((rdev->family == CHIP_PALM) ||
3398 (rdev->family == CHIP_SUMO) ||
3399 (rdev->family == CHIP_SUMO2))
3400 mc_arb_ramcfg = RREG32(FUS_MC_ARB_RAMCFG);
3401 else
3402 mc_arb_ramcfg = RREG32(MC_ARB_RAMCFG);
3403
3404 /* setup tiling info dword. gb_addr_config is not adequate since it does
3405 * not have bank info, so create a custom tiling dword.
3406 * bits 3:0 num_pipes
3407 * bits 7:4 num_banks
3408 * bits 11:8 group_size
3409 * bits 15:12 row_size
3410 */
3411 rdev->config.evergreen.tile_config = 0;
3412 switch (rdev->config.evergreen.max_tile_pipes) {
3413 case 1:
3414 default:
3415 rdev->config.evergreen.tile_config |= (0 << 0);
3416 break;
3417 case 2:
3418 rdev->config.evergreen.tile_config |= (1 << 0);
3419 break;
3420 case 4:
3421 rdev->config.evergreen.tile_config |= (2 << 0);
3422 break;
3423 case 8:
3424 rdev->config.evergreen.tile_config |= (3 << 0);
3425 break;
3426 }
3427 /* num banks is 8 on all fusion asics. 0 = 4, 1 = 8, 2 = 16 */
3428 if (rdev->flags & RADEON_IS_IGP)
3429 rdev->config.evergreen.tile_config |= 1 << 4;
3430 else {
3431 switch ((mc_arb_ramcfg & NOOFBANK_MASK) >> NOOFBANK_SHIFT) {
3432 case 0: /* four banks */
3433 rdev->config.evergreen.tile_config |= 0 << 4;
3434 break;
3435 case 1: /* eight banks */
3436 rdev->config.evergreen.tile_config |= 1 << 4;
3437 break;
3438 case 2: /* sixteen banks */
3439 default:
3440 rdev->config.evergreen.tile_config |= 2 << 4;
3441 break;
3442 }
3443 }
3444 rdev->config.evergreen.tile_config |= 0 << 8;
3445 rdev->config.evergreen.tile_config |=
3446 ((gb_addr_config & 0x30000000) >> 28) << 12;
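/* Illustrative example (not read from hardware): a part with 8 tile pipes
 * (3 << 0), 8 banks (1 << 4), a 256B group size (0 << 8) and a row-size
 * field of 2 from gb_addr_config would yield tile_config = 0x2013. */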
3447
3448 if ((rdev->family >= CHIP_CEDAR) && (rdev->family <= CHIP_HEMLOCK)) {
3449 u32 efuse_straps_4;
3450 u32 efuse_straps_3;
3451
3452 efuse_straps_4 = RREG32_RCU(0x204);
3453 efuse_straps_3 = RREG32_RCU(0x203);
3454 tmp = (((efuse_straps_4 & 0xf) << 4) |
3455 ((efuse_straps_3 & 0xf0000000) >> 28));
3456 } else {
3457 tmp = 0;
3458 for (i = (rdev->config.evergreen.num_ses - 1); i >= 0; i--) {
3459 u32 rb_disable_bitmap;
3460
3461 WREG32(GRBM_GFX_INDEX, INSTANCE_BROADCAST_WRITES | SE_INDEX(i));
3462 WREG32(RLC_GFX_INDEX, INSTANCE_BROADCAST_WRITES | SE_INDEX(i));
3463 rb_disable_bitmap = (RREG32(CC_RB_BACKEND_DISABLE) & 0x00ff0000) >> 16;
3464 tmp <<= 4;
3465 tmp |= rb_disable_bitmap;
3466 }
3467 }
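/* tmp now packs one 4-bit RB-disable bitmap per shader engine, with SE0
 * ending up in the low nibble; e.g. SE0 = 0x1 and SE1 = 0x2 on a two-SE
 * part combine to 0x21 (illustrative values). */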
3468 	/* enabled RBs are just the ones not disabled :) */
3469 disabled_rb_mask = tmp;
3470 tmp = 0;
3471 for (i = 0; i < rdev->config.evergreen.max_backends; i++)
3472 tmp |= (1 << i);
3473 /* if all the backends are disabled, fix it up here */
3474 if ((disabled_rb_mask & tmp) == tmp) {
3475 for (i = 0; i < rdev->config.evergreen.max_backends; i++)
3476 disabled_rb_mask &= ~(1 << i);
3477 }
3478
3479 for (i = 0; i < rdev->config.evergreen.num_ses; i++) {
3480 u32 simd_disable_bitmap;
3481
3482 WREG32(GRBM_GFX_INDEX, INSTANCE_BROADCAST_WRITES | SE_INDEX(i));
3483 WREG32(RLC_GFX_INDEX, INSTANCE_BROADCAST_WRITES | SE_INDEX(i));
3484 simd_disable_bitmap = (RREG32(CC_GC_SHADER_PIPE_CONFIG) & 0xffff0000) >> 16;
3485 simd_disable_bitmap |= 0xffffffff << rdev->config.evergreen.max_simds;
3486 tmp <<= 16;
3487 tmp |= simd_disable_bitmap;
3488 }
3489 rdev->config.evergreen.active_simds = hweight32(~tmp);
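/* ~tmp turns disable bits into enable bits, so hweight32() counts the
 * active SIMDs; e.g. one SE with max_simds = 10 and a fuse bitmap of 0x3
 * gives tmp = 0xfffffc03 and hweight32(~tmp) = 8 (illustrative values). */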
3490
3491 WREG32(GRBM_GFX_INDEX, INSTANCE_BROADCAST_WRITES | SE_BROADCAST_WRITES);
3492 WREG32(RLC_GFX_INDEX, INSTANCE_BROADCAST_WRITES | SE_BROADCAST_WRITES);
3493
3494 WREG32(GB_ADDR_CONFIG, gb_addr_config);
3495 WREG32(DMIF_ADDR_CONFIG, gb_addr_config);
3496 WREG32(HDP_ADDR_CONFIG, gb_addr_config);
3497 WREG32(DMA_TILING_CONFIG, gb_addr_config);
3498 WREG32(UVD_UDEC_ADDR_CONFIG, gb_addr_config);
3499 WREG32(UVD_UDEC_DB_ADDR_CONFIG, gb_addr_config);
3500 WREG32(UVD_UDEC_DBW_ADDR_CONFIG, gb_addr_config);
3501
3502 if ((rdev->config.evergreen.max_backends == 1) &&
3503 (rdev->flags & RADEON_IS_IGP)) {
3504 if ((disabled_rb_mask & 3) == 1) {
3505 /* RB0 disabled, RB1 enabled */
3506 tmp = 0x11111111;
3507 } else {
3508 /* RB1 disabled, RB0 enabled */
3509 tmp = 0x00000000;
3510 }
3511 } else {
3512 tmp = gb_addr_config & NUM_PIPES_MASK;
3513 tmp = r6xx_remap_render_backend(rdev, tmp, rdev->config.evergreen.max_backends,
3514 EVERGREEN_MAX_BACKENDS, disabled_rb_mask);
3515 }
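/* backend_map holds one RB index per nibble, one nibble per pipe; the IGP
 * special case above therefore routes every pipe to RB1 (0x11111111) when
 * RB0 is disabled, and to RB0 (0x00000000) otherwise. */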
3516 rdev->config.evergreen.backend_map = tmp;
3517 WREG32(GB_BACKEND_MAP, tmp);
3518
3519 WREG32(CGTS_SYS_TCC_DISABLE, 0);
3520 WREG32(CGTS_TCC_DISABLE, 0);
3521 WREG32(CGTS_USER_SYS_TCC_DISABLE, 0);
3522 WREG32(CGTS_USER_TCC_DISABLE, 0);
3523
3524 /* set HW defaults for 3D engine */
3525 WREG32(CP_QUEUE_THRESHOLDS, (ROQ_IB1_START(0x16) |
3526 ROQ_IB2_START(0x2b)));
3527
3528 WREG32(CP_MEQ_THRESHOLDS, STQ_SPLIT(0x30));
3529
3530 WREG32(TA_CNTL_AUX, (DISABLE_CUBE_ANISO |
3531 SYNC_GRADIENT |
3532 SYNC_WALKER |
3533 SYNC_ALIGNER));
3534
3535 sx_debug_1 = RREG32(SX_DEBUG_1);
3536 sx_debug_1 |= ENABLE_NEW_SMX_ADDRESS;
3537 WREG32(SX_DEBUG_1, sx_debug_1);
3538 
3540 smx_dc_ctl0 = RREG32(SMX_DC_CTL0);
3541 smx_dc_ctl0 &= ~NUMBER_OF_SETS(0x1ff);
3542 smx_dc_ctl0 |= NUMBER_OF_SETS(rdev->config.evergreen.sx_num_of_sets);
3543 WREG32(SMX_DC_CTL0, smx_dc_ctl0);
3544
3545 if (rdev->family <= CHIP_SUMO2)
3546 WREG32(SMX_SAR_CTL0, 0x00010000);
3547
3548 WREG32(SX_EXPORT_BUFFER_SIZES, (COLOR_BUFFER_SIZE((rdev->config.evergreen.sx_max_export_size / 4) - 1) |
3549 POSITION_BUFFER_SIZE((rdev->config.evergreen.sx_max_export_pos_size / 4) - 1) |
3550 SMX_BUFFER_SIZE((rdev->config.evergreen.sx_max_export_smx_size / 4) - 1)));
3551
3552 WREG32(PA_SC_FIFO_SIZE, (SC_PRIM_FIFO_SIZE(rdev->config.evergreen.sc_prim_fifo_size) |
3553 SC_HIZ_TILE_FIFO_SIZE(rdev->config.evergreen.sc_hiz_tile_fifo_size) |
3554 SC_EARLYZ_TILE_FIFO_SIZE(rdev->config.evergreen.sc_earlyz_tile_fifo_size)));
3555
3556 WREG32(VGT_NUM_INSTANCES, 1);
3557 WREG32(SPI_CONFIG_CNTL, 0);
3558 WREG32(SPI_CONFIG_CNTL_1, VTX_DONE_DELAY(4));
3559 WREG32(CP_PERFMON_CNTL, 0);
3560
3561 WREG32(SQ_MS_FIFO_SIZES, (CACHE_FIFO_SIZE(16 * rdev->config.evergreen.sq_num_cf_insts) |
3562 FETCH_FIFO_HIWATER(0x4) |
3563 DONE_FIFO_HIWATER(0xe0) |
3564 ALU_UPDATE_FIFO_HIWATER(0x8)));
3565
3566 sq_config = RREG32(SQ_CONFIG);
3567 sq_config &= ~(PS_PRIO(3) |
3568 VS_PRIO(3) |
3569 GS_PRIO(3) |
3570 ES_PRIO(3));
3571 sq_config |= (VC_ENABLE |
3572 EXPORT_SRC_C |
3573 PS_PRIO(0) |
3574 VS_PRIO(1) |
3575 GS_PRIO(2) |
3576 ES_PRIO(3));
3577
3578 switch (rdev->family) {
3579 case CHIP_CEDAR:
3580 case CHIP_PALM:
3581 case CHIP_SUMO:
3582 case CHIP_SUMO2:
3583 case CHIP_CAICOS:
3584 /* no vertex cache */
3585 sq_config &= ~VC_ENABLE;
3586 break;
3587 default:
3588 break;
3589 }
3590
3591 sq_lds_resource_mgmt = RREG32(SQ_LDS_RESOURCE_MGMT);
3592
3593 	sq_gpr_resource_mgmt_1 = NUM_PS_GPRS((rdev->config.evergreen.max_gprs - (4 * 2)) * 12 / 32);
3594 sq_gpr_resource_mgmt_1 |= NUM_VS_GPRS((rdev->config.evergreen.max_gprs - (4 * 2)) * 6 / 32);
3595 sq_gpr_resource_mgmt_1 |= NUM_CLAUSE_TEMP_GPRS(4);
3596 sq_gpr_resource_mgmt_2 = NUM_GS_GPRS((rdev->config.evergreen.max_gprs - (4 * 2)) * 4 / 32);
3597 sq_gpr_resource_mgmt_2 |= NUM_ES_GPRS((rdev->config.evergreen.max_gprs - (4 * 2)) * 4 / 32);
3598 sq_gpr_resource_mgmt_3 = NUM_HS_GPRS((rdev->config.evergreen.max_gprs - (4 * 2)) * 3 / 32);
3599 sq_gpr_resource_mgmt_3 |= NUM_LS_GPRS((rdev->config.evergreen.max_gprs - (4 * 2)) * 3 / 32);
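/* Eight GPRs (4 clause temps * 2) are reserved up front; the rest is split
 * PS:VS:GS:ES:HS:LS = 12:6:4:4:3:3 in 32nds, e.g. with max_gprs = 256 that
 * is 248 * 12 / 32 = 93 PS and 248 * 6 / 32 = 46 VS GPRs
 * (illustrative arithmetic). */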
3600
3601 switch (rdev->family) {
3602 case CHIP_CEDAR:
3603 case CHIP_PALM:
3604 case CHIP_SUMO:
3605 case CHIP_SUMO2:
3606 ps_thread_count = 96;
3607 break;
3608 default:
3609 ps_thread_count = 128;
3610 break;
3611 }
3612
3613 sq_thread_resource_mgmt = NUM_PS_THREADS(ps_thread_count);
3614 sq_thread_resource_mgmt |= NUM_VS_THREADS((((rdev->config.evergreen.max_threads - ps_thread_count) / 6) / 8) * 8);
3615 sq_thread_resource_mgmt |= NUM_GS_THREADS((((rdev->config.evergreen.max_threads - ps_thread_count) / 6) / 8) * 8);
3616 sq_thread_resource_mgmt |= NUM_ES_THREADS((((rdev->config.evergreen.max_threads - ps_thread_count) / 6) / 8) * 8);
3617 sq_thread_resource_mgmt_2 = NUM_HS_THREADS((((rdev->config.evergreen.max_threads - ps_thread_count) / 6) / 8) * 8);
3618 sq_thread_resource_mgmt_2 |= NUM_LS_THREADS((((rdev->config.evergreen.max_threads - ps_thread_count) / 6) / 8) * 8);
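/* The PS pool is fixed; each remaining stage gets (max_threads -
 * ps_thread_count) / 6 threads rounded down to a multiple of 8, e.g.
 * (248 - 128) / 6 = 20 -> 16 threads per stage (illustrative arithmetic). */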
3619
3620 sq_stack_resource_mgmt_1 = NUM_PS_STACK_ENTRIES((rdev->config.evergreen.max_stack_entries * 1) / 6);
3621 sq_stack_resource_mgmt_1 |= NUM_VS_STACK_ENTRIES((rdev->config.evergreen.max_stack_entries * 1) / 6);
3622 sq_stack_resource_mgmt_2 = NUM_GS_STACK_ENTRIES((rdev->config.evergreen.max_stack_entries * 1) / 6);
3623 sq_stack_resource_mgmt_2 |= NUM_ES_STACK_ENTRIES((rdev->config.evergreen.max_stack_entries * 1) / 6);
3624 sq_stack_resource_mgmt_3 = NUM_HS_STACK_ENTRIES((rdev->config.evergreen.max_stack_entries * 1) / 6);
3625 sq_stack_resource_mgmt_3 |= NUM_LS_STACK_ENTRIES((rdev->config.evergreen.max_stack_entries * 1) / 6);
3626
3627 WREG32(SQ_CONFIG, sq_config);
3628 WREG32(SQ_GPR_RESOURCE_MGMT_1, sq_gpr_resource_mgmt_1);
3629 WREG32(SQ_GPR_RESOURCE_MGMT_2, sq_gpr_resource_mgmt_2);
3630 WREG32(SQ_GPR_RESOURCE_MGMT_3, sq_gpr_resource_mgmt_3);
3631 WREG32(SQ_THREAD_RESOURCE_MGMT, sq_thread_resource_mgmt);
3632 WREG32(SQ_THREAD_RESOURCE_MGMT_2, sq_thread_resource_mgmt_2);
3633 WREG32(SQ_STACK_RESOURCE_MGMT_1, sq_stack_resource_mgmt_1);
3634 WREG32(SQ_STACK_RESOURCE_MGMT_2, sq_stack_resource_mgmt_2);
3635 WREG32(SQ_STACK_RESOURCE_MGMT_3, sq_stack_resource_mgmt_3);
3636 WREG32(SQ_DYN_GPR_CNTL_PS_FLUSH_REQ, 0);
3637 WREG32(SQ_LDS_RESOURCE_MGMT, sq_lds_resource_mgmt);
3638
3639 WREG32(PA_SC_FORCE_EOV_MAX_CNTS, (FORCE_EOV_MAX_CLK_CNT(4095) |
3640 FORCE_EOV_MAX_REZ_CNT(255)));
3641
3642 switch (rdev->family) {
3643 case CHIP_CEDAR:
3644 case CHIP_PALM:
3645 case CHIP_SUMO:
3646 case CHIP_SUMO2:
3647 case CHIP_CAICOS:
3648 vgt_cache_invalidation = CACHE_INVALIDATION(TC_ONLY);
3649 break;
3650 default:
3651 vgt_cache_invalidation = CACHE_INVALIDATION(VC_AND_TC);
3652 break;
3653 }
3654 vgt_cache_invalidation |= AUTO_INVLD_EN(ES_AND_GS_AUTO);
3655 WREG32(VGT_CACHE_INVALIDATION, vgt_cache_invalidation);
3656
3657 WREG32(VGT_GS_VERTEX_REUSE, 16);
3658 WREG32(PA_SU_LINE_STIPPLE_VALUE, 0);
3659 WREG32(PA_SC_LINE_STIPPLE_STATE, 0);
3660
3661 WREG32(VGT_VERTEX_REUSE_BLOCK_CNTL, 14);
3662 WREG32(VGT_OUT_DEALLOC_CNTL, 16);
3663
3664 WREG32(CB_PERF_CTR0_SEL_0, 0);
3665 WREG32(CB_PERF_CTR0_SEL_1, 0);
3666 WREG32(CB_PERF_CTR1_SEL_0, 0);
3667 WREG32(CB_PERF_CTR1_SEL_1, 0);
3668 WREG32(CB_PERF_CTR2_SEL_0, 0);
3669 WREG32(CB_PERF_CTR2_SEL_1, 0);
3670 WREG32(CB_PERF_CTR3_SEL_0, 0);
3671 WREG32(CB_PERF_CTR3_SEL_1, 0);
3672
3673 /* clear render buffer base addresses */
3674 WREG32(CB_COLOR0_BASE, 0);
3675 WREG32(CB_COLOR1_BASE, 0);
3676 WREG32(CB_COLOR2_BASE, 0);
3677 WREG32(CB_COLOR3_BASE, 0);
3678 WREG32(CB_COLOR4_BASE, 0);
3679 WREG32(CB_COLOR5_BASE, 0);
3680 WREG32(CB_COLOR6_BASE, 0);
3681 WREG32(CB_COLOR7_BASE, 0);
3682 WREG32(CB_COLOR8_BASE, 0);
3683 WREG32(CB_COLOR9_BASE, 0);
3684 WREG32(CB_COLOR10_BASE, 0);
3685 WREG32(CB_COLOR11_BASE, 0);
3686
3687 /* set the shader const cache sizes to 0 */
3688 for (i = SQ_ALU_CONST_BUFFER_SIZE_PS_0; i < 0x28200; i += 4)
3689 WREG32(i, 0);
3690 for (i = SQ_ALU_CONST_BUFFER_SIZE_HS_0; i < 0x29000; i += 4)
3691 WREG32(i, 0);
3692
3693 tmp = RREG32(HDP_MISC_CNTL);
3694 tmp |= HDP_FLUSH_INVALIDATE_CACHE;
3695 WREG32(HDP_MISC_CNTL, tmp);
3696
3697 hdp_host_path_cntl = RREG32(HDP_HOST_PATH_CNTL);
3698 WREG32(HDP_HOST_PATH_CNTL, hdp_host_path_cntl);
3699
3700 WREG32(PA_CL_ENHANCE, CLIP_VTX_REORDER_ENA | NUM_CLIP_SEQ(3));
3701
3702 udelay(50);
3704 }
3705
3706 int evergreen_mc_init(struct radeon_device *rdev)
3707 {
3708 u32 tmp;
3709 int chansize, numchan;
3710
3711 	/* Get VRAM information */
3712 rdev->mc.vram_is_ddr = true;
3713 if ((rdev->family == CHIP_PALM) ||
3714 (rdev->family == CHIP_SUMO) ||
3715 (rdev->family == CHIP_SUMO2))
3716 tmp = RREG32(FUS_MC_ARB_RAMCFG);
3717 else
3718 tmp = RREG32(MC_ARB_RAMCFG);
3719 if (tmp & CHANSIZE_OVERRIDE) {
3720 chansize = 16;
3721 } else if (tmp & CHANSIZE_MASK) {
3722 chansize = 64;
3723 } else {
3724 chansize = 32;
3725 }
3726 tmp = RREG32(MC_SHARED_CHMAP);
3727 switch ((tmp & NOOFCHAN_MASK) >> NOOFCHAN_SHIFT) {
3728 case 0:
3729 default:
3730 numchan = 1;
3731 break;
3732 case 1:
3733 numchan = 2;
3734 break;
3735 case 2:
3736 numchan = 4;
3737 break;
3738 case 3:
3739 numchan = 8;
3740 break;
3741 }
3742 rdev->mc.vram_width = numchan * chansize;
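/* e.g. two channels of 64 bits each report as a 128-bit VRAM interface
 * (illustrative). */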
3743 	/* Could the aperture size report 0? */
3744 rdev->mc.aper_base = pci_resource_start(rdev->pdev, 0);
3745 rdev->mc.aper_size = pci_resource_len(rdev->pdev, 0);
3746 /* Setup GPU memory space */
3747 if ((rdev->family == CHIP_PALM) ||
3748 (rdev->family == CHIP_SUMO) ||
3749 (rdev->family == CHIP_SUMO2)) {
3750 /* size in bytes on fusion */
3751 rdev->mc.mc_vram_size = RREG32(CONFIG_MEMSIZE);
3752 rdev->mc.real_vram_size = RREG32(CONFIG_MEMSIZE);
3753 } else {
3754 /* size in MB on evergreen/cayman/tn */
3755 rdev->mc.mc_vram_size = RREG32(CONFIG_MEMSIZE) * 1024ULL * 1024ULL;
3756 rdev->mc.real_vram_size = RREG32(CONFIG_MEMSIZE) * 1024ULL * 1024ULL;
3757 }
3758 rdev->mc.visible_vram_size = rdev->mc.aper_size;
3759 r700_vram_gtt_location(rdev, &rdev->mc);
3760 radeon_update_bandwidth_info(rdev);
3761
3762 return 0;
3763 }
3764
3765 void evergreen_print_gpu_status_regs(struct radeon_device *rdev)
3766 {
3767 dev_info(rdev->dev, " GRBM_STATUS = 0x%08X\n",
3768 RREG32(GRBM_STATUS));
3769 dev_info(rdev->dev, " GRBM_STATUS_SE0 = 0x%08X\n",
3770 RREG32(GRBM_STATUS_SE0));
3771 dev_info(rdev->dev, " GRBM_STATUS_SE1 = 0x%08X\n",
3772 RREG32(GRBM_STATUS_SE1));
3773 dev_info(rdev->dev, " SRBM_STATUS = 0x%08X\n",
3774 RREG32(SRBM_STATUS));
3775 dev_info(rdev->dev, " SRBM_STATUS2 = 0x%08X\n",
3776 RREG32(SRBM_STATUS2));
3777 dev_info(rdev->dev, " R_008674_CP_STALLED_STAT1 = 0x%08X\n",
3778 RREG32(CP_STALLED_STAT1));
3779 dev_info(rdev->dev, " R_008678_CP_STALLED_STAT2 = 0x%08X\n",
3780 RREG32(CP_STALLED_STAT2));
3781 dev_info(rdev->dev, " R_00867C_CP_BUSY_STAT = 0x%08X\n",
3782 RREG32(CP_BUSY_STAT));
3783 dev_info(rdev->dev, " R_008680_CP_STAT = 0x%08X\n",
3784 RREG32(CP_STAT));
3785 dev_info(rdev->dev, " R_00D034_DMA_STATUS_REG = 0x%08X\n",
3786 RREG32(DMA_STATUS_REG));
3787 if (rdev->family >= CHIP_CAYMAN) {
3788 dev_info(rdev->dev, " R_00D834_DMA_STATUS_REG = 0x%08X\n",
3789 RREG32(DMA_STATUS_REG + 0x800));
3790 }
3791 }
3792
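/* A CRTC is treated as hung when its HV counter stops advancing: sample the
 * counter of every enabled CRTC, then re-check up to ten times at 100us
 * intervals and clear each CRTC whose count has changed (summary of the
 * logic below, added for clarity). */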
3793 bool evergreen_is_display_hung(struct radeon_device *rdev)
3794 {
3795 u32 crtc_hung = 0;
3796 u32 crtc_status[6];
3797 u32 i, j, tmp;
3798
3799 for (i = 0; i < rdev->num_crtc; i++) {
3800 if (RREG32(EVERGREEN_CRTC_CONTROL + crtc_offsets[i]) & EVERGREEN_CRTC_MASTER_EN) {
3801 crtc_status[i] = RREG32(EVERGREEN_CRTC_STATUS_HV_COUNT + crtc_offsets[i]);
3802 crtc_hung |= (1 << i);
3803 }
3804 }
3805
3806 for (j = 0; j < 10; j++) {
3807 for (i = 0; i < rdev->num_crtc; i++) {
3808 if (crtc_hung & (1 << i)) {
3809 tmp = RREG32(EVERGREEN_CRTC_STATUS_HV_COUNT + crtc_offsets[i]);
3810 if (tmp != crtc_status[i])
3811 crtc_hung &= ~(1 << i);
3812 }
3813 }
3814 if (crtc_hung == 0)
3815 return false;
3816 udelay(100);
3817 }
3818
3819 return true;
3820 }
3821
3822 u32 evergreen_gpu_check_soft_reset(struct radeon_device *rdev)
3823 {
3824 u32 reset_mask = 0;
3825 u32 tmp;
3826
3827 /* GRBM_STATUS */
3828 tmp = RREG32(GRBM_STATUS);
3829 if (tmp & (PA_BUSY | SC_BUSY |
3830 SH_BUSY | SX_BUSY |
3831 TA_BUSY | VGT_BUSY |
3832 DB_BUSY | CB_BUSY |
3833 SPI_BUSY | VGT_BUSY_NO_DMA))
3834 reset_mask |= RADEON_RESET_GFX;
3835
3836 if (tmp & (CF_RQ_PENDING | PF_RQ_PENDING |
3837 CP_BUSY | CP_COHERENCY_BUSY))
3838 reset_mask |= RADEON_RESET_CP;
3839
3840 if (tmp & GRBM_EE_BUSY)
3841 reset_mask |= RADEON_RESET_GRBM | RADEON_RESET_GFX | RADEON_RESET_CP;
3842
3843 /* DMA_STATUS_REG */
3844 tmp = RREG32(DMA_STATUS_REG);
3845 if (!(tmp & DMA_IDLE))
3846 reset_mask |= RADEON_RESET_DMA;
3847
3848 /* SRBM_STATUS2 */
3849 tmp = RREG32(SRBM_STATUS2);
3850 if (tmp & DMA_BUSY)
3851 reset_mask |= RADEON_RESET_DMA;
3852
3853 /* SRBM_STATUS */
3854 tmp = RREG32(SRBM_STATUS);
3855 if (tmp & (RLC_RQ_PENDING | RLC_BUSY))
3856 reset_mask |= RADEON_RESET_RLC;
3857
3858 if (tmp & IH_BUSY)
3859 reset_mask |= RADEON_RESET_IH;
3860
3861 if (tmp & SEM_BUSY)
3862 reset_mask |= RADEON_RESET_SEM;
3863
3864 if (tmp & GRBM_RQ_PENDING)
3865 reset_mask |= RADEON_RESET_GRBM;
3866
3867 if (tmp & VMC_BUSY)
3868 reset_mask |= RADEON_RESET_VMC;
3869
3870 if (tmp & (MCB_BUSY | MCB_NON_DISPLAY_BUSY |
3871 MCC_BUSY | MCD_BUSY))
3872 reset_mask |= RADEON_RESET_MC;
3873
3874 if (evergreen_is_display_hung(rdev))
3875 reset_mask |= RADEON_RESET_DISPLAY;
3876
3877 /* VM_L2_STATUS */
3878 tmp = RREG32(VM_L2_STATUS);
3879 if (tmp & L2_BUSY)
3880 reset_mask |= RADEON_RESET_VMC;
3881
3882 	/* Skip MC reset as it's most likely not hung, just busy */
3883 if (reset_mask & RADEON_RESET_MC) {
3884 DRM_DEBUG("MC busy: 0x%08X, clearing.\n", reset_mask);
3885 reset_mask &= ~RADEON_RESET_MC;
3886 }
3887
3888 return reset_mask;
3889 }
3890
3891 static void evergreen_gpu_soft_reset(struct radeon_device *rdev, u32 reset_mask)
3892 {
3893 struct evergreen_mc_save save;
3894 u32 grbm_soft_reset = 0, srbm_soft_reset = 0;
3895 u32 tmp;
3896
3897 if (reset_mask == 0)
3898 return;
3899
3900 dev_info(rdev->dev, "GPU softreset: 0x%08X\n", reset_mask);
3901
3902 evergreen_print_gpu_status_regs(rdev);
3903
3904 /* Disable CP parsing/prefetching */
3905 WREG32(CP_ME_CNTL, CP_ME_HALT | CP_PFP_HALT);
3906
3907 if (reset_mask & RADEON_RESET_DMA) {
3908 /* Disable DMA */
3909 tmp = RREG32(DMA_RB_CNTL);
3910 tmp &= ~DMA_RB_ENABLE;
3911 WREG32(DMA_RB_CNTL, tmp);
3912 }
3913
3914 udelay(50);
3915
3916 evergreen_mc_stop(rdev, &save);
3917 if (evergreen_mc_wait_for_idle(rdev)) {
3918 		dev_warn(rdev->dev, "Wait for MC idle timed out!\n");
3919 }
3920
3921 if (reset_mask & (RADEON_RESET_GFX | RADEON_RESET_COMPUTE)) {
3922 grbm_soft_reset |= SOFT_RESET_DB |
3923 SOFT_RESET_CB |
3924 SOFT_RESET_PA |
3925 SOFT_RESET_SC |
3926 SOFT_RESET_SPI |
3927 SOFT_RESET_SX |
3928 SOFT_RESET_SH |
3929 SOFT_RESET_TC |
3930 SOFT_RESET_TA |
3931 SOFT_RESET_VC |
3932 SOFT_RESET_VGT;
3933 }
3934
3935 if (reset_mask & RADEON_RESET_CP) {
3936 grbm_soft_reset |= SOFT_RESET_CP |
3937 SOFT_RESET_VGT;
3938
3939 srbm_soft_reset |= SOFT_RESET_GRBM;
3940 }
3941
3942 if (reset_mask & RADEON_RESET_DMA)
3943 srbm_soft_reset |= SOFT_RESET_DMA;
3944
3945 if (reset_mask & RADEON_RESET_DISPLAY)
3946 srbm_soft_reset |= SOFT_RESET_DC;
3947
3948 if (reset_mask & RADEON_RESET_RLC)
3949 srbm_soft_reset |= SOFT_RESET_RLC;
3950
3951 if (reset_mask & RADEON_RESET_SEM)
3952 srbm_soft_reset |= SOFT_RESET_SEM;
3953
3954 if (reset_mask & RADEON_RESET_IH)
3955 srbm_soft_reset |= SOFT_RESET_IH;
3956
3957 if (reset_mask & RADEON_RESET_GRBM)
3958 srbm_soft_reset |= SOFT_RESET_GRBM;
3959
3960 if (reset_mask & RADEON_RESET_VMC)
3961 srbm_soft_reset |= SOFT_RESET_VMC;
3962
3963 if (!(rdev->flags & RADEON_IS_IGP)) {
3964 if (reset_mask & RADEON_RESET_MC)
3965 srbm_soft_reset |= SOFT_RESET_MC;
3966 }
3967
3968 if (grbm_soft_reset) {
3969 tmp = RREG32(GRBM_SOFT_RESET);
3970 tmp |= grbm_soft_reset;
3971 dev_info(rdev->dev, "GRBM_SOFT_RESET=0x%08X\n", tmp);
3972 WREG32(GRBM_SOFT_RESET, tmp);
3973 tmp = RREG32(GRBM_SOFT_RESET);
3974
3975 udelay(50);
3976
3977 tmp &= ~grbm_soft_reset;
3978 WREG32(GRBM_SOFT_RESET, tmp);
3979 tmp = RREG32(GRBM_SOFT_RESET);
3980 }
3981
3982 if (srbm_soft_reset) {
3983 tmp = RREG32(SRBM_SOFT_RESET);
3984 tmp |= srbm_soft_reset;
3985 dev_info(rdev->dev, "SRBM_SOFT_RESET=0x%08X\n", tmp);
3986 WREG32(SRBM_SOFT_RESET, tmp);
3987 tmp = RREG32(SRBM_SOFT_RESET);
3988
3989 udelay(50);
3990
3991 tmp &= ~srbm_soft_reset;
3992 WREG32(SRBM_SOFT_RESET, tmp);
3993 tmp = RREG32(SRBM_SOFT_RESET);
3994 }
3995
3996 /* Wait a little for things to settle down */
3997 udelay(50);
3998
3999 evergreen_mc_resume(rdev, &save);
4000 udelay(50);
4001
4002 evergreen_print_gpu_status_regs(rdev);
4003 }
4004
4005 void evergreen_gpu_pci_config_reset(struct radeon_device *rdev)
4006 {
4007 struct evergreen_mc_save save;
4008 u32 tmp, i;
4009
4010 dev_info(rdev->dev, "GPU pci config reset\n");
4011
4012 /* disable dpm? */
4013
4014 /* Disable CP parsing/prefetching */
4015 WREG32(CP_ME_CNTL, CP_ME_HALT | CP_PFP_HALT);
4016 udelay(50);
4017 /* Disable DMA */
4018 tmp = RREG32(DMA_RB_CNTL);
4019 tmp &= ~DMA_RB_ENABLE;
4020 WREG32(DMA_RB_CNTL, tmp);
4021 /* XXX other engines? */
4022
4023 /* halt the rlc */
4024 r600_rlc_stop(rdev);
4025
4026 udelay(50);
4027
4028 /* set mclk/sclk to bypass */
4029 rv770_set_clk_bypass_mode(rdev);
4030 /* disable BM */
4031 pci_clear_master(rdev->pdev);
4032 /* disable mem access */
4033 evergreen_mc_stop(rdev, &save);
4034 if (evergreen_mc_wait_for_idle(rdev)) {
4035 		dev_warn(rdev->dev, "Wait for MC idle timed out!\n");
4036 }
4037 /* reset */
4038 radeon_pci_config_reset(rdev);
4039 /* wait for asic to come out of reset */
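/* while held in reset the ASIC reads back as all 1s, so a sane
 * CONFIG_MEMSIZE value below signals that the reset has completed
 * (reading of the check below, added for clarity). */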
4040 for (i = 0; i < rdev->usec_timeout; i++) {
4041 if (RREG32(CONFIG_MEMSIZE) != 0xffffffff)
4042 break;
4043 udelay(1);
4044 }
4045 }
4046
4047 int evergreen_asic_reset(struct radeon_device *rdev, bool hard)
4048 {
4049 u32 reset_mask;
4050
4051 if (hard) {
4052 evergreen_gpu_pci_config_reset(rdev);
4053 return 0;
4054 }
4055
4056 reset_mask = evergreen_gpu_check_soft_reset(rdev);
4057
4058 if (reset_mask)
4059 r600_set_bios_scratch_engine_hung(rdev, true);
4060
4061 /* try soft reset */
4062 evergreen_gpu_soft_reset(rdev, reset_mask);
4063
4064 reset_mask = evergreen_gpu_check_soft_reset(rdev);
4065
4066 /* try pci config reset */
4067 if (reset_mask && radeon_hard_reset)
4068 evergreen_gpu_pci_config_reset(rdev);
4069
4070 reset_mask = evergreen_gpu_check_soft_reset(rdev);
4071
4072 if (!reset_mask)
4073 r600_set_bios_scratch_engine_hung(rdev, false);
4074
4075 return 0;
4076 }
4077
4078 /**
4079 * evergreen_gfx_is_lockup - Check if the GFX engine is locked up
4080 *
4081 * @rdev: radeon_device pointer
4082 * @ring: radeon_ring structure holding ring information
4083 *
4084 * Check if the GFX engine is locked up.
4085 * Returns true if the engine appears to be locked up, false if not.
4086 */
4087 bool evergreen_gfx_is_lockup(struct radeon_device *rdev, struct radeon_ring *ring)
4088 {
4089 u32 reset_mask = evergreen_gpu_check_soft_reset(rdev);
4090
4091 if (!(reset_mask & (RADEON_RESET_GFX |
4092 RADEON_RESET_COMPUTE |
4093 RADEON_RESET_CP))) {
4094 radeon_ring_lockup_update(rdev, ring);
4095 return false;
4096 }
4097 return radeon_ring_test_lockup(rdev, ring);
4098 }
4099
4100 /*
4101 * RLC
4102 */
4103 #define RLC_SAVE_RESTORE_LIST_END_MARKER 0x00000000
4104 #define RLC_CLEAR_STATE_END_MARKER 0x00000001
4105
4106 void sumo_rlc_fini(struct radeon_device *rdev)
4107 {
4108 int r;
4109
4110 /* save restore block */
4111 if (rdev->rlc.save_restore_obj) {
4112 r = radeon_bo_reserve(rdev->rlc.save_restore_obj, false);
4113 if (unlikely(r != 0))
4114 dev_warn(rdev->dev, "(%d) reserve RLC sr bo failed\n", r);
4115 radeon_bo_unpin(rdev->rlc.save_restore_obj);
4116 radeon_bo_unreserve(rdev->rlc.save_restore_obj);
4117
4118 radeon_bo_unref(&rdev->rlc.save_restore_obj);
4119 rdev->rlc.save_restore_obj = NULL;
4120 }
4121
4122 /* clear state block */
4123 if (rdev->rlc.clear_state_obj) {
4124 r = radeon_bo_reserve(rdev->rlc.clear_state_obj, false);
4125 if (unlikely(r != 0))
4126 dev_warn(rdev->dev, "(%d) reserve RLC c bo failed\n", r);
4127 radeon_bo_unpin(rdev->rlc.clear_state_obj);
4128 radeon_bo_unreserve(rdev->rlc.clear_state_obj);
4129
4130 radeon_bo_unref(&rdev->rlc.clear_state_obj);
4131 rdev->rlc.clear_state_obj = NULL;
4132 }
4133
4134 	/* cp table block */
4135 if (rdev->rlc.cp_table_obj) {
4136 r = radeon_bo_reserve(rdev->rlc.cp_table_obj, false);
4137 if (unlikely(r != 0))
4138 dev_warn(rdev->dev, "(%d) reserve RLC cp table bo failed\n", r);
4139 radeon_bo_unpin(rdev->rlc.cp_table_obj);
4140 radeon_bo_unreserve(rdev->rlc.cp_table_obj);
4141
4142 radeon_bo_unref(&rdev->rlc.cp_table_obj);
4143 rdev->rlc.cp_table_obj = NULL;
4144 }
4145 }
4146
4147 #define CP_ME_TABLE_SIZE 96
4148
4149 int sumo_rlc_init(struct radeon_device *rdev)
4150 {
4151 const u32 *src_ptr;
4152 volatile u32 *dst_ptr;
4153 u32 dws, data, i, j, k, reg_num;
4154 u32 reg_list_num, reg_list_hdr_blk_index, reg_list_blk_index = 0;
4155 u64 reg_list_mc_addr;
4156 const struct cs_section_def *cs_data;
4157 int r;
4158
4159 src_ptr = rdev->rlc.reg_list;
4160 dws = rdev->rlc.reg_list_size;
4161 if (rdev->family >= CHIP_BONAIRE) {
4162 dws += (5 * 16) + 48 + 48 + 64;
4163 }
4164 cs_data = rdev->rlc.cs_data;
4165
4166 if (src_ptr) {
4167 /* save restore block */
4168 if (rdev->rlc.save_restore_obj == NULL) {
4169 r = radeon_bo_create(rdev, dws * 4, PAGE_SIZE, true,
4170 RADEON_GEM_DOMAIN_VRAM, 0, NULL,
4171 NULL, &rdev->rlc.save_restore_obj);
4172 if (r) {
4173 dev_warn(rdev->dev, "(%d) create RLC sr bo failed\n", r);
4174 return r;
4175 }
4176 }
4177
4178 r = radeon_bo_reserve(rdev->rlc.save_restore_obj, false);
4179 if (unlikely(r != 0)) {
4180 sumo_rlc_fini(rdev);
4181 return r;
4182 }
4183 r = radeon_bo_pin(rdev->rlc.save_restore_obj, RADEON_GEM_DOMAIN_VRAM,
4184 &rdev->rlc.save_restore_gpu_addr);
4185 if (r) {
4186 radeon_bo_unreserve(rdev->rlc.save_restore_obj);
4187 dev_warn(rdev->dev, "(%d) pin RLC sr bo failed\n", r);
4188 sumo_rlc_fini(rdev);
4189 return r;
4190 }
4191
4192 r = radeon_bo_kmap(rdev->rlc.save_restore_obj, (void **)&rdev->rlc.sr_ptr);
4193 if (r) {
4194 dev_warn(rdev->dev, "(%d) map RLC sr bo failed\n", r);
4195 sumo_rlc_fini(rdev);
4196 return r;
4197 }
4198 /* write the sr buffer */
4199 dst_ptr = rdev->rlc.sr_ptr;
4200 if (rdev->family >= CHIP_TAHITI) {
4201 /* SI */
4202 for (i = 0; i < rdev->rlc.reg_list_size; i++)
4203 dst_ptr[i] = cpu_to_le32(src_ptr[i]);
4204 } else {
4205 /* ON/LN/TN */
4206 /* format:
4207 * dw0: (reg2 << 16) | reg1
4208 * dw1: reg1 save space
4209 * dw2: reg2 save space
4210 */
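/* Illustrative example: src_ptr = { 0x8000, 0x8004 } packs dword 0 as
 * ((0x8004 >> 2) << 16) | (0x8000 >> 2) = 0x20012000, dwords 1 and 2
 * stay reserved as save space, and the end marker lands at index 3. */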
4211 for (i = 0; i < dws; i++) {
4212 data = src_ptr[i] >> 2;
4213 i++;
4214 if (i < dws)
4215 data |= (src_ptr[i] >> 2) << 16;
4216 j = (((i - 1) * 3) / 2);
4217 dst_ptr[j] = cpu_to_le32(data);
4218 }
4219 j = ((i * 3) / 2);
4220 dst_ptr[j] = cpu_to_le32(RLC_SAVE_RESTORE_LIST_END_MARKER);
4221 }
4222 radeon_bo_kunmap(rdev->rlc.save_restore_obj);
4223 radeon_bo_unreserve(rdev->rlc.save_restore_obj);
4224 }
4225
4226 if (cs_data) {
4227 /* clear state block */
4228 if (rdev->family >= CHIP_BONAIRE) {
4229 rdev->rlc.clear_state_size = dws = cik_get_csb_size(rdev);
4230 } else if (rdev->family >= CHIP_TAHITI) {
4231 rdev->rlc.clear_state_size = si_get_csb_size(rdev);
4232 dws = rdev->rlc.clear_state_size + (256 / 4);
4233 } else {
4234 reg_list_num = 0;
4235 dws = 0;
4236 for (i = 0; cs_data[i].section != NULL; i++) {
4237 for (j = 0; cs_data[i].section[j].extent != NULL; j++) {
4238 reg_list_num++;
4239 dws += cs_data[i].section[j].reg_count;
4240 }
4241 }
4242 reg_list_blk_index = (3 * reg_list_num + 2);
4243 dws += reg_list_blk_index;
4244 rdev->rlc.clear_state_size = dws;
4245 }
4246
4247 if (rdev->rlc.clear_state_obj == NULL) {
4248 r = radeon_bo_create(rdev, dws * 4, PAGE_SIZE, true,
4249 RADEON_GEM_DOMAIN_VRAM, 0, NULL,
4250 NULL, &rdev->rlc.clear_state_obj);
4251 if (r) {
4252 dev_warn(rdev->dev, "(%d) create RLC c bo failed\n", r);
4253 sumo_rlc_fini(rdev);
4254 return r;
4255 }
4256 }
4257 r = radeon_bo_reserve(rdev->rlc.clear_state_obj, false);
4258 if (unlikely(r != 0)) {
4259 sumo_rlc_fini(rdev);
4260 return r;
4261 }
4262 r = radeon_bo_pin(rdev->rlc.clear_state_obj, RADEON_GEM_DOMAIN_VRAM,
4263 &rdev->rlc.clear_state_gpu_addr);
4264 if (r) {
4265 radeon_bo_unreserve(rdev->rlc.clear_state_obj);
4266 dev_warn(rdev->dev, "(%d) pin RLC c bo failed\n", r);
4267 sumo_rlc_fini(rdev);
4268 return r;
4269 }
4270
4271 r = radeon_bo_kmap(rdev->rlc.clear_state_obj, (void **)&rdev->rlc.cs_ptr);
4272 if (r) {
4273 dev_warn(rdev->dev, "(%d) map RLC c bo failed\n", r);
4274 sumo_rlc_fini(rdev);
4275 return r;
4276 }
4277 /* set up the cs buffer */
4278 dst_ptr = rdev->rlc.cs_ptr;
4279 if (rdev->family >= CHIP_BONAIRE) {
4280 cik_get_csb_buffer(rdev, dst_ptr);
4281 } else if (rdev->family >= CHIP_TAHITI) {
4282 reg_list_mc_addr = rdev->rlc.clear_state_gpu_addr + 256;
4283 dst_ptr[0] = cpu_to_le32(upper_32_bits(reg_list_mc_addr));
4284 dst_ptr[1] = cpu_to_le32(lower_32_bits(reg_list_mc_addr));
4285 dst_ptr[2] = cpu_to_le32(rdev->rlc.clear_state_size);
4286 si_get_csb_buffer(rdev, &dst_ptr[(256/4)]);
4287 } else {
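/* Pre-SI clear-state layout, as built below: one dword holding the upper
 * 32 bits of the register-data base, then a three-dword header per
 * register block (base address low, packed register offset,
 * 0x08000000 | byte count), with the raw register values gathered after
 * all the headers. */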
4288 reg_list_hdr_blk_index = 0;
4289 reg_list_mc_addr = rdev->rlc.clear_state_gpu_addr + (reg_list_blk_index * 4);
4290 data = upper_32_bits(reg_list_mc_addr);
4291 dst_ptr[reg_list_hdr_blk_index] = cpu_to_le32(data);
4292 reg_list_hdr_blk_index++;
4293 for (i = 0; cs_data[i].section != NULL; i++) {
4294 for (j = 0; cs_data[i].section[j].extent != NULL; j++) {
4295 reg_num = cs_data[i].section[j].reg_count;
4296 data = reg_list_mc_addr & 0xffffffff;
4297 dst_ptr[reg_list_hdr_blk_index] = cpu_to_le32(data);
4298 reg_list_hdr_blk_index++;
4299
4300 data = (cs_data[i].section[j].reg_index * 4) & 0xffffffff;
4301 dst_ptr[reg_list_hdr_blk_index] = cpu_to_le32(data);
4302 reg_list_hdr_blk_index++;
4303
4304 data = 0x08000000 | (reg_num * 4);
4305 dst_ptr[reg_list_hdr_blk_index] = cpu_to_le32(data);
4306 reg_list_hdr_blk_index++;
4307
4308 for (k = 0; k < reg_num; k++) {
4309 data = cs_data[i].section[j].extent[k];
4310 dst_ptr[reg_list_blk_index + k] = cpu_to_le32(data);
4311 }
4312 reg_list_mc_addr += reg_num * 4;
4313 reg_list_blk_index += reg_num;
4314 }
4315 }
4316 dst_ptr[reg_list_hdr_blk_index] = cpu_to_le32(RLC_CLEAR_STATE_END_MARKER);
4317 }
4318 radeon_bo_kunmap(rdev->rlc.clear_state_obj);
4319 radeon_bo_unreserve(rdev->rlc.clear_state_obj);
4320 }
4321
4322 if (rdev->rlc.cp_table_size) {
4323 if (rdev->rlc.cp_table_obj == NULL) {
4324 r = radeon_bo_create(rdev, rdev->rlc.cp_table_size,
4325 PAGE_SIZE, true,
4326 RADEON_GEM_DOMAIN_VRAM, 0, NULL,
4327 NULL, &rdev->rlc.cp_table_obj);
4328 if (r) {
4329 dev_warn(rdev->dev, "(%d) create RLC cp table bo failed\n", r);
4330 sumo_rlc_fini(rdev);
4331 return r;
4332 }
4333 }
4334
4335 r = radeon_bo_reserve(rdev->rlc.cp_table_obj, false);
4336 if (unlikely(r != 0)) {
4337 dev_warn(rdev->dev, "(%d) reserve RLC cp table bo failed\n", r);
4338 sumo_rlc_fini(rdev);
4339 return r;
4340 }
4341 r = radeon_bo_pin(rdev->rlc.cp_table_obj, RADEON_GEM_DOMAIN_VRAM,
4342 &rdev->rlc.cp_table_gpu_addr);
4343 if (r) {
4344 radeon_bo_unreserve(rdev->rlc.cp_table_obj);
4345 dev_warn(rdev->dev, "(%d) pin RLC cp_table bo failed\n", r);
4346 sumo_rlc_fini(rdev);
4347 return r;
4348 }
4349 r = radeon_bo_kmap(rdev->rlc.cp_table_obj, (void **)&rdev->rlc.cp_table_ptr);
4350 if (r) {
4351 dev_warn(rdev->dev, "(%d) map RLC cp table bo failed\n", r);
4352 sumo_rlc_fini(rdev);
4353 return r;
4354 }
4355
4356 cik_init_cp_pg_table(rdev);
4357
4358 radeon_bo_kunmap(rdev->rlc.cp_table_obj);
4359 radeon_bo_unreserve(rdev->rlc.cp_table_obj);
4361 }
4362
4363 return 0;
4364 }
4365
4366 static void evergreen_rlc_start(struct radeon_device *rdev)
4367 {
4368 u32 mask = RLC_ENABLE;
4369
4370 if (rdev->flags & RADEON_IS_IGP) {
4371 mask |= GFX_POWER_GATING_ENABLE | GFX_POWER_GATING_SRC;
4372 }
4373
4374 WREG32(RLC_CNTL, mask);
4375 }
4376
4377 int evergreen_rlc_resume(struct radeon_device *rdev)
4378 {
4379 u32 i;
4380 const __be32 *fw_data;
4381
4382 if (!rdev->rlc_fw)
4383 return -EINVAL;
4384
4385 r600_rlc_stop(rdev);
4386
4387 WREG32(RLC_HB_CNTL, 0);
4388
4389 if (rdev->flags & RADEON_IS_IGP) {
4390 if (rdev->family == CHIP_ARUBA) {
4391 u32 always_on_bitmap =
4392 3 | (3 << (16 * rdev->config.cayman.max_shader_engines));
4393 /* find out the number of active simds */
4394 u32 tmp = (RREG32(CC_GC_SHADER_PIPE_CONFIG) & 0xffff0000) >> 16;
4395 tmp |= 0xffffffff << rdev->config.cayman.max_simds_per_se;
4396 tmp = hweight32(~tmp);
4397 if (tmp == rdev->config.cayman.max_simds_per_se) {
4398 WREG32(TN_RLC_LB_ALWAYS_ACTIVE_SIMD_MASK, always_on_bitmap);
4399 WREG32(TN_RLC_LB_PARAMS, 0x00601004);
4400 WREG32(TN_RLC_LB_INIT_SIMD_MASK, 0xffffffff);
4401 WREG32(TN_RLC_LB_CNTR_INIT, 0x00000000);
4402 WREG32(TN_RLC_LB_CNTR_MAX, 0x00002000);
4403 }
4404 } else {
4405 WREG32(RLC_HB_WPTR_LSB_ADDR, 0);
4406 WREG32(RLC_HB_WPTR_MSB_ADDR, 0);
4407 }
4408 WREG32(TN_RLC_SAVE_AND_RESTORE_BASE, rdev->rlc.save_restore_gpu_addr >> 8);
4409 WREG32(TN_RLC_CLEAR_STATE_RESTORE_BASE, rdev->rlc.clear_state_gpu_addr >> 8);
4410 } else {
4411 WREG32(RLC_HB_BASE, 0);
4412 WREG32(RLC_HB_RPTR, 0);
4413 WREG32(RLC_HB_WPTR, 0);
4414 WREG32(RLC_HB_WPTR_LSB_ADDR, 0);
4415 WREG32(RLC_HB_WPTR_MSB_ADDR, 0);
4416 }
4417 WREG32(RLC_MC_CNTL, 0);
4418 WREG32(RLC_UCODE_CNTL, 0);
4419
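/* the RLC microcode is stored big-endian in the firmware blob and is
 * uploaded one dword at a time through the RLC_UCODE_ADDR/DATA index
 * pair in the loops below. */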
4420 fw_data = (const __be32 *)rdev->rlc_fw->data;
4421 if (rdev->family >= CHIP_ARUBA) {
4422 for (i = 0; i < ARUBA_RLC_UCODE_SIZE; i++) {
4423 WREG32(RLC_UCODE_ADDR, i);
4424 WREG32(RLC_UCODE_DATA, be32_to_cpup(fw_data++));
4425 }
4426 } else if (rdev->family >= CHIP_CAYMAN) {
4427 for (i = 0; i < CAYMAN_RLC_UCODE_SIZE; i++) {
4428 WREG32(RLC_UCODE_ADDR, i);
4429 WREG32(RLC_UCODE_DATA, be32_to_cpup(fw_data++));
4430 }
4431 } else {
4432 for (i = 0; i < EVERGREEN_RLC_UCODE_SIZE; i++) {
4433 WREG32(RLC_UCODE_ADDR, i);
4434 WREG32(RLC_UCODE_DATA, be32_to_cpup(fw_data++));
4435 }
4436 }
4437 WREG32(RLC_UCODE_ADDR, 0);
4438
4439 evergreen_rlc_start(rdev);
4440
4441 return 0;
4442 }
4443
4444 /* Interrupts */
4445
4446 u32 evergreen_get_vblank_counter(struct radeon_device *rdev, int crtc)
4447 {
4448 if (crtc >= rdev->num_crtc)
4449 return 0;
4450 else
4451 return RREG32(CRTC_STATUS_FRAME_COUNT + crtc_offsets[crtc]);
4452 }
4453
4454 void evergreen_disable_interrupt_state(struct radeon_device *rdev)
4455 {
4456 int i;
4457 u32 tmp;
4458
4459 if (rdev->family >= CHIP_CAYMAN) {
4460 cayman_cp_int_cntl_setup(rdev, 0,
4461 CNTX_BUSY_INT_ENABLE | CNTX_EMPTY_INT_ENABLE);
4462 cayman_cp_int_cntl_setup(rdev, 1, 0);
4463 cayman_cp_int_cntl_setup(rdev, 2, 0);
4464 tmp = RREG32(CAYMAN_DMA1_CNTL) & ~TRAP_ENABLE;
4465 WREG32(CAYMAN_DMA1_CNTL, tmp);
4466 } else
4467 WREG32(CP_INT_CNTL, CNTX_BUSY_INT_ENABLE | CNTX_EMPTY_INT_ENABLE);
4468 tmp = RREG32(DMA_CNTL) & ~TRAP_ENABLE;
4469 WREG32(DMA_CNTL, tmp);
4470 WREG32(GRBM_INT_CNTL, 0);
4471 WREG32(SRBM_INT_CNTL, 0);
4472 for (i = 0; i < rdev->num_crtc; i++)
4473 WREG32(INT_MASK + crtc_offsets[i], 0);
4474 for (i = 0; i < rdev->num_crtc; i++)
4475 WREG32(GRPH_INT_CONTROL + crtc_offsets[i], 0);
4476
4477 /* only one DAC on DCE5 */
4478 if (!ASIC_IS_DCE5(rdev))
4479 WREG32(DACA_AUTODETECT_INT_CONTROL, 0);
4480 WREG32(DACB_AUTODETECT_INT_CONTROL, 0);
4481
4482 for (i = 0; i < 6; i++)
4483 WREG32_AND(DC_HPDx_INT_CONTROL(i), DC_HPDx_INT_POLARITY);
4484 }
4485
4486 /* Note that the order we write back regs here is important */
4487 int evergreen_irq_set(struct radeon_device *rdev)
4488 {
4489 int i;
4490 u32 cp_int_cntl = CNTX_BUSY_INT_ENABLE | CNTX_EMPTY_INT_ENABLE;
4491 u32 cp_int_cntl1 = 0, cp_int_cntl2 = 0;
4492 u32 grbm_int_cntl = 0;
4493 u32 dma_cntl, dma_cntl1 = 0;
4494 u32 thermal_int = 0;
4495
4496 if (!rdev->irq.installed) {
4497 WARN(1, "Can't enable IRQ/MSI because no handler is installed\n");
4498 return -EINVAL;
4499 }
4500 /* don't enable anything if the ih is disabled */
4501 if (!rdev->ih.enabled) {
4502 r600_disable_interrupts(rdev);
4503 /* force the active interrupt state to all disabled */
4504 evergreen_disable_interrupt_state(rdev);
4505 return 0;
4506 }
4507
4508 if (rdev->family == CHIP_ARUBA)
4509 thermal_int = RREG32(TN_CG_THERMAL_INT_CTRL) &
4510 ~(THERM_INT_MASK_HIGH | THERM_INT_MASK_LOW);
4511 else
4512 thermal_int = RREG32(CG_THERMAL_INT) &
4513 ~(THERM_INT_MASK_HIGH | THERM_INT_MASK_LOW);
4514
4515 dma_cntl = RREG32(DMA_CNTL) & ~TRAP_ENABLE;
4516
4517 if (rdev->family >= CHIP_CAYMAN) {
4518 /* enable CP interrupts on all rings */
4519 if (atomic_read(&rdev->irq.ring_int[RADEON_RING_TYPE_GFX_INDEX])) {
4520 DRM_DEBUG("evergreen_irq_set: sw int gfx\n");
4521 cp_int_cntl |= TIME_STAMP_INT_ENABLE;
4522 }
4523 if (atomic_read(&rdev->irq.ring_int[CAYMAN_RING_TYPE_CP1_INDEX])) {
4524 DRM_DEBUG("evergreen_irq_set: sw int cp1\n");
4525 cp_int_cntl1 |= TIME_STAMP_INT_ENABLE;
4526 }
4527 if (atomic_read(&rdev->irq.ring_int[CAYMAN_RING_TYPE_CP2_INDEX])) {
4528 DRM_DEBUG("evergreen_irq_set: sw int cp2\n");
4529 cp_int_cntl2 |= TIME_STAMP_INT_ENABLE;
4530 }
4531 } else {
4532 if (atomic_read(&rdev->irq.ring_int[RADEON_RING_TYPE_GFX_INDEX])) {
4533 DRM_DEBUG("evergreen_irq_set: sw int gfx\n");
4534 cp_int_cntl |= RB_INT_ENABLE;
4535 cp_int_cntl |= TIME_STAMP_INT_ENABLE;
4536 }
4537 }
4538
4539 if (atomic_read(&rdev->irq.ring_int[R600_RING_TYPE_DMA_INDEX])) {
4540 DRM_DEBUG("r600_irq_set: sw int dma\n");
4541 dma_cntl |= TRAP_ENABLE;
4542 }
4543
4544 if (rdev->family >= CHIP_CAYMAN) {
4545 dma_cntl1 = RREG32(CAYMAN_DMA1_CNTL) & ~TRAP_ENABLE;
4546 if (atomic_read(&rdev->irq.ring_int[CAYMAN_RING_TYPE_DMA1_INDEX])) {
4547 DRM_DEBUG("r600_irq_set: sw int dma1\n");
4548 dma_cntl1 |= TRAP_ENABLE;
4549 }
4550 }
4551
4552 if (rdev->irq.dpm_thermal) {
4553 DRM_DEBUG("dpm thermal\n");
4554 thermal_int |= THERM_INT_MASK_HIGH | THERM_INT_MASK_LOW;
4555 }
4556
4557 if (rdev->family >= CHIP_CAYMAN) {
4558 cayman_cp_int_cntl_setup(rdev, 0, cp_int_cntl);
4559 cayman_cp_int_cntl_setup(rdev, 1, cp_int_cntl1);
4560 cayman_cp_int_cntl_setup(rdev, 2, cp_int_cntl2);
4561 } else
4562 WREG32(CP_INT_CNTL, cp_int_cntl);
4563
4564 WREG32(DMA_CNTL, dma_cntl);
4565
4566 if (rdev->family >= CHIP_CAYMAN)
4567 WREG32(CAYMAN_DMA1_CNTL, dma_cntl1);
4568
4569 WREG32(GRBM_INT_CNTL, grbm_int_cntl);
4570
4571 for (i = 0; i < rdev->num_crtc; i++) {
4572 radeon_irq_kms_set_irq_n_enabled(
4573 rdev, INT_MASK + crtc_offsets[i],
4574 VBLANK_INT_MASK,
4575 rdev->irq.crtc_vblank_int[i] ||
4576 atomic_read(&rdev->irq.pflip[i]), "vblank", i);
4577 }
4578
4579 for (i = 0; i < rdev->num_crtc; i++)
4580 WREG32(GRPH_INT_CONTROL + crtc_offsets[i], GRPH_PFLIP_INT_MASK);
4581
4582 for (i = 0; i < 6; i++) {
4583 radeon_irq_kms_set_irq_n_enabled(
4584 rdev, DC_HPDx_INT_CONTROL(i),
4585 DC_HPDx_INT_EN | DC_HPDx_RX_INT_EN,
4586 rdev->irq.hpd[i], "HPD", i);
4587 }
4588
4589 if (rdev->family == CHIP_ARUBA)
4590 WREG32(TN_CG_THERMAL_INT_CTRL, thermal_int);
4591 else
4592 WREG32(CG_THERMAL_INT, thermal_int);
4593
4594 for (i = 0; i < 6; i++) {
4595 radeon_irq_kms_set_irq_n_enabled(
4596 rdev, AFMT_AUDIO_PACKET_CONTROL + crtc_offsets[i],
4597 AFMT_AZ_FORMAT_WTRIG_MASK,
4598 rdev->irq.afmt[i], "HDMI", i);
4599 }
4600
4601 /* posting read */
4602 RREG32(SRBM_STATUS);
4603
4604 return 0;
4605 }
4606
4607 /* Note that the order we write back regs here is important */
4608 static void evergreen_irq_ack(struct radeon_device *rdev)
4609 {
4610 int i, j;
4611 u32 *grph_int = rdev->irq.stat_regs.evergreen.grph_int;
4612 u32 *disp_int = rdev->irq.stat_regs.evergreen.disp_int;
4613 u32 *afmt_status = rdev->irq.stat_regs.evergreen.afmt_status;
4614
4615 for (i = 0; i < 6; i++) {
4616 disp_int[i] = RREG32(evergreen_disp_int_status[i]);
4617 afmt_status[i] = RREG32(AFMT_STATUS + crtc_offsets[i]);
4618 if (i < rdev->num_crtc)
4619 grph_int[i] = RREG32(GRPH_INT_STATUS + crtc_offsets[i]);
4620 }
4621
4622 	/* We write back the interrupt registers in pairs */
4623 for (i = 0; i < rdev->num_crtc; i += 2) {
4624 for (j = i; j < (i + 2); j++) {
4625 if (grph_int[j] & GRPH_PFLIP_INT_OCCURRED)
4626 WREG32(GRPH_INT_STATUS + crtc_offsets[j],
4627 GRPH_PFLIP_INT_CLEAR);
4628 }
4629
4630 for (j = i; j < (i + 2); j++) {
4631 if (disp_int[j] & LB_D1_VBLANK_INTERRUPT)
4632 WREG32(VBLANK_STATUS + crtc_offsets[j],
4633 VBLANK_ACK);
4634 if (disp_int[j] & LB_D1_VLINE_INTERRUPT)
4635 WREG32(VLINE_STATUS + crtc_offsets[j],
4636 VLINE_ACK);
4637 }
4638 }
4639
4640 for (i = 0; i < 6; i++) {
4641 if (disp_int[i] & DC_HPD1_INTERRUPT)
4642 WREG32_OR(DC_HPDx_INT_CONTROL(i), DC_HPDx_INT_ACK);
4643 }
4644
4645 for (i = 0; i < 6; i++) {
4646 if (disp_int[i] & DC_HPD1_RX_INTERRUPT)
4647 WREG32_OR(DC_HPDx_INT_CONTROL(i), DC_HPDx_RX_INT_ACK);
4648 }
4649
4650 for (i = 0; i < 6; i++) {
4651 if (afmt_status[i] & AFMT_AZ_FORMAT_WTRIG)
4652 WREG32_OR(AFMT_AUDIO_PACKET_CONTROL + crtc_offsets[i],
4653 AFMT_AZ_FORMAT_WTRIG_ACK);
4654 }
4655 }
4656
4657 static void evergreen_irq_disable(struct radeon_device *rdev)
4658 {
4659 r600_disable_interrupts(rdev);
4660 /* Wait and acknowledge irq */
4661 mdelay(1);
4662 evergreen_irq_ack(rdev);
4663 evergreen_disable_interrupt_state(rdev);
4664 }
4665
4666 void evergreen_irq_suspend(struct radeon_device *rdev)
4667 {
4668 evergreen_irq_disable(rdev);
4669 r600_rlc_stop(rdev);
4670 }
4671
4672 static u32 evergreen_get_ih_wptr(struct radeon_device *rdev)
4673 {
4674 u32 wptr, tmp;
4675
4676 if (rdev->wb.enabled)
4677 wptr = le32_to_cpu(rdev->wb.wb[R600_WB_IH_WPTR_OFFSET/4]);
4678 else
4679 wptr = RREG32(IH_RB_WPTR);
4680
4681 if (wptr & RB_OVERFLOW) {
4682 wptr &= ~RB_OVERFLOW;
4683 		/* When a ring buffer overflow happens, start parsing the
4684 		 * interrupts from the last vector that was not overwritten
4685 		 * (wptr + 16). Hopefully this allows us to catch up.
4686 		 */
4687 dev_warn(rdev->dev, "IH ring buffer overflow (0x%08X, 0x%08X, 0x%08X)\n",
4688 wptr, rdev->ih.rptr, (wptr + 16) & rdev->ih.ptr_mask);
4689 rdev->ih.rptr = (wptr + 16) & rdev->ih.ptr_mask;
4690 tmp = RREG32(IH_RB_CNTL);
4691 tmp |= IH_WPTR_OVERFLOW_CLEAR;
4692 WREG32(IH_RB_CNTL, tmp);
4693 }
4694 return (wptr & rdev->ih.ptr_mask);
4695 }
4696
4697 int evergreen_irq_process(struct radeon_device *rdev)
4698 {
4699 u32 *disp_int = rdev->irq.stat_regs.evergreen.disp_int;
4700 u32 *afmt_status = rdev->irq.stat_regs.evergreen.afmt_status;
4701 u32 crtc_idx, hpd_idx, afmt_idx;
4702 u32 mask;
4703 u32 wptr;
4704 u32 rptr;
4705 u32 src_id, src_data;
4706 u32 ring_index;
4707 bool queue_hotplug = false;
4708 bool queue_hdmi = false;
4709 bool queue_dp = false;
4710 bool queue_thermal = false;
4711 u32 status, addr;
4712 const char *event_name;
4713
4714 if (!rdev->ih.enabled || rdev->shutdown)
4715 return IRQ_NONE;
4716
4717 wptr = evergreen_get_ih_wptr(rdev);
4718
4719 restart_ih:
4720 /* is somebody else already processing irqs? */
4721 if (atomic_xchg(&rdev->ih.lock, 1))
4722 return IRQ_NONE;
4723
4724 rptr = rdev->ih.rptr;
4725 DRM_DEBUG("evergreen_irq_process start: rptr %d, wptr %d\n", rptr, wptr);
4726
4727 /* Order reading of wptr vs. reading of IH ring data */
4728 rmb();
4729
4730 /* display interrupts */
4731 evergreen_irq_ack(rdev);
4732
4733 while (rptr != wptr) {
4734 /* wptr/rptr are in bytes! */
4735 ring_index = rptr / 4;
4736 src_id = le32_to_cpu(rdev->ih.ring[ring_index]) & 0xff;
4737 src_data = le32_to_cpu(rdev->ih.ring[ring_index + 1]) & 0xfffffff;
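/* each IH vector is 16 bytes (4 dwords); dword 0 carries the source id
 * and dword 1 the source data, which is why rptr advances by 16 at the
 * bottom of this loop (summary added for clarity). */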
4738
4739 switch (src_id) {
4740 case 1: /* D1 vblank/vline */
4741 case 2: /* D2 vblank/vline */
4742 case 3: /* D3 vblank/vline */
4743 case 4: /* D4 vblank/vline */
4744 case 5: /* D5 vblank/vline */
4745 case 6: /* D6 vblank/vline */
4746 crtc_idx = src_id - 1;
4747
4748 if (src_data == 0) { /* vblank */
4749 mask = LB_D1_VBLANK_INTERRUPT;
4750 event_name = "vblank";
4751
4752 if (rdev->irq.crtc_vblank_int[crtc_idx]) {
4753 drm_handle_vblank(rdev->ddev, crtc_idx);
4754 rdev->pm.vblank_sync = true;
4755 wake_up(&rdev->irq.vblank_queue);
4756 }
4757 if (atomic_read(&rdev->irq.pflip[crtc_idx])) {
4758 radeon_crtc_handle_vblank(rdev,
4759 crtc_idx);
4760 }
4761
4762 } else if (src_data == 1) { /* vline */
4763 mask = LB_D1_VLINE_INTERRUPT;
4764 event_name = "vline";
4765 } else {
4766 DRM_DEBUG("Unhandled interrupt: %d %d\n",
4767 src_id, src_data);
4768 break;
4769 }
4770
4771 if (!(disp_int[crtc_idx] & mask)) {
4772 DRM_DEBUG("IH: D%d %s - IH event w/o asserted irq bit?\n",
4773 crtc_idx + 1, event_name);
4774 }
4775
4776 disp_int[crtc_idx] &= ~mask;
4777 DRM_DEBUG("IH: D%d %s\n", crtc_idx + 1, event_name);
4778
4779 break;
4780 case 8: /* D1 page flip */
4781 case 10: /* D2 page flip */
4782 case 12: /* D3 page flip */
4783 case 14: /* D4 page flip */
4784 case 16: /* D5 page flip */
4785 case 18: /* D6 page flip */
4786 DRM_DEBUG("IH: D%d flip\n", ((src_id - 8) >> 1) + 1);
4787 if (radeon_use_pflipirq > 0)
4788 radeon_crtc_handle_flip(rdev, (src_id - 8) >> 1);
4789 break;
4790 case 42: /* HPD hotplug */
4791 if (src_data <= 5) {
4792 hpd_idx = src_data;
4793 mask = DC_HPD1_INTERRUPT;
4794 queue_hotplug = true;
4795 event_name = "HPD";
4796
4797 } else if (src_data <= 11) {
4798 hpd_idx = src_data - 6;
4799 mask = DC_HPD1_RX_INTERRUPT;
4800 queue_dp = true;
4801 event_name = "HPD_RX";
4802
4803 } else {
4804 DRM_DEBUG("Unhandled interrupt: %d %d\n",
4805 src_id, src_data);
4806 break;
4807 }
4808
4809 if (!(disp_int[hpd_idx] & mask))
4810 DRM_DEBUG("IH: IH event w/o asserted irq bit?\n");
4811
4812 disp_int[hpd_idx] &= ~mask;
4813 DRM_DEBUG("IH: %s%d\n", event_name, hpd_idx + 1);
4814
4815 break;
4816 case 44: /* hdmi */
4817 			afmt_idx = src_data;
4818 			/* bounds check must come before afmt_status[] is indexed */
4819 			if (afmt_idx > 5) {
4820 				DRM_ERROR("Unhandled interrupt: %d %d\n",
4821 					  src_id, src_data);
4822 				break;
4823 			}
4824 			if (!(afmt_status[afmt_idx] & AFMT_AZ_FORMAT_WTRIG))
4825 				DRM_DEBUG("IH: IH event w/o asserted irq bit?\n");
4826 			afmt_status[afmt_idx] &= ~AFMT_AZ_FORMAT_WTRIG;
4827 			queue_hdmi = true;
4828 			DRM_DEBUG("IH: HDMI%d\n", afmt_idx + 1);
4829 break;
4830 case 96:
4831 DRM_ERROR("SRBM_READ_ERROR: 0x%x\n", RREG32(SRBM_READ_ERROR));
4832 WREG32(SRBM_INT_ACK, 0x1);
4833 break;
4834 case 124: /* UVD */
4835 DRM_DEBUG("IH: UVD int: 0x%08x\n", src_data);
4836 radeon_fence_process(rdev, R600_RING_TYPE_UVD_INDEX);
4837 break;
4838 case 146:
4839 case 147:
4840 addr = RREG32(VM_CONTEXT1_PROTECTION_FAULT_ADDR);
4841 status = RREG32(VM_CONTEXT1_PROTECTION_FAULT_STATUS);
4842 /* reset addr and status */
4843 WREG32_P(VM_CONTEXT1_CNTL2, 1, ~1);
4844 if (addr == 0x0 && status == 0x0)
4845 break;
4846 dev_err(rdev->dev, "GPU fault detected: %d 0x%08x\n", src_id, src_data);
4847 dev_err(rdev->dev, " VM_CONTEXT1_PROTECTION_FAULT_ADDR 0x%08X\n",
4848 addr);
4849 dev_err(rdev->dev, " VM_CONTEXT1_PROTECTION_FAULT_STATUS 0x%08X\n",
4850 status);
4851 cayman_vm_decode_fault(rdev, status, addr);
4852 break;
4853 case 176: /* CP_INT in ring buffer */
4854 case 177: /* CP_INT in IB1 */
4855 case 178: /* CP_INT in IB2 */
4856 DRM_DEBUG("IH: CP int: 0x%08x\n", src_data);
4857 radeon_fence_process(rdev, RADEON_RING_TYPE_GFX_INDEX);
4858 break;
4859 case 181: /* CP EOP event */
4860 DRM_DEBUG("IH: CP EOP\n");
4861 if (rdev->family >= CHIP_CAYMAN) {
4862 switch (src_data) {
4863 case 0:
4864 radeon_fence_process(rdev, RADEON_RING_TYPE_GFX_INDEX);
4865 break;
4866 case 1:
4867 radeon_fence_process(rdev, CAYMAN_RING_TYPE_CP1_INDEX);
4868 break;
4869 case 2:
4870 radeon_fence_process(rdev, CAYMAN_RING_TYPE_CP2_INDEX);
4871 break;
4872 }
4873 } else
4874 radeon_fence_process(rdev, RADEON_RING_TYPE_GFX_INDEX);
4875 break;
4876 case 224: /* DMA trap event */
4877 DRM_DEBUG("IH: DMA trap\n");
4878 radeon_fence_process(rdev, R600_RING_TYPE_DMA_INDEX);
4879 break;
4880 case 230: /* thermal low to high */
4881 DRM_DEBUG("IH: thermal low to high\n");
4882 rdev->pm.dpm.thermal.high_to_low = false;
4883 queue_thermal = true;
4884 break;
4885 case 231: /* thermal high to low */
4886 DRM_DEBUG("IH: thermal high to low\n");
4887 rdev->pm.dpm.thermal.high_to_low = true;
4888 queue_thermal = true;
4889 break;
4890 case 233: /* GUI IDLE */
4891 DRM_DEBUG("IH: GUI idle\n");
4892 break;
4893 case 244: /* DMA trap event */
4894 if (rdev->family >= CHIP_CAYMAN) {
4895 DRM_DEBUG("IH: DMA1 trap\n");
4896 radeon_fence_process(rdev, CAYMAN_RING_TYPE_DMA1_INDEX);
4897 }
4898 break;
4899 default:
4900 DRM_DEBUG("Unhandled interrupt: %d %d\n", src_id, src_data);
4901 break;
4902 }
4903
4904 /* wptr/rptr are in bytes! */
4905 rptr += 16;
4906 rptr &= rdev->ih.ptr_mask;
4907 WREG32(IH_RB_RPTR, rptr);
4908 }
4909 if (queue_dp)
4910 schedule_work(&rdev->dp_work);
4911 if (queue_hotplug)
4912 schedule_delayed_work(&rdev->hotplug_work, 0);
4913 if (queue_hdmi)
4914 schedule_work(&rdev->audio_work);
4915 if (queue_thermal && rdev->pm.dpm_enabled)
4916 schedule_work(&rdev->pm.dpm.thermal.work);
4917 rdev->ih.rptr = rptr;
4918 atomic_set(&rdev->ih.lock, 0);
4919
4920 /* make sure wptr hasn't changed while processing */
4921 wptr = evergreen_get_ih_wptr(rdev);
4922 if (wptr != rptr)
4923 goto restart_ih;
4924
4925 return IRQ_HANDLED;
4926 }
4927
4928 static void evergreen_uvd_init(struct radeon_device *rdev)
4929 {
4930 int r;
4931
4932 if (!rdev->has_uvd)
4933 return;
4934
4935 r = radeon_uvd_init(rdev);
4936 if (r) {
4937 dev_err(rdev->dev, "failed UVD (%d) init.\n", r);
4938 		/*
4939 		 * At this point rdev->uvd.vcpu_bo is NULL, which makes
4940 		 * uvd_v2_2_resume() fail early, so nothing would happen
4941 		 * there anyway. It is pointless to go through that code,
4942 		 * hence we disable UVD here.
4943 		 */
4944 rdev->has_uvd = 0;
4945 return;
4946 }
4947 rdev->ring[R600_RING_TYPE_UVD_INDEX].ring_obj = NULL;
4948 r600_ring_init(rdev, &rdev->ring[R600_RING_TYPE_UVD_INDEX], 4096);
4949 }
4950
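/**
 * evergreen_uvd_start - UVD hardware start
 *
 * @rdev: radeon_device pointer
 *
 * Resume the UVD block and start its fence driver (evergreen+).
 * On failure, zero the UVD ring size so evergreen_uvd_resume()
 * skips the ring.
 */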
static void evergreen_uvd_start(struct radeon_device *rdev)
{
	int r;

	if (!rdev->has_uvd)
		return;

	r = uvd_v2_2_resume(rdev);
	if (r) {
		dev_err(rdev->dev, "failed UVD resume (%d).\n", r);
		goto error;
	}
	r = radeon_fence_driver_start_ring(rdev, R600_RING_TYPE_UVD_INDEX);
	if (r) {
		dev_err(rdev->dev, "failed initializing UVD fences (%d).\n", r);
		goto error;
	}
	return;

error:
	rdev->ring[R600_RING_TYPE_UVD_INDEX].ring_size = 0;
}

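/**
 * evergreen_uvd_resume - UVD ring init
 *
 * @rdev: radeon_device pointer
 *
 * Initialize and start the UVD ring (evergreen+).
 * Skipped when UVD is absent or was not started.
 */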
static void evergreen_uvd_resume(struct radeon_device *rdev)
{
	struct radeon_ring *ring;
	int r;

	if (!rdev->has_uvd || !rdev->ring[R600_RING_TYPE_UVD_INDEX].ring_size)
		return;

	ring = &rdev->ring[R600_RING_TYPE_UVD_INDEX];
	r = radeon_ring_init(rdev, ring, ring->ring_size, 0, PACKET0(UVD_NO_OP, 0));
	if (r) {
		dev_err(rdev->dev, "failed initializing UVD ring (%d).\n", r);
		return;
	}
	r = uvd_v1_0_init(rdev);
	if (r) {
		dev_err(rdev->dev, "failed initializing UVD (%d).\n", r);
		return;
	}
}

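/**
 * evergreen_startup - program the ASIC and bring up the rings
 *
 * @rdev: radeon_device pointer
 *
 * Program the MC and GART, load microcode, and initialize the
 * GFX, DMA, and UVD rings, interrupts, the IB pool, and audio
 * (evergreen+).  Called from both init and resume.
 * Returns 0 on success, error on failure.
 */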
static int evergreen_startup(struct radeon_device *rdev)
{
	struct radeon_ring *ring;
	int r;

	/* enable pcie gen2 link */
	evergreen_pcie_gen2_enable(rdev);
	/* enable aspm */
	evergreen_program_aspm(rdev);

	/* scratch needs to be initialized before MC */
	r = r600_vram_scratch_init(rdev);
	if (r)
		return r;

	evergreen_mc_program(rdev);

	if (ASIC_IS_DCE5(rdev) && !rdev->pm.dpm_enabled) {
		r = ni_mc_load_microcode(rdev);
		if (r) {
			DRM_ERROR("Failed to load MC firmware!\n");
			return r;
		}
	}

	if (rdev->flags & RADEON_IS_AGP) {
		evergreen_agp_enable(rdev);
	} else {
		r = evergreen_pcie_gart_enable(rdev);
		if (r)
			return r;
	}
	evergreen_gpu_init(rdev);

	/* allocate rlc buffers */
	if (rdev->flags & RADEON_IS_IGP) {
		rdev->rlc.reg_list = sumo_rlc_save_restore_register_list;
		rdev->rlc.reg_list_size =
			(u32)ARRAY_SIZE(sumo_rlc_save_restore_register_list);
		rdev->rlc.cs_data = evergreen_cs_data;
		r = sumo_rlc_init(rdev);
		if (r) {
			DRM_ERROR("Failed to init rlc BOs!\n");
			return r;
		}
	}

	/* allocate wb buffer */
	r = radeon_wb_init(rdev);
	if (r)
		return r;

	r = radeon_fence_driver_start_ring(rdev, RADEON_RING_TYPE_GFX_INDEX);
	if (r) {
		dev_err(rdev->dev, "failed initializing CP fences (%d).\n", r);
		return r;
	}

	r = radeon_fence_driver_start_ring(rdev, R600_RING_TYPE_DMA_INDEX);
	if (r) {
		dev_err(rdev->dev, "failed initializing DMA fences (%d).\n", r);
		return r;
	}

	evergreen_uvd_start(rdev);

	/* Enable IRQ */
	if (!rdev->irq.installed) {
		r = radeon_irq_kms_init(rdev);
		if (r)
			return r;
	}

	r = r600_irq_init(rdev);
	if (r) {
		DRM_ERROR("radeon: IH init failed (%d).\n", r);
		radeon_irq_kms_fini(rdev);
		return r;
	}
	evergreen_irq_set(rdev);

	ring = &rdev->ring[RADEON_RING_TYPE_GFX_INDEX];
	r = radeon_ring_init(rdev, ring, ring->ring_size, RADEON_WB_CP_RPTR_OFFSET,
			     RADEON_CP_PACKET2);
	if (r)
		return r;

	ring = &rdev->ring[R600_RING_TYPE_DMA_INDEX];
	r = radeon_ring_init(rdev, ring, ring->ring_size, R600_WB_DMA_RPTR_OFFSET,
			     DMA_PACKET(DMA_PACKET_NOP, 0, 0));
	if (r)
		return r;

	r = evergreen_cp_load_microcode(rdev);
	if (r)
		return r;
	r = evergreen_cp_resume(rdev);
	if (r)
		return r;
	r = r600_dma_resume(rdev);
	if (r)
		return r;

	evergreen_uvd_resume(rdev);

	r = radeon_ib_pool_init(rdev);
	if (r) {
		dev_err(rdev->dev, "IB initialization failed (%d).\n", r);
		return r;
	}

	r = radeon_audio_init(rdev);
	if (r) {
		DRM_ERROR("radeon: audio init failed\n");
		return r;
	}

	return 0;
}

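/**
 * evergreen_resume - resume the ASIC
 *
 * @rdev: radeon_device pointer
 *
 * Bring the chip back up after suspend: reset the ASIC, re-post
 * the card, restore golden registers, and re-run
 * evergreen_startup() (evergreen+).
 * Returns 0 on success, error on failure.
 */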
int evergreen_resume(struct radeon_device *rdev)
{
	int r;

	/* reset the asic, the gfx blocks are often in a bad state
	 * after the driver is unloaded or after a resume
	 */
	if (radeon_asic_reset(rdev))
		dev_warn(rdev->dev, "GPU reset failed!\n");
	/* Do not reset the GPU before posting; on rv770 hw, unlike r500 hw,
	 * posting performs the tasks needed to bring the GPU back into
	 * good shape.
	 */
	/* post card */
	atom_asic_init(rdev->mode_info.atom_context);

	/* init golden registers */
	evergreen_init_golden_registers(rdev);

	if (rdev->pm.pm_method == PM_METHOD_DPM)
		radeon_pm_resume(rdev);

	rdev->accel_working = true;
	r = evergreen_startup(rdev);
	if (r) {
		DRM_ERROR("evergreen startup failed on resume\n");
		rdev->accel_working = false;
		return r;
	}

	return r;
}

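/**
 * evergreen_suspend - suspend the ASIC
 *
 * @rdev: radeon_device pointer
 *
 * Tear down the engines in the reverse of startup order: stop
 * power management, audio, UVD, the CP and DMA engines,
 * interrupts, writeback, and the GART (evergreen+).
 * Returns 0.
 */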
int evergreen_suspend(struct radeon_device *rdev)
{
	radeon_pm_suspend(rdev);
	radeon_audio_fini(rdev);
	if (rdev->has_uvd) {
		uvd_v1_0_fini(rdev);
		radeon_uvd_suspend(rdev);
	}
	r700_cp_stop(rdev);
	r600_dma_stop(rdev);
	evergreen_irq_suspend(rdev);
	radeon_wb_disable(rdev);
	evergreen_pcie_gart_disable(rdev);

	return 0;
}

/* The plan is to move initialization into this function and to use
 * helper functions so that radeon_device_init does little more than
 * call asic-specific functions. This should also allow us to remove
 * a bunch of callbacks like vram_info.
 */
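/**
 * evergreen_init - asic specific driver and hw init
 *
 * @rdev: radeon_device pointer
 *
 * One-time setup: read and post the BIOS, initialize clocks,
 * fences, AGP, the memory controller, microcode, power
 * management, and the rings, then call evergreen_startup()
 * (evergreen+).
 * Returns 0 on success, error on failure.
 */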
int evergreen_init(struct radeon_device *rdev)
{
	int r;

	/* Read BIOS */
	if (!radeon_get_bios(rdev)) {
		if (ASIC_IS_AVIVO(rdev))
			return -EINVAL;
	}
	/* Must be an ATOMBIOS */
	if (!rdev->is_atom_bios) {
		dev_err(rdev->dev, "Expecting atombios for evergreen GPU\n");
		return -EINVAL;
	}
	r = radeon_atombios_init(rdev);
	if (r)
		return r;
	/* reset the asic, the gfx blocks are often in a bad state
	 * after the driver is unloaded or after a resume
	 */
	if (radeon_asic_reset(rdev))
		dev_warn(rdev->dev, "GPU reset failed!\n");
	/* Post card if necessary */
	if (!radeon_card_posted(rdev)) {
		if (!rdev->bios) {
			dev_err(rdev->dev, "Card not posted and no BIOS - ignoring\n");
			return -EINVAL;
		}
		DRM_INFO("GPU not posted. posting now...\n");
		atom_asic_init(rdev->mode_info.atom_context);
	}
	/* init golden registers */
	evergreen_init_golden_registers(rdev);
	/* Initialize scratch registers */
	r600_scratch_init(rdev);
	/* Initialize surface registers */
	radeon_surface_init(rdev);
	/* Initialize clocks */
	radeon_get_clock_info(rdev->ddev);
	/* Fence driver */
	r = radeon_fence_driver_init(rdev);
	if (r)
		return r;
	/* initialize AGP */
	if (rdev->flags & RADEON_IS_AGP) {
		r = radeon_agp_init(rdev);
		if (r)
			radeon_agp_disable(rdev);
	}
	/* initialize memory controller */
	r = evergreen_mc_init(rdev);
	if (r)
		return r;
	/* Memory manager */
	r = radeon_bo_init(rdev);
	if (r)
		return r;

	if (ASIC_IS_DCE5(rdev)) {
		if (!rdev->me_fw || !rdev->pfp_fw || !rdev->rlc_fw || !rdev->mc_fw) {
			r = ni_init_microcode(rdev);
			if (r) {
				DRM_ERROR("Failed to load firmware!\n");
				return r;
			}
		}
	} else {
		if (!rdev->me_fw || !rdev->pfp_fw || !rdev->rlc_fw) {
			r = r600_init_microcode(rdev);
			if (r) {
				DRM_ERROR("Failed to load firmware!\n");
				return r;
			}
		}
	}

	/* Initialize power management */
	radeon_pm_init(rdev);

	rdev->ring[RADEON_RING_TYPE_GFX_INDEX].ring_obj = NULL;
	r600_ring_init(rdev, &rdev->ring[RADEON_RING_TYPE_GFX_INDEX], 1024 * 1024);

	rdev->ring[R600_RING_TYPE_DMA_INDEX].ring_obj = NULL;
	r600_ring_init(rdev, &rdev->ring[R600_RING_TYPE_DMA_INDEX], 64 * 1024);

	evergreen_uvd_init(rdev);

	rdev->ih.ring_obj = NULL;
	r600_ih_ring_init(rdev, 64 * 1024);

	r = r600_pcie_gart_init(rdev);
	if (r)
		return r;

	rdev->accel_working = true;
	r = evergreen_startup(rdev);
	if (r) {
		dev_err(rdev->dev, "disabling GPU acceleration\n");
		r700_cp_fini(rdev);
		r600_dma_fini(rdev);
		r600_irq_fini(rdev);
		if (rdev->flags & RADEON_IS_IGP)
			sumo_rlc_fini(rdev);
		radeon_wb_fini(rdev);
		radeon_ib_pool_fini(rdev);
		radeon_irq_kms_fini(rdev);
		evergreen_pcie_gart_fini(rdev);
		rdev->accel_working = false;
	}

	/* Don't start up if the MC ucode is missing on BTC parts.
	 * The default clocks and voltages before the MC ucode
	 * is loaded are not sufficient for advanced operations.
	 */
	if (ASIC_IS_DCE5(rdev)) {
		if (!rdev->mc_fw && !(rdev->flags & RADEON_IS_IGP)) {
			DRM_ERROR("radeon: MC ucode required for NI+.\n");
			return -EINVAL;
		}
	}

	return 0;
}

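/**
 * evergreen_fini - asic specific driver and hw fini
 *
 * @rdev: radeon_device pointer
 *
 * Tear down everything set up by evergreen_init() and
 * evergreen_startup(), in reverse order (evergreen+).
 */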
void evergreen_fini(struct radeon_device *rdev)
{
	radeon_pm_fini(rdev);
	radeon_audio_fini(rdev);
	r700_cp_fini(rdev);
	r600_dma_fini(rdev);
	r600_irq_fini(rdev);
	if (rdev->flags & RADEON_IS_IGP)
		sumo_rlc_fini(rdev);
	radeon_wb_fini(rdev);
	radeon_ib_pool_fini(rdev);
	radeon_irq_kms_fini(rdev);
	uvd_v1_0_fini(rdev);
	radeon_uvd_fini(rdev);
	evergreen_pcie_gart_fini(rdev);
	r600_vram_scratch_fini(rdev);
	radeon_gem_fini(rdev);
	radeon_fence_driver_fini(rdev);
	radeon_agp_fini(rdev);
	radeon_bo_fini(rdev);
	radeon_atombios_fini(rdev);
	kfree(rdev->bios);
	rdev->bios = NULL;
}

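/**
 * evergreen_pcie_gen2_enable - enable PCIE gen 2 link speeds
 *
 * @rdev: radeon_device pointer
 *
 * Switch the PCIE link to gen 2 speeds when the chip and the
 * slot support them (evergreen+).  Skipped on IGP and X2 boards,
 * and when booted with radeon.pcie_gen2=0.
 */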
void evergreen_pcie_gen2_enable(struct radeon_device *rdev)
{
	u32 link_width_cntl, speed_cntl;

	if (radeon_pcie_gen2 == 0)
		return;

	if (rdev->flags & RADEON_IS_IGP)
		return;

	if (!(rdev->flags & RADEON_IS_PCIE))
		return;

	/* x2 cards have a special sequence */
	if (ASIC_IS_X2(rdev))
		return;

	if ((rdev->pdev->bus->max_bus_speed != PCIE_SPEED_5_0GT) &&
	    (rdev->pdev->bus->max_bus_speed != PCIE_SPEED_8_0GT))
		return;

	speed_cntl = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
	if (speed_cntl & LC_CURRENT_DATA_RATE) {
		DRM_INFO("PCIE gen 2 link speeds already enabled\n");
		return;
	}

	DRM_INFO("enabling PCIE gen 2 link speeds, disable with radeon.pcie_gen2=0\n");

	if ((speed_cntl & LC_OTHER_SIDE_EVER_SENT_GEN2) ||
	    (speed_cntl & LC_OTHER_SIDE_SUPPORTS_GEN2)) {

		link_width_cntl = RREG32_PCIE_PORT(PCIE_LC_LINK_WIDTH_CNTL);
		link_width_cntl &= ~LC_UPCONFIGURE_DIS;
		WREG32_PCIE_PORT(PCIE_LC_LINK_WIDTH_CNTL, link_width_cntl);

		speed_cntl = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
		speed_cntl &= ~LC_TARGET_LINK_SPEED_OVERRIDE_EN;
		WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, speed_cntl);

		speed_cntl = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
		speed_cntl |= LC_CLR_FAILED_SPD_CHANGE_CNT;
		WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, speed_cntl);

		speed_cntl = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
		speed_cntl &= ~LC_CLR_FAILED_SPD_CHANGE_CNT;
		WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, speed_cntl);

		speed_cntl = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
		speed_cntl |= LC_GEN2_EN_STRAP;
		WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, speed_cntl);

	} else {
		link_width_cntl = RREG32_PCIE_PORT(PCIE_LC_LINK_WIDTH_CNTL);
		/* XXX: only disable it if gen1 bridge vendor == 0x111d or 0x1106 */
		if (1)
			link_width_cntl |= LC_UPCONFIGURE_DIS;
		else
			link_width_cntl &= ~LC_UPCONFIGURE_DIS;
		WREG32_PCIE_PORT(PCIE_LC_LINK_WIDTH_CNTL, link_width_cntl);
	}
}

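/**
 * evergreen_program_aspm - program ASPM link power states
 *
 * @rdev: radeon_device pointer
 *
 * Configure L0s/L1 inactivity timers and PLL power states for
 * PCIE active state power management (evergreen+).  Skipped when
 * the radeon_aspm module parameter is 0.
 */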
void evergreen_program_aspm(struct radeon_device *rdev)
{
	u32 data, orig;
	u32 pcie_lc_cntl, pcie_lc_cntl_old;
	bool disable_l0s, disable_l1 = false, disable_plloff_in_l1 = false;
	/* fusion_platform should be true if the system is a fusion
	 * system (an APU, or a dGPU in a fusion system).
	 * todo: check whether the system is actually a fusion platform.
	 */
	bool fusion_platform = false;

	if (radeon_aspm == 0)
		return;

	if (!(rdev->flags & RADEON_IS_PCIE))
		return;

	switch (rdev->family) {
	case CHIP_CYPRESS:
	case CHIP_HEMLOCK:
	case CHIP_JUNIPER:
	case CHIP_REDWOOD:
	case CHIP_CEDAR:
	case CHIP_SUMO:
	case CHIP_SUMO2:
	case CHIP_PALM:
	case CHIP_ARUBA:
		disable_l0s = true;
		break;
	default:
		disable_l0s = false;
		break;
	}

	if (rdev->flags & RADEON_IS_IGP)
		fusion_platform = true; /* XXX also dGPUs in a fusion system */

	data = orig = RREG32_PIF_PHY0(PB0_PIF_PAIRING);
	if (fusion_platform)
		data &= ~MULTI_PIF;
	else
		data |= MULTI_PIF;
	if (data != orig)
		WREG32_PIF_PHY0(PB0_PIF_PAIRING, data);

	data = orig = RREG32_PIF_PHY1(PB1_PIF_PAIRING);
	if (fusion_platform)
		data &= ~MULTI_PIF;
	else
		data |= MULTI_PIF;
	if (data != orig)
		WREG32_PIF_PHY1(PB1_PIF_PAIRING, data);

	pcie_lc_cntl = pcie_lc_cntl_old = RREG32_PCIE_PORT(PCIE_LC_CNTL);
	pcie_lc_cntl &= ~(LC_L0S_INACTIVITY_MASK | LC_L1_INACTIVITY_MASK);
	if (!disable_l0s) {
		if (rdev->family >= CHIP_BARTS)
			pcie_lc_cntl |= LC_L0S_INACTIVITY(7);
		else
			pcie_lc_cntl |= LC_L0S_INACTIVITY(3);
	}

	if (!disable_l1) {
		if (rdev->family >= CHIP_BARTS)
			pcie_lc_cntl |= LC_L1_INACTIVITY(7);
		else
			pcie_lc_cntl |= LC_L1_INACTIVITY(8);

		if (!disable_plloff_in_l1) {
			data = orig = RREG32_PIF_PHY0(PB0_PIF_PWRDOWN_0);
			data &= ~(PLL_POWER_STATE_IN_OFF_0_MASK | PLL_POWER_STATE_IN_TXS2_0_MASK);
			data |= PLL_POWER_STATE_IN_OFF_0(7) | PLL_POWER_STATE_IN_TXS2_0(7);
			if (data != orig)
				WREG32_PIF_PHY0(PB0_PIF_PWRDOWN_0, data);

			data = orig = RREG32_PIF_PHY0(PB0_PIF_PWRDOWN_1);
			data &= ~(PLL_POWER_STATE_IN_OFF_1_MASK | PLL_POWER_STATE_IN_TXS2_1_MASK);
			data |= PLL_POWER_STATE_IN_OFF_1(7) | PLL_POWER_STATE_IN_TXS2_1(7);
			if (data != orig)
				WREG32_PIF_PHY0(PB0_PIF_PWRDOWN_1, data);

			data = orig = RREG32_PIF_PHY1(PB1_PIF_PWRDOWN_0);
			data &= ~(PLL_POWER_STATE_IN_OFF_0_MASK | PLL_POWER_STATE_IN_TXS2_0_MASK);
			data |= PLL_POWER_STATE_IN_OFF_0(7) | PLL_POWER_STATE_IN_TXS2_0(7);
			if (data != orig)
				WREG32_PIF_PHY1(PB1_PIF_PWRDOWN_0, data);

			data = orig = RREG32_PIF_PHY1(PB1_PIF_PWRDOWN_1);
			data &= ~(PLL_POWER_STATE_IN_OFF_1_MASK | PLL_POWER_STATE_IN_TXS2_1_MASK);
			data |= PLL_POWER_STATE_IN_OFF_1(7) | PLL_POWER_STATE_IN_TXS2_1(7);
			if (data != orig)
				WREG32_PIF_PHY1(PB1_PIF_PWRDOWN_1, data);

			if (rdev->family >= CHIP_BARTS) {
				data = orig = RREG32_PIF_PHY0(PB0_PIF_PWRDOWN_0);
				data &= ~PLL_RAMP_UP_TIME_0_MASK;
				data |= PLL_RAMP_UP_TIME_0(4);
				if (data != orig)
					WREG32_PIF_PHY0(PB0_PIF_PWRDOWN_0, data);

				data = orig = RREG32_PIF_PHY0(PB0_PIF_PWRDOWN_1);
				data &= ~PLL_RAMP_UP_TIME_1_MASK;
				data |= PLL_RAMP_UP_TIME_1(4);
				if (data != orig)
					WREG32_PIF_PHY0(PB0_PIF_PWRDOWN_1, data);

				data = orig = RREG32_PIF_PHY1(PB1_PIF_PWRDOWN_0);
				data &= ~PLL_RAMP_UP_TIME_0_MASK;
				data |= PLL_RAMP_UP_TIME_0(4);
				if (data != orig)
					WREG32_PIF_PHY1(PB1_PIF_PWRDOWN_0, data);

				data = orig = RREG32_PIF_PHY1(PB1_PIF_PWRDOWN_1);
				data &= ~PLL_RAMP_UP_TIME_1_MASK;
				data |= PLL_RAMP_UP_TIME_1(4);
				if (data != orig)
					WREG32_PIF_PHY1(PB1_PIF_PWRDOWN_1, data);
			}

			data = orig = RREG32_PCIE_PORT(PCIE_LC_LINK_WIDTH_CNTL);
			data &= ~LC_DYN_LANES_PWR_STATE_MASK;
			data |= LC_DYN_LANES_PWR_STATE(3);
			if (data != orig)
				WREG32_PCIE_PORT(PCIE_LC_LINK_WIDTH_CNTL, data);

			if (rdev->family >= CHIP_BARTS) {
				data = orig = RREG32_PIF_PHY0(PB0_PIF_CNTL);
				data &= ~LS2_EXIT_TIME_MASK;
				data |= LS2_EXIT_TIME(1);
				if (data != orig)
					WREG32_PIF_PHY0(PB0_PIF_CNTL, data);

				data = orig = RREG32_PIF_PHY1(PB1_PIF_CNTL);
				data &= ~LS2_EXIT_TIME_MASK;
				data |= LS2_EXIT_TIME(1);
				if (data != orig)
					WREG32_PIF_PHY1(PB1_PIF_CNTL, data);
			}
		}
	}

	/* evergreen parts only */
	if (rdev->family < CHIP_BARTS)
		pcie_lc_cntl |= LC_PMI_TO_L1_DIS;

	if (pcie_lc_cntl != pcie_lc_cntl_old)
		WREG32_PCIE_PORT(PCIE_LC_CNTL, pcie_lc_cntl);
}