2 * Copyright 2008 Advanced Micro Devices, Inc.
3 * Copyright 2008 Red Hat Inc.
4 * Copyright 2009 Jerome Glisse.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22 * OTHER DEALINGS IN THE SOFTWARE.
24 * Authors: Dave Airlie
28 #include <linux/firmware.h>
29 #include <linux/platform_device.h>
30 #include <linux/slab.h>
33 #include "radeon_asic.h"
34 #include <drm/radeon_drm.h>
39 #define R700_PFP_UCODE_SIZE 848
40 #define R700_PM4_UCODE_SIZE 1360
42 static void rv770_gpu_init(struct radeon_device *rdev);
43 void rv770_fini(struct radeon_device *rdev);
44 static void rv770_pcie_gen2_enable(struct radeon_device *rdev);
45 int evergreen_set_uvd_clocks(struct radeon_device *rdev, u32 vclk, u32 dclk);
47 int rv770_set_uvd_clocks(struct radeon_device *rdev, u32 vclk, u32 dclk)
49 unsigned fb_div = 0, vclk_div = 0, dclk_div = 0;
52 /* RV740 uses evergreen uvd clk programming */
53 if (rdev->family == CHIP_RV740)
54 return evergreen_set_uvd_clocks(rdev, vclk, dclk);
56 /* bypass vclk and dclk with bclk */
57 WREG32_P(CG_UPLL_FUNC_CNTL_2,
58 VCLK_SRC_SEL(1) | DCLK_SRC_SEL(1),
59 ~(VCLK_SRC_SEL_MASK | DCLK_SRC_SEL_MASK));
62 /* keep the Bypass mode, put PLL to sleep */
63 WREG32_P(CG_UPLL_FUNC_CNTL, UPLL_SLEEP_MASK, ~UPLL_SLEEP_MASK);
67 r = radeon_uvd_calc_upll_dividers(rdev, vclk, dclk, 50000, 160000,
68 43663, 0x03FFFFFE, 1, 30, ~0,
69 &fb_div, &vclk_div, &dclk_div);
77 /* set UPLL_FB_DIV to 0x50000 */
78 WREG32_P(CG_UPLL_FUNC_CNTL_3, UPLL_FB_DIV(0x50000), ~UPLL_FB_DIV_MASK);
80 /* deassert UPLL_RESET and UPLL_SLEEP */
81 WREG32_P(CG_UPLL_FUNC_CNTL, 0, ~(UPLL_RESET_MASK | UPLL_SLEEP_MASK));
83 /* assert BYPASS EN and FB_DIV[0] <- ??? why? */
84 WREG32_P(CG_UPLL_FUNC_CNTL, UPLL_BYPASS_EN_MASK, ~UPLL_BYPASS_EN_MASK);
85 WREG32_P(CG_UPLL_FUNC_CNTL_3, UPLL_FB_DIV(1), ~UPLL_FB_DIV(1));
87 r = radeon_uvd_send_upll_ctlreq(rdev, CG_UPLL_FUNC_CNTL);
91 /* assert PLL_RESET */
92 WREG32_P(CG_UPLL_FUNC_CNTL, UPLL_RESET_MASK, ~UPLL_RESET_MASK);
94 /* set the required FB_DIV, REF_DIV, Post divder values */
95 WREG32_P(CG_UPLL_FUNC_CNTL, UPLL_REF_DIV(1), ~UPLL_REF_DIV_MASK);
96 WREG32_P(CG_UPLL_FUNC_CNTL_2,
97 UPLL_SW_HILEN(vclk_div >> 1) |
98 UPLL_SW_LOLEN((vclk_div >> 1) + (vclk_div & 1)) |
99 UPLL_SW_HILEN2(dclk_div >> 1) |
100 UPLL_SW_LOLEN2((dclk_div >> 1) + (dclk_div & 1)),
103 WREG32_P(CG_UPLL_FUNC_CNTL_3, UPLL_FB_DIV(fb_div),
106 /* give the PLL some time to settle */
109 /* deassert PLL_RESET */
110 WREG32_P(CG_UPLL_FUNC_CNTL, 0, ~UPLL_RESET_MASK);
114 /* deassert BYPASS EN and FB_DIV[0] <- ??? why? */
115 WREG32_P(CG_UPLL_FUNC_CNTL, 0, ~UPLL_BYPASS_EN_MASK);
116 WREG32_P(CG_UPLL_FUNC_CNTL_3, 0, ~UPLL_FB_DIV(1));
118 r = radeon_uvd_send_upll_ctlreq(rdev, CG_UPLL_FUNC_CNTL);
122 /* switch VCLK and DCLK selection */
123 WREG32_P(CG_UPLL_FUNC_CNTL_2,
124 VCLK_SRC_SEL(2) | DCLK_SRC_SEL(2),
125 ~(VCLK_SRC_SEL_MASK | DCLK_SRC_SEL_MASK));
132 static const u32 r7xx_golden_registers[] =
134 0x8d00, 0xffffffff, 0x0e0e0074,
135 0x8d04, 0xffffffff, 0x013a2b34,
136 0x9508, 0xffffffff, 0x00000002,
137 0x8b20, 0xffffffff, 0,
138 0x88c4, 0xffffffff, 0x000000c2,
139 0x28350, 0xffffffff, 0,
140 0x9058, 0xffffffff, 0x0fffc40f,
141 0x240c, 0xffffffff, 0x00000380,
142 0x733c, 0xffffffff, 0x00000002,
143 0x2650, 0x00040000, 0,
144 0x20bc, 0x00040000, 0,
145 0x7300, 0xffffffff, 0x001000f0
148 static const u32 r7xx_golden_dyn_gpr_registers[] =
150 0x8db0, 0xffffffff, 0x98989898,
151 0x8db4, 0xffffffff, 0x98989898,
152 0x8db8, 0xffffffff, 0x98989898,
153 0x8dbc, 0xffffffff, 0x98989898,
154 0x8dc0, 0xffffffff, 0x98989898,
155 0x8dc4, 0xffffffff, 0x98989898,
156 0x8dc8, 0xffffffff, 0x98989898,
157 0x8dcc, 0xffffffff, 0x98989898,
158 0x88c4, 0xffffffff, 0x00000082
161 static const u32 rv770_golden_registers[] =
163 0x562c, 0xffffffff, 0,
164 0x3f90, 0xffffffff, 0,
165 0x9148, 0xffffffff, 0,
166 0x3f94, 0xffffffff, 0,
167 0x914c, 0xffffffff, 0,
168 0x9698, 0x18000000, 0x18000000
171 static const u32 rv770ce_golden_registers[] =
173 0x562c, 0xffffffff, 0,
174 0x3f90, 0xffffffff, 0x00cc0000,
175 0x9148, 0xffffffff, 0x00cc0000,
176 0x3f94, 0xffffffff, 0x00cc0000,
177 0x914c, 0xffffffff, 0x00cc0000,
178 0x9b7c, 0xffffffff, 0x00fa0000,
179 0x3f8c, 0xffffffff, 0x00fa0000,
180 0x9698, 0x18000000, 0x18000000
183 static const u32 rv770_mgcg_init[] =
185 0x8bcc, 0xffffffff, 0x130300f9,
186 0x5448, 0xffffffff, 0x100,
187 0x55e4, 0xffffffff, 0x100,
188 0x160c, 0xffffffff, 0x100,
189 0x5644, 0xffffffff, 0x100,
190 0xc164, 0xffffffff, 0x100,
191 0x8a18, 0xffffffff, 0x100,
192 0x897c, 0xffffffff, 0x8000100,
193 0x8b28, 0xffffffff, 0x3c000100,
194 0x9144, 0xffffffff, 0x100,
195 0x9a1c, 0xffffffff, 0x10000,
196 0x9a50, 0xffffffff, 0x100,
197 0x9a1c, 0xffffffff, 0x10001,
198 0x9a50, 0xffffffff, 0x100,
199 0x9a1c, 0xffffffff, 0x10002,
200 0x9a50, 0xffffffff, 0x100,
201 0x9a1c, 0xffffffff, 0x10003,
202 0x9a50, 0xffffffff, 0x100,
203 0x9a1c, 0xffffffff, 0x0,
204 0x9870, 0xffffffff, 0x100,
205 0x8d58, 0xffffffff, 0x100,
206 0x9500, 0xffffffff, 0x0,
207 0x9510, 0xffffffff, 0x100,
208 0x9500, 0xffffffff, 0x1,
209 0x9510, 0xffffffff, 0x100,
210 0x9500, 0xffffffff, 0x2,
211 0x9510, 0xffffffff, 0x100,
212 0x9500, 0xffffffff, 0x3,
213 0x9510, 0xffffffff, 0x100,
214 0x9500, 0xffffffff, 0x4,
215 0x9510, 0xffffffff, 0x100,
216 0x9500, 0xffffffff, 0x5,
217 0x9510, 0xffffffff, 0x100,
218 0x9500, 0xffffffff, 0x6,
219 0x9510, 0xffffffff, 0x100,
220 0x9500, 0xffffffff, 0x7,
221 0x9510, 0xffffffff, 0x100,
222 0x9500, 0xffffffff, 0x8,
223 0x9510, 0xffffffff, 0x100,
224 0x9500, 0xffffffff, 0x9,
225 0x9510, 0xffffffff, 0x100,
226 0x9500, 0xffffffff, 0x8000,
227 0x9490, 0xffffffff, 0x0,
228 0x949c, 0xffffffff, 0x100,
229 0x9490, 0xffffffff, 0x1,
230 0x949c, 0xffffffff, 0x100,
231 0x9490, 0xffffffff, 0x2,
232 0x949c, 0xffffffff, 0x100,
233 0x9490, 0xffffffff, 0x3,
234 0x949c, 0xffffffff, 0x100,
235 0x9490, 0xffffffff, 0x4,
236 0x949c, 0xffffffff, 0x100,
237 0x9490, 0xffffffff, 0x5,
238 0x949c, 0xffffffff, 0x100,
239 0x9490, 0xffffffff, 0x6,
240 0x949c, 0xffffffff, 0x100,
241 0x9490, 0xffffffff, 0x7,
242 0x949c, 0xffffffff, 0x100,
243 0x9490, 0xffffffff, 0x8,
244 0x949c, 0xffffffff, 0x100,
245 0x9490, 0xffffffff, 0x9,
246 0x949c, 0xffffffff, 0x100,
247 0x9490, 0xffffffff, 0x8000,
248 0x9604, 0xffffffff, 0x0,
249 0x9654, 0xffffffff, 0x100,
250 0x9604, 0xffffffff, 0x1,
251 0x9654, 0xffffffff, 0x100,
252 0x9604, 0xffffffff, 0x2,
253 0x9654, 0xffffffff, 0x100,
254 0x9604, 0xffffffff, 0x3,
255 0x9654, 0xffffffff, 0x100,
256 0x9604, 0xffffffff, 0x4,
257 0x9654, 0xffffffff, 0x100,
258 0x9604, 0xffffffff, 0x5,
259 0x9654, 0xffffffff, 0x100,
260 0x9604, 0xffffffff, 0x6,
261 0x9654, 0xffffffff, 0x100,
262 0x9604, 0xffffffff, 0x7,
263 0x9654, 0xffffffff, 0x100,
264 0x9604, 0xffffffff, 0x8,
265 0x9654, 0xffffffff, 0x100,
266 0x9604, 0xffffffff, 0x9,
267 0x9654, 0xffffffff, 0x100,
268 0x9604, 0xffffffff, 0x80000000,
269 0x9030, 0xffffffff, 0x100,
270 0x9034, 0xffffffff, 0x100,
271 0x9038, 0xffffffff, 0x100,
272 0x903c, 0xffffffff, 0x100,
273 0x9040, 0xffffffff, 0x100,
274 0xa200, 0xffffffff, 0x100,
275 0xa204, 0xffffffff, 0x100,
276 0xa208, 0xffffffff, 0x100,
277 0xa20c, 0xffffffff, 0x100,
278 0x971c, 0xffffffff, 0x100,
279 0x915c, 0xffffffff, 0x00020001,
280 0x9160, 0xffffffff, 0x00040003,
281 0x916c, 0xffffffff, 0x00060005,
282 0x9170, 0xffffffff, 0x00080007,
283 0x9174, 0xffffffff, 0x000a0009,
284 0x9178, 0xffffffff, 0x000c000b,
285 0x917c, 0xffffffff, 0x000e000d,
286 0x9180, 0xffffffff, 0x0010000f,
287 0x918c, 0xffffffff, 0x00120011,
288 0x9190, 0xffffffff, 0x00140013,
289 0x9194, 0xffffffff, 0x00020001,
290 0x9198, 0xffffffff, 0x00040003,
291 0x919c, 0xffffffff, 0x00060005,
292 0x91a8, 0xffffffff, 0x00080007,
293 0x91ac, 0xffffffff, 0x000a0009,
294 0x91b0, 0xffffffff, 0x000c000b,
295 0x91b4, 0xffffffff, 0x000e000d,
296 0x91b8, 0xffffffff, 0x0010000f,
297 0x91c4, 0xffffffff, 0x00120011,
298 0x91c8, 0xffffffff, 0x00140013,
299 0x91cc, 0xffffffff, 0x00020001,
300 0x91d0, 0xffffffff, 0x00040003,
301 0x91d4, 0xffffffff, 0x00060005,
302 0x91e0, 0xffffffff, 0x00080007,
303 0x91e4, 0xffffffff, 0x000a0009,
304 0x91e8, 0xffffffff, 0x000c000b,
305 0x91ec, 0xffffffff, 0x00020001,
306 0x91f0, 0xffffffff, 0x00040003,
307 0x91f4, 0xffffffff, 0x00060005,
308 0x9200, 0xffffffff, 0x00080007,
309 0x9204, 0xffffffff, 0x000a0009,
310 0x9208, 0xffffffff, 0x000c000b,
311 0x920c, 0xffffffff, 0x000e000d,
312 0x9210, 0xffffffff, 0x0010000f,
313 0x921c, 0xffffffff, 0x00120011,
314 0x9220, 0xffffffff, 0x00140013,
315 0x9224, 0xffffffff, 0x00020001,
316 0x9228, 0xffffffff, 0x00040003,
317 0x922c, 0xffffffff, 0x00060005,
318 0x9238, 0xffffffff, 0x00080007,
319 0x923c, 0xffffffff, 0x000a0009,
320 0x9240, 0xffffffff, 0x000c000b,
321 0x9244, 0xffffffff, 0x000e000d,
322 0x9248, 0xffffffff, 0x0010000f,
323 0x9254, 0xffffffff, 0x00120011,
324 0x9258, 0xffffffff, 0x00140013,
325 0x925c, 0xffffffff, 0x00020001,
326 0x9260, 0xffffffff, 0x00040003,
327 0x9264, 0xffffffff, 0x00060005,
328 0x9270, 0xffffffff, 0x00080007,
329 0x9274, 0xffffffff, 0x000a0009,
330 0x9278, 0xffffffff, 0x000c000b,
331 0x927c, 0xffffffff, 0x000e000d,
332 0x9280, 0xffffffff, 0x0010000f,
333 0x928c, 0xffffffff, 0x00120011,
334 0x9290, 0xffffffff, 0x00140013,
335 0x9294, 0xffffffff, 0x00020001,
336 0x929c, 0xffffffff, 0x00040003,
337 0x92a0, 0xffffffff, 0x00060005,
338 0x92a4, 0xffffffff, 0x00080007
341 static const u32 rv710_golden_registers[] =
343 0x3f90, 0x00ff0000, 0x00fc0000,
344 0x9148, 0x00ff0000, 0x00fc0000,
345 0x3f94, 0x00ff0000, 0x00fc0000,
346 0x914c, 0x00ff0000, 0x00fc0000,
347 0xb4c, 0x00000020, 0x00000020,
348 0xa180, 0xffffffff, 0x00003f3f
351 static const u32 rv710_mgcg_init[] =
353 0x8bcc, 0xffffffff, 0x13030040,
354 0x5448, 0xffffffff, 0x100,
355 0x55e4, 0xffffffff, 0x100,
356 0x160c, 0xffffffff, 0x100,
357 0x5644, 0xffffffff, 0x100,
358 0xc164, 0xffffffff, 0x100,
359 0x8a18, 0xffffffff, 0x100,
360 0x897c, 0xffffffff, 0x8000100,
361 0x8b28, 0xffffffff, 0x3c000100,
362 0x9144, 0xffffffff, 0x100,
363 0x9a1c, 0xffffffff, 0x10000,
364 0x9a50, 0xffffffff, 0x100,
365 0x9a1c, 0xffffffff, 0x0,
366 0x9870, 0xffffffff, 0x100,
367 0x8d58, 0xffffffff, 0x100,
368 0x9500, 0xffffffff, 0x0,
369 0x9510, 0xffffffff, 0x100,
370 0x9500, 0xffffffff, 0x1,
371 0x9510, 0xffffffff, 0x100,
372 0x9500, 0xffffffff, 0x8000,
373 0x9490, 0xffffffff, 0x0,
374 0x949c, 0xffffffff, 0x100,
375 0x9490, 0xffffffff, 0x1,
376 0x949c, 0xffffffff, 0x100,
377 0x9490, 0xffffffff, 0x8000,
378 0x9604, 0xffffffff, 0x0,
379 0x9654, 0xffffffff, 0x100,
380 0x9604, 0xffffffff, 0x1,
381 0x9654, 0xffffffff, 0x100,
382 0x9604, 0xffffffff, 0x80000000,
383 0x9030, 0xffffffff, 0x100,
384 0x9034, 0xffffffff, 0x100,
385 0x9038, 0xffffffff, 0x100,
386 0x903c, 0xffffffff, 0x100,
387 0x9040, 0xffffffff, 0x100,
388 0xa200, 0xffffffff, 0x100,
389 0xa204, 0xffffffff, 0x100,
390 0xa208, 0xffffffff, 0x100,
391 0xa20c, 0xffffffff, 0x100,
392 0x971c, 0xffffffff, 0x100,
393 0x915c, 0xffffffff, 0x00020001,
394 0x9174, 0xffffffff, 0x00000003,
395 0x9178, 0xffffffff, 0x00050001,
396 0x917c, 0xffffffff, 0x00030002,
397 0x918c, 0xffffffff, 0x00000004,
398 0x9190, 0xffffffff, 0x00070006,
399 0x9194, 0xffffffff, 0x00050001,
400 0x9198, 0xffffffff, 0x00030002,
401 0x91a8, 0xffffffff, 0x00000004,
402 0x91ac, 0xffffffff, 0x00070006,
403 0x91e8, 0xffffffff, 0x00000001,
404 0x9294, 0xffffffff, 0x00000001,
405 0x929c, 0xffffffff, 0x00000002,
406 0x92a0, 0xffffffff, 0x00040003,
407 0x9150, 0xffffffff, 0x4d940000
410 static const u32 rv730_golden_registers[] =
412 0x3f90, 0x00ff0000, 0x00f00000,
413 0x9148, 0x00ff0000, 0x00f00000,
414 0x3f94, 0x00ff0000, 0x00f00000,
415 0x914c, 0x00ff0000, 0x00f00000,
416 0x900c, 0xffffffff, 0x003b033f,
417 0xb4c, 0x00000020, 0x00000020,
418 0xa180, 0xffffffff, 0x00003f3f
421 static const u32 rv730_mgcg_init[] =
423 0x8bcc, 0xffffffff, 0x130300f9,
424 0x5448, 0xffffffff, 0x100,
425 0x55e4, 0xffffffff, 0x100,
426 0x160c, 0xffffffff, 0x100,
427 0x5644, 0xffffffff, 0x100,
428 0xc164, 0xffffffff, 0x100,
429 0x8a18, 0xffffffff, 0x100,
430 0x897c, 0xffffffff, 0x8000100,
431 0x8b28, 0xffffffff, 0x3c000100,
432 0x9144, 0xffffffff, 0x100,
433 0x9a1c, 0xffffffff, 0x10000,
434 0x9a50, 0xffffffff, 0x100,
435 0x9a1c, 0xffffffff, 0x10001,
436 0x9a50, 0xffffffff, 0x100,
437 0x9a1c, 0xffffffff, 0x0,
438 0x9870, 0xffffffff, 0x100,
439 0x8d58, 0xffffffff, 0x100,
440 0x9500, 0xffffffff, 0x0,
441 0x9510, 0xffffffff, 0x100,
442 0x9500, 0xffffffff, 0x1,
443 0x9510, 0xffffffff, 0x100,
444 0x9500, 0xffffffff, 0x2,
445 0x9510, 0xffffffff, 0x100,
446 0x9500, 0xffffffff, 0x3,
447 0x9510, 0xffffffff, 0x100,
448 0x9500, 0xffffffff, 0x4,
449 0x9510, 0xffffffff, 0x100,
450 0x9500, 0xffffffff, 0x5,
451 0x9510, 0xffffffff, 0x100,
452 0x9500, 0xffffffff, 0x6,
453 0x9510, 0xffffffff, 0x100,
454 0x9500, 0xffffffff, 0x7,
455 0x9510, 0xffffffff, 0x100,
456 0x9500, 0xffffffff, 0x8000,
457 0x9490, 0xffffffff, 0x0,
458 0x949c, 0xffffffff, 0x100,
459 0x9490, 0xffffffff, 0x1,
460 0x949c, 0xffffffff, 0x100,
461 0x9490, 0xffffffff, 0x2,
462 0x949c, 0xffffffff, 0x100,
463 0x9490, 0xffffffff, 0x3,
464 0x949c, 0xffffffff, 0x100,
465 0x9490, 0xffffffff, 0x4,
466 0x949c, 0xffffffff, 0x100,
467 0x9490, 0xffffffff, 0x5,
468 0x949c, 0xffffffff, 0x100,
469 0x9490, 0xffffffff, 0x6,
470 0x949c, 0xffffffff, 0x100,
471 0x9490, 0xffffffff, 0x7,
472 0x949c, 0xffffffff, 0x100,
473 0x9490, 0xffffffff, 0x8000,
474 0x9604, 0xffffffff, 0x0,
475 0x9654, 0xffffffff, 0x100,
476 0x9604, 0xffffffff, 0x1,
477 0x9654, 0xffffffff, 0x100,
478 0x9604, 0xffffffff, 0x2,
479 0x9654, 0xffffffff, 0x100,
480 0x9604, 0xffffffff, 0x3,
481 0x9654, 0xffffffff, 0x100,
482 0x9604, 0xffffffff, 0x4,
483 0x9654, 0xffffffff, 0x100,
484 0x9604, 0xffffffff, 0x5,
485 0x9654, 0xffffffff, 0x100,
486 0x9604, 0xffffffff, 0x6,
487 0x9654, 0xffffffff, 0x100,
488 0x9604, 0xffffffff, 0x7,
489 0x9654, 0xffffffff, 0x100,
490 0x9604, 0xffffffff, 0x80000000,
491 0x9030, 0xffffffff, 0x100,
492 0x9034, 0xffffffff, 0x100,
493 0x9038, 0xffffffff, 0x100,
494 0x903c, 0xffffffff, 0x100,
495 0x9040, 0xffffffff, 0x100,
496 0xa200, 0xffffffff, 0x100,
497 0xa204, 0xffffffff, 0x100,
498 0xa208, 0xffffffff, 0x100,
499 0xa20c, 0xffffffff, 0x100,
500 0x971c, 0xffffffff, 0x100,
501 0x915c, 0xffffffff, 0x00020001,
502 0x916c, 0xffffffff, 0x00040003,
503 0x9170, 0xffffffff, 0x00000005,
504 0x9178, 0xffffffff, 0x00050001,
505 0x917c, 0xffffffff, 0x00030002,
506 0x918c, 0xffffffff, 0x00000004,
507 0x9190, 0xffffffff, 0x00070006,
508 0x9194, 0xffffffff, 0x00050001,
509 0x9198, 0xffffffff, 0x00030002,
510 0x91a8, 0xffffffff, 0x00000004,
511 0x91ac, 0xffffffff, 0x00070006,
512 0x91b0, 0xffffffff, 0x00050001,
513 0x91b4, 0xffffffff, 0x00030002,
514 0x91c4, 0xffffffff, 0x00000004,
515 0x91c8, 0xffffffff, 0x00070006,
516 0x91cc, 0xffffffff, 0x00050001,
517 0x91d0, 0xffffffff, 0x00030002,
518 0x91e0, 0xffffffff, 0x00000004,
519 0x91e4, 0xffffffff, 0x00070006,
520 0x91e8, 0xffffffff, 0x00000001,
521 0x91ec, 0xffffffff, 0x00050001,
522 0x91f0, 0xffffffff, 0x00030002,
523 0x9200, 0xffffffff, 0x00000004,
524 0x9204, 0xffffffff, 0x00070006,
525 0x9208, 0xffffffff, 0x00050001,
526 0x920c, 0xffffffff, 0x00030002,
527 0x921c, 0xffffffff, 0x00000004,
528 0x9220, 0xffffffff, 0x00070006,
529 0x9224, 0xffffffff, 0x00050001,
530 0x9228, 0xffffffff, 0x00030002,
531 0x9238, 0xffffffff, 0x00000004,
532 0x923c, 0xffffffff, 0x00070006,
533 0x9240, 0xffffffff, 0x00050001,
534 0x9244, 0xffffffff, 0x00030002,
535 0x9254, 0xffffffff, 0x00000004,
536 0x9258, 0xffffffff, 0x00070006,
537 0x9294, 0xffffffff, 0x00000001,
538 0x929c, 0xffffffff, 0x00000002,
539 0x92a0, 0xffffffff, 0x00040003,
540 0x92a4, 0xffffffff, 0x00000005
543 static const u32 rv740_golden_registers[] =
545 0x88c4, 0xffffffff, 0x00000082,
546 0x28a50, 0xfffffffc, 0x00000004,
547 0x2650, 0x00040000, 0,
548 0x20bc, 0x00040000, 0,
549 0x733c, 0xffffffff, 0x00000002,
550 0x7300, 0xffffffff, 0x001000f0,
551 0x3f90, 0x00ff0000, 0,
552 0x9148, 0x00ff0000, 0,
553 0x3f94, 0x00ff0000, 0,
554 0x914c, 0x00ff0000, 0,
555 0x240c, 0xffffffff, 0x00000380,
556 0x8a14, 0x00000007, 0x00000007,
557 0x8b24, 0xffffffff, 0x00ff0fff,
558 0x28a4c, 0xffffffff, 0x00004000,
559 0xa180, 0xffffffff, 0x00003f3f,
560 0x8d00, 0xffffffff, 0x0e0e003a,
561 0x8d04, 0xffffffff, 0x013a0e2a,
562 0x8c00, 0xffffffff, 0xe400000f,
563 0x8db0, 0xffffffff, 0x98989898,
564 0x8db4, 0xffffffff, 0x98989898,
565 0x8db8, 0xffffffff, 0x98989898,
566 0x8dbc, 0xffffffff, 0x98989898,
567 0x8dc0, 0xffffffff, 0x98989898,
568 0x8dc4, 0xffffffff, 0x98989898,
569 0x8dc8, 0xffffffff, 0x98989898,
570 0x8dcc, 0xffffffff, 0x98989898,
571 0x9058, 0xffffffff, 0x0fffc40f,
572 0x900c, 0xffffffff, 0x003b033f,
573 0x28350, 0xffffffff, 0,
574 0x8cf0, 0x1fffffff, 0x08e00420,
575 0x9508, 0xffffffff, 0x00000002,
576 0x88c4, 0xffffffff, 0x000000c2,
577 0x9698, 0x18000000, 0x18000000
580 static const u32 rv740_mgcg_init[] =
582 0x8bcc, 0xffffffff, 0x13030100,
583 0x5448, 0xffffffff, 0x100,
584 0x55e4, 0xffffffff, 0x100,
585 0x160c, 0xffffffff, 0x100,
586 0x5644, 0xffffffff, 0x100,
587 0xc164, 0xffffffff, 0x100,
588 0x8a18, 0xffffffff, 0x100,
589 0x897c, 0xffffffff, 0x100,
590 0x8b28, 0xffffffff, 0x100,
591 0x9144, 0xffffffff, 0x100,
592 0x9a1c, 0xffffffff, 0x10000,
593 0x9a50, 0xffffffff, 0x100,
594 0x9a1c, 0xffffffff, 0x10001,
595 0x9a50, 0xffffffff, 0x100,
596 0x9a1c, 0xffffffff, 0x10002,
597 0x9a50, 0xffffffff, 0x100,
598 0x9a1c, 0xffffffff, 0x10003,
599 0x9a50, 0xffffffff, 0x100,
600 0x9a1c, 0xffffffff, 0x0,
601 0x9870, 0xffffffff, 0x100,
602 0x8d58, 0xffffffff, 0x100,
603 0x9500, 0xffffffff, 0x0,
604 0x9510, 0xffffffff, 0x100,
605 0x9500, 0xffffffff, 0x1,
606 0x9510, 0xffffffff, 0x100,
607 0x9500, 0xffffffff, 0x2,
608 0x9510, 0xffffffff, 0x100,
609 0x9500, 0xffffffff, 0x3,
610 0x9510, 0xffffffff, 0x100,
611 0x9500, 0xffffffff, 0x4,
612 0x9510, 0xffffffff, 0x100,
613 0x9500, 0xffffffff, 0x5,
614 0x9510, 0xffffffff, 0x100,
615 0x9500, 0xffffffff, 0x6,
616 0x9510, 0xffffffff, 0x100,
617 0x9500, 0xffffffff, 0x7,
618 0x9510, 0xffffffff, 0x100,
619 0x9500, 0xffffffff, 0x8000,
620 0x9490, 0xffffffff, 0x0,
621 0x949c, 0xffffffff, 0x100,
622 0x9490, 0xffffffff, 0x1,
623 0x949c, 0xffffffff, 0x100,
624 0x9490, 0xffffffff, 0x2,
625 0x949c, 0xffffffff, 0x100,
626 0x9490, 0xffffffff, 0x3,
627 0x949c, 0xffffffff, 0x100,
628 0x9490, 0xffffffff, 0x4,
629 0x949c, 0xffffffff, 0x100,
630 0x9490, 0xffffffff, 0x5,
631 0x949c, 0xffffffff, 0x100,
632 0x9490, 0xffffffff, 0x6,
633 0x949c, 0xffffffff, 0x100,
634 0x9490, 0xffffffff, 0x7,
635 0x949c, 0xffffffff, 0x100,
636 0x9490, 0xffffffff, 0x8000,
637 0x9604, 0xffffffff, 0x0,
638 0x9654, 0xffffffff, 0x100,
639 0x9604, 0xffffffff, 0x1,
640 0x9654, 0xffffffff, 0x100,
641 0x9604, 0xffffffff, 0x2,
642 0x9654, 0xffffffff, 0x100,
643 0x9604, 0xffffffff, 0x3,
644 0x9654, 0xffffffff, 0x100,
645 0x9604, 0xffffffff, 0x4,
646 0x9654, 0xffffffff, 0x100,
647 0x9604, 0xffffffff, 0x5,
648 0x9654, 0xffffffff, 0x100,
649 0x9604, 0xffffffff, 0x6,
650 0x9654, 0xffffffff, 0x100,
651 0x9604, 0xffffffff, 0x7,
652 0x9654, 0xffffffff, 0x100,
653 0x9604, 0xffffffff, 0x80000000,
654 0x9030, 0xffffffff, 0x100,
655 0x9034, 0xffffffff, 0x100,
656 0x9038, 0xffffffff, 0x100,
657 0x903c, 0xffffffff, 0x100,
658 0x9040, 0xffffffff, 0x100,
659 0xa200, 0xffffffff, 0x100,
660 0xa204, 0xffffffff, 0x100,
661 0xa208, 0xffffffff, 0x100,
662 0xa20c, 0xffffffff, 0x100,
663 0x971c, 0xffffffff, 0x100,
664 0x915c, 0xffffffff, 0x00020001,
665 0x9160, 0xffffffff, 0x00040003,
666 0x916c, 0xffffffff, 0x00060005,
667 0x9170, 0xffffffff, 0x00080007,
668 0x9174, 0xffffffff, 0x000a0009,
669 0x9178, 0xffffffff, 0x000c000b,
670 0x917c, 0xffffffff, 0x000e000d,
671 0x9180, 0xffffffff, 0x0010000f,
672 0x918c, 0xffffffff, 0x00120011,
673 0x9190, 0xffffffff, 0x00140013,
674 0x9194, 0xffffffff, 0x00020001,
675 0x9198, 0xffffffff, 0x00040003,
676 0x919c, 0xffffffff, 0x00060005,
677 0x91a8, 0xffffffff, 0x00080007,
678 0x91ac, 0xffffffff, 0x000a0009,
679 0x91b0, 0xffffffff, 0x000c000b,
680 0x91b4, 0xffffffff, 0x000e000d,
681 0x91b8, 0xffffffff, 0x0010000f,
682 0x91c4, 0xffffffff, 0x00120011,
683 0x91c8, 0xffffffff, 0x00140013,
684 0x91cc, 0xffffffff, 0x00020001,
685 0x91d0, 0xffffffff, 0x00040003,
686 0x91d4, 0xffffffff, 0x00060005,
687 0x91e0, 0xffffffff, 0x00080007,
688 0x91e4, 0xffffffff, 0x000a0009,
689 0x91e8, 0xffffffff, 0x000c000b,
690 0x91ec, 0xffffffff, 0x00020001,
691 0x91f0, 0xffffffff, 0x00040003,
692 0x91f4, 0xffffffff, 0x00060005,
693 0x9200, 0xffffffff, 0x00080007,
694 0x9204, 0xffffffff, 0x000a0009,
695 0x9208, 0xffffffff, 0x000c000b,
696 0x920c, 0xffffffff, 0x000e000d,
697 0x9210, 0xffffffff, 0x0010000f,
698 0x921c, 0xffffffff, 0x00120011,
699 0x9220, 0xffffffff, 0x00140013,
700 0x9224, 0xffffffff, 0x00020001,
701 0x9228, 0xffffffff, 0x00040003,
702 0x922c, 0xffffffff, 0x00060005,
703 0x9238, 0xffffffff, 0x00080007,
704 0x923c, 0xffffffff, 0x000a0009,
705 0x9240, 0xffffffff, 0x000c000b,
706 0x9244, 0xffffffff, 0x000e000d,
707 0x9248, 0xffffffff, 0x0010000f,
708 0x9254, 0xffffffff, 0x00120011,
709 0x9258, 0xffffffff, 0x00140013,
710 0x9294, 0xffffffff, 0x00020001,
711 0x929c, 0xffffffff, 0x00040003,
712 0x92a0, 0xffffffff, 0x00060005,
713 0x92a4, 0xffffffff, 0x00080007
716 static void rv770_init_golden_registers(struct radeon_device *rdev)
718 switch (rdev->family) {
720 radeon_program_register_sequence(rdev,
721 r7xx_golden_registers,
722 (const u32)ARRAY_SIZE(r7xx_golden_registers));
723 radeon_program_register_sequence(rdev,
724 r7xx_golden_dyn_gpr_registers,
725 (const u32)ARRAY_SIZE(r7xx_golden_dyn_gpr_registers));
726 if (rdev->pdev->device == 0x994e)
727 radeon_program_register_sequence(rdev,
728 rv770ce_golden_registers,
729 (const u32)ARRAY_SIZE(rv770ce_golden_registers));
731 radeon_program_register_sequence(rdev,
732 rv770_golden_registers,
733 (const u32)ARRAY_SIZE(rv770_golden_registers));
734 radeon_program_register_sequence(rdev,
736 (const u32)ARRAY_SIZE(rv770_mgcg_init));
739 radeon_program_register_sequence(rdev,
740 r7xx_golden_registers,
741 (const u32)ARRAY_SIZE(r7xx_golden_registers));
742 radeon_program_register_sequence(rdev,
743 r7xx_golden_dyn_gpr_registers,
744 (const u32)ARRAY_SIZE(r7xx_golden_dyn_gpr_registers));
745 radeon_program_register_sequence(rdev,
746 rv730_golden_registers,
747 (const u32)ARRAY_SIZE(rv730_golden_registers));
748 radeon_program_register_sequence(rdev,
750 (const u32)ARRAY_SIZE(rv730_mgcg_init));
753 radeon_program_register_sequence(rdev,
754 r7xx_golden_registers,
755 (const u32)ARRAY_SIZE(r7xx_golden_registers));
756 radeon_program_register_sequence(rdev,
757 r7xx_golden_dyn_gpr_registers,
758 (const u32)ARRAY_SIZE(r7xx_golden_dyn_gpr_registers));
759 radeon_program_register_sequence(rdev,
760 rv710_golden_registers,
761 (const u32)ARRAY_SIZE(rv710_golden_registers));
762 radeon_program_register_sequence(rdev,
764 (const u32)ARRAY_SIZE(rv710_mgcg_init));
767 radeon_program_register_sequence(rdev,
768 rv740_golden_registers,
769 (const u32)ARRAY_SIZE(rv740_golden_registers));
770 radeon_program_register_sequence(rdev,
772 (const u32)ARRAY_SIZE(rv740_mgcg_init));
779 #define PCIE_BUS_CLK 10000
780 #define TCLK (PCIE_BUS_CLK / 10)
783 * rv770_get_xclk - get the xclk
785 * @rdev: radeon_device pointer
787 * Returns the reference clock used by the gfx engine
790 u32 rv770_get_xclk(struct radeon_device *rdev)
792 u32 reference_clock = rdev->clock.spll.reference_freq;
793 u32 tmp = RREG32(CG_CLKPIN_CNTL);
795 if (tmp & MUX_TCLK_TO_XCLK)
798 if (tmp & XTALIN_DIVIDE)
799 return reference_clock / 4;
801 return reference_clock;
804 int rv770_uvd_resume(struct radeon_device *rdev)
807 uint32_t chip_id, size;
810 r = radeon_uvd_resume(rdev);
814 /* programm the VCPU memory controller bits 0-27 */
815 addr = rdev->uvd.gpu_addr >> 3;
816 size = RADEON_GPU_PAGE_ALIGN(rdev->uvd_fw->size + 4) >> 3;
817 WREG32(UVD_VCPU_CACHE_OFFSET0, addr);
818 WREG32(UVD_VCPU_CACHE_SIZE0, size);
821 size = RADEON_UVD_STACK_SIZE >> 3;
822 WREG32(UVD_VCPU_CACHE_OFFSET1, addr);
823 WREG32(UVD_VCPU_CACHE_SIZE1, size);
826 size = RADEON_UVD_HEAP_SIZE >> 3;
827 WREG32(UVD_VCPU_CACHE_OFFSET2, addr);
828 WREG32(UVD_VCPU_CACHE_SIZE2, size);
831 addr = (rdev->uvd.gpu_addr >> 28) & 0xF;
832 WREG32(UVD_LMI_ADDR_EXT, (addr << 12) | (addr << 0));
835 addr = (rdev->uvd.gpu_addr >> 32) & 0xFF;
836 WREG32(UVD_LMI_EXT40_ADDR, addr | (0x9 << 16) | (0x1 << 31));
838 /* tell firmware which hardware it is running on */
839 switch (rdev->family) {
843 chip_id = 0x01000005;
846 chip_id = 0x01000006;
849 chip_id = 0x01000007;
853 chip_id = 0x01000008;
856 chip_id = 0x01000009;
859 chip_id = 0x0100000a;
862 chip_id = 0x0100000b;
866 chip_id = 0x0100000c;
869 chip_id = 0x0100000e;
872 chip_id = 0x0100000f;
875 chip_id = 0x01000010;
878 chip_id = 0x01000011;
881 chip_id = 0x01000012;
884 chip_id = 0x01000014;
887 chip_id = 0x01000015;
890 chip_id = 0x01000016;
893 chip_id = 0x01000017;
896 WREG32(UVD_VCPU_CHIP_ID, chip_id);
901 u32 rv770_page_flip(struct radeon_device *rdev, int crtc_id, u64 crtc_base)
903 struct radeon_crtc *radeon_crtc = rdev->mode_info.crtcs[crtc_id];
904 u32 tmp = RREG32(AVIVO_D1GRPH_UPDATE + radeon_crtc->crtc_offset);
907 /* Lock the graphics update lock */
908 tmp |= AVIVO_D1GRPH_UPDATE_LOCK;
909 WREG32(AVIVO_D1GRPH_UPDATE + radeon_crtc->crtc_offset, tmp);
911 /* update the scanout addresses */
912 if (radeon_crtc->crtc_id) {
913 WREG32(D2GRPH_SECONDARY_SURFACE_ADDRESS_HIGH, upper_32_bits(crtc_base));
914 WREG32(D2GRPH_PRIMARY_SURFACE_ADDRESS_HIGH, upper_32_bits(crtc_base));
916 WREG32(D1GRPH_SECONDARY_SURFACE_ADDRESS_HIGH, upper_32_bits(crtc_base));
917 WREG32(D1GRPH_PRIMARY_SURFACE_ADDRESS_HIGH, upper_32_bits(crtc_base));
919 WREG32(D1GRPH_SECONDARY_SURFACE_ADDRESS + radeon_crtc->crtc_offset,
921 WREG32(D1GRPH_PRIMARY_SURFACE_ADDRESS + radeon_crtc->crtc_offset,
924 /* Wait for update_pending to go high. */
925 for (i = 0; i < rdev->usec_timeout; i++) {
926 if (RREG32(AVIVO_D1GRPH_UPDATE + radeon_crtc->crtc_offset) & AVIVO_D1GRPH_SURFACE_UPDATE_PENDING)
930 DRM_DEBUG("Update pending now high. Unlocking vupdate_lock.\n");
932 /* Unlock the lock, so double-buffering can take place inside vblank */
933 tmp &= ~AVIVO_D1GRPH_UPDATE_LOCK;
934 WREG32(AVIVO_D1GRPH_UPDATE + radeon_crtc->crtc_offset, tmp);
936 /* Return current update_pending status: */
937 return RREG32(AVIVO_D1GRPH_UPDATE + radeon_crtc->crtc_offset) & AVIVO_D1GRPH_SURFACE_UPDATE_PENDING;
940 /* get temperature in millidegrees */
941 int rv770_get_temp(struct radeon_device *rdev)
943 u32 temp = (RREG32(CG_MULT_THERMAL_STATUS) & ASIC_T_MASK) >>
949 else if (temp & 0x200)
951 else if (temp & 0x100) {
952 actual_temp = temp & 0x1ff;
953 actual_temp |= ~0x1ff;
955 actual_temp = temp & 0xff;
957 return (actual_temp * 1000) / 2;
960 void rv770_pm_misc(struct radeon_device *rdev)
962 int req_ps_idx = rdev->pm.requested_power_state_index;
963 int req_cm_idx = rdev->pm.requested_clock_mode_index;
964 struct radeon_power_state *ps = &rdev->pm.power_state[req_ps_idx];
965 struct radeon_voltage *voltage = &ps->clock_info[req_cm_idx].voltage;
967 if ((voltage->type == VOLTAGE_SW) && voltage->voltage) {
968 /* 0xff01 is a flag rather then an actual voltage */
969 if (voltage->voltage == 0xff01)
971 if (voltage->voltage != rdev->pm.current_vddc) {
972 radeon_atom_set_voltage(rdev, voltage->voltage, SET_VOLTAGE_TYPE_ASIC_VDDC);
973 rdev->pm.current_vddc = voltage->voltage;
974 DRM_DEBUG("Setting: v: %d\n", voltage->voltage);
982 static int rv770_pcie_gart_enable(struct radeon_device *rdev)
987 if (rdev->gart.robj == NULL) {
988 dev_err(rdev->dev, "No VRAM object for PCIE GART.\n");
991 r = radeon_gart_table_vram_pin(rdev);
994 radeon_gart_restore(rdev);
996 WREG32(VM_L2_CNTL, ENABLE_L2_CACHE | ENABLE_L2_FRAGMENT_PROCESSING |
997 ENABLE_L2_PTE_CACHE_LRU_UPDATE_BY_WRITE |
998 EFFECTIVE_L2_QUEUE_SIZE(7));
999 WREG32(VM_L2_CNTL2, 0);
1000 WREG32(VM_L2_CNTL3, BANK_SELECT(0) | CACHE_UPDATE_MODE(2));
1001 /* Setup TLB control */
1002 tmp = ENABLE_L1_TLB | ENABLE_L1_FRAGMENT_PROCESSING |
1003 SYSTEM_ACCESS_MODE_NOT_IN_SYS |
1004 SYSTEM_APERTURE_UNMAPPED_ACCESS_PASS_THRU |
1005 EFFECTIVE_L1_TLB_SIZE(5) | EFFECTIVE_L1_QUEUE_SIZE(5);
1006 WREG32(MC_VM_MD_L1_TLB0_CNTL, tmp);
1007 WREG32(MC_VM_MD_L1_TLB1_CNTL, tmp);
1008 WREG32(MC_VM_MD_L1_TLB2_CNTL, tmp);
1009 if (rdev->family == CHIP_RV740)
1010 WREG32(MC_VM_MD_L1_TLB3_CNTL, tmp);
1011 WREG32(MC_VM_MB_L1_TLB0_CNTL, tmp);
1012 WREG32(MC_VM_MB_L1_TLB1_CNTL, tmp);
1013 WREG32(MC_VM_MB_L1_TLB2_CNTL, tmp);
1014 WREG32(MC_VM_MB_L1_TLB3_CNTL, tmp);
1015 WREG32(VM_CONTEXT0_PAGE_TABLE_START_ADDR, rdev->mc.gtt_start >> 12);
1016 WREG32(VM_CONTEXT0_PAGE_TABLE_END_ADDR, rdev->mc.gtt_end >> 12);
1017 WREG32(VM_CONTEXT0_PAGE_TABLE_BASE_ADDR, rdev->gart.table_addr >> 12);
1018 WREG32(VM_CONTEXT0_CNTL, ENABLE_CONTEXT | PAGE_TABLE_DEPTH(0) |
1019 RANGE_PROTECTION_FAULT_ENABLE_DEFAULT);
1020 WREG32(VM_CONTEXT0_PROTECTION_FAULT_DEFAULT_ADDR,
1021 (u32)(rdev->dummy_page.addr >> 12));
1022 for (i = 1; i < 7; i++)
1023 WREG32(VM_CONTEXT0_CNTL + (i * 4), 0);
1025 r600_pcie_gart_tlb_flush(rdev);
1026 DRM_INFO("PCIE GART of %uM enabled (table at 0x%016llX).\n",
1027 (unsigned)(rdev->mc.gtt_size >> 20),
1028 (unsigned long long)rdev->gart.table_addr);
1029 rdev->gart.ready = true;
1033 static void rv770_pcie_gart_disable(struct radeon_device *rdev)
1038 /* Disable all tables */
1039 for (i = 0; i < 7; i++)
1040 WREG32(VM_CONTEXT0_CNTL + (i * 4), 0);
1042 /* Setup L2 cache */
1043 WREG32(VM_L2_CNTL, ENABLE_L2_FRAGMENT_PROCESSING |
1044 EFFECTIVE_L2_QUEUE_SIZE(7));
1045 WREG32(VM_L2_CNTL2, 0);
1046 WREG32(VM_L2_CNTL3, BANK_SELECT(0) | CACHE_UPDATE_MODE(2));
1047 /* Setup TLB control */
1048 tmp = EFFECTIVE_L1_TLB_SIZE(5) | EFFECTIVE_L1_QUEUE_SIZE(5);
1049 WREG32(MC_VM_MD_L1_TLB0_CNTL, tmp);
1050 WREG32(MC_VM_MD_L1_TLB1_CNTL, tmp);
1051 WREG32(MC_VM_MD_L1_TLB2_CNTL, tmp);
1052 WREG32(MC_VM_MB_L1_TLB0_CNTL, tmp);
1053 WREG32(MC_VM_MB_L1_TLB1_CNTL, tmp);
1054 WREG32(MC_VM_MB_L1_TLB2_CNTL, tmp);
1055 WREG32(MC_VM_MB_L1_TLB3_CNTL, tmp);
1056 radeon_gart_table_vram_unpin(rdev);
1059 static void rv770_pcie_gart_fini(struct radeon_device *rdev)
1061 radeon_gart_fini(rdev);
1062 rv770_pcie_gart_disable(rdev);
1063 radeon_gart_table_vram_free(rdev);
1067 static void rv770_agp_enable(struct radeon_device *rdev)
1072 /* Setup L2 cache */
1073 WREG32(VM_L2_CNTL, ENABLE_L2_CACHE | ENABLE_L2_FRAGMENT_PROCESSING |
1074 ENABLE_L2_PTE_CACHE_LRU_UPDATE_BY_WRITE |
1075 EFFECTIVE_L2_QUEUE_SIZE(7));
1076 WREG32(VM_L2_CNTL2, 0);
1077 WREG32(VM_L2_CNTL3, BANK_SELECT(0) | CACHE_UPDATE_MODE(2));
1078 /* Setup TLB control */
1079 tmp = ENABLE_L1_TLB | ENABLE_L1_FRAGMENT_PROCESSING |
1080 SYSTEM_ACCESS_MODE_NOT_IN_SYS |
1081 SYSTEM_APERTURE_UNMAPPED_ACCESS_PASS_THRU |
1082 EFFECTIVE_L1_TLB_SIZE(5) | EFFECTIVE_L1_QUEUE_SIZE(5);
1083 WREG32(MC_VM_MD_L1_TLB0_CNTL, tmp);
1084 WREG32(MC_VM_MD_L1_TLB1_CNTL, tmp);
1085 WREG32(MC_VM_MD_L1_TLB2_CNTL, tmp);
1086 WREG32(MC_VM_MB_L1_TLB0_CNTL, tmp);
1087 WREG32(MC_VM_MB_L1_TLB1_CNTL, tmp);
1088 WREG32(MC_VM_MB_L1_TLB2_CNTL, tmp);
1089 WREG32(MC_VM_MB_L1_TLB3_CNTL, tmp);
1090 for (i = 0; i < 7; i++)
1091 WREG32(VM_CONTEXT0_CNTL + (i * 4), 0);
1094 static void rv770_mc_program(struct radeon_device *rdev)
1096 struct rv515_mc_save save;
1100 /* Initialize HDP */
1101 for (i = 0, j = 0; i < 32; i++, j += 0x18) {
1102 WREG32((0x2c14 + j), 0x00000000);
1103 WREG32((0x2c18 + j), 0x00000000);
1104 WREG32((0x2c1c + j), 0x00000000);
1105 WREG32((0x2c20 + j), 0x00000000);
1106 WREG32((0x2c24 + j), 0x00000000);
1108 /* r7xx hw bug. Read from HDP_DEBUG1 rather
1109 * than writing to HDP_REG_COHERENCY_FLUSH_CNTL
1111 tmp = RREG32(HDP_DEBUG1);
1113 rv515_mc_stop(rdev, &save);
1114 if (r600_mc_wait_for_idle(rdev)) {
1115 dev_warn(rdev->dev, "Wait for MC idle timedout !\n");
1117 /* Lockout access through VGA aperture*/
1118 WREG32(VGA_HDP_CONTROL, VGA_MEMORY_DISABLE);
1119 /* Update configuration */
1120 if (rdev->flags & RADEON_IS_AGP) {
1121 if (rdev->mc.vram_start < rdev->mc.gtt_start) {
1122 /* VRAM before AGP */
1123 WREG32(MC_VM_SYSTEM_APERTURE_LOW_ADDR,
1124 rdev->mc.vram_start >> 12);
1125 WREG32(MC_VM_SYSTEM_APERTURE_HIGH_ADDR,
1126 rdev->mc.gtt_end >> 12);
1128 /* VRAM after AGP */
1129 WREG32(MC_VM_SYSTEM_APERTURE_LOW_ADDR,
1130 rdev->mc.gtt_start >> 12);
1131 WREG32(MC_VM_SYSTEM_APERTURE_HIGH_ADDR,
1132 rdev->mc.vram_end >> 12);
1135 WREG32(MC_VM_SYSTEM_APERTURE_LOW_ADDR,
1136 rdev->mc.vram_start >> 12);
1137 WREG32(MC_VM_SYSTEM_APERTURE_HIGH_ADDR,
1138 rdev->mc.vram_end >> 12);
1140 WREG32(MC_VM_SYSTEM_APERTURE_DEFAULT_ADDR, rdev->vram_scratch.gpu_addr >> 12);
1141 tmp = ((rdev->mc.vram_end >> 24) & 0xFFFF) << 16;
1142 tmp |= ((rdev->mc.vram_start >> 24) & 0xFFFF);
1143 WREG32(MC_VM_FB_LOCATION, tmp);
1144 WREG32(HDP_NONSURFACE_BASE, (rdev->mc.vram_start >> 8));
1145 WREG32(HDP_NONSURFACE_INFO, (2 << 7));
1146 WREG32(HDP_NONSURFACE_SIZE, 0x3FFFFFFF);
1147 if (rdev->flags & RADEON_IS_AGP) {
1148 WREG32(MC_VM_AGP_TOP, rdev->mc.gtt_end >> 16);
1149 WREG32(MC_VM_AGP_BOT, rdev->mc.gtt_start >> 16);
1150 WREG32(MC_VM_AGP_BASE, rdev->mc.agp_base >> 22);
1152 WREG32(MC_VM_AGP_BASE, 0);
1153 WREG32(MC_VM_AGP_TOP, 0x0FFFFFFF);
1154 WREG32(MC_VM_AGP_BOT, 0x0FFFFFFF);
1156 if (r600_mc_wait_for_idle(rdev)) {
1157 dev_warn(rdev->dev, "Wait for MC idle timedout !\n");
1159 rv515_mc_resume(rdev, &save);
1160 /* we need to own VRAM, so turn off the VGA renderer here
1161 * to stop it overwriting our objects */
1162 rv515_vga_render_disable(rdev);
1169 void r700_cp_stop(struct radeon_device *rdev)
1171 radeon_ttm_set_active_vram_size(rdev, rdev->mc.visible_vram_size);
1172 WREG32(CP_ME_CNTL, (CP_ME_HALT | CP_PFP_HALT));
1173 WREG32(SCRATCH_UMSK, 0);
1174 rdev->ring[RADEON_RING_TYPE_GFX_INDEX].ready = false;
1177 static int rv770_cp_load_microcode(struct radeon_device *rdev)
1179 const __be32 *fw_data;
1182 if (!rdev->me_fw || !rdev->pfp_fw)
1190 RB_NO_UPDATE | RB_BLKSZ(15) | RB_BUFSZ(3));
1193 WREG32(GRBM_SOFT_RESET, SOFT_RESET_CP);
1194 RREG32(GRBM_SOFT_RESET);
1196 WREG32(GRBM_SOFT_RESET, 0);
1198 fw_data = (const __be32 *)rdev->pfp_fw->data;
1199 WREG32(CP_PFP_UCODE_ADDR, 0);
1200 for (i = 0; i < R700_PFP_UCODE_SIZE; i++)
1201 WREG32(CP_PFP_UCODE_DATA, be32_to_cpup(fw_data++));
1202 WREG32(CP_PFP_UCODE_ADDR, 0);
1204 fw_data = (const __be32 *)rdev->me_fw->data;
1205 WREG32(CP_ME_RAM_WADDR, 0);
1206 for (i = 0; i < R700_PM4_UCODE_SIZE; i++)
1207 WREG32(CP_ME_RAM_DATA, be32_to_cpup(fw_data++));
1209 WREG32(CP_PFP_UCODE_ADDR, 0);
1210 WREG32(CP_ME_RAM_WADDR, 0);
1211 WREG32(CP_ME_RAM_RADDR, 0);
1215 void r700_cp_fini(struct radeon_device *rdev)
1217 struct radeon_ring *ring = &rdev->ring[RADEON_RING_TYPE_GFX_INDEX];
1219 radeon_ring_fini(rdev, ring);
1220 radeon_scratch_free(rdev, ring->rptr_save_reg);
1226 static void rv770_gpu_init(struct radeon_device *rdev)
1228 int i, j, num_qd_pipes;
1233 u32 num_gs_verts_per_thread;
1235 u32 gs_prim_buffer_depth = 0;
1236 u32 sq_ms_fifo_sizes;
1238 u32 sq_thread_resource_mgmt;
1239 u32 hdp_host_path_cntl;
1240 u32 sq_dyn_gpr_size_simd_ab_0;
1241 u32 gb_tiling_config = 0;
1242 u32 cc_rb_backend_disable = 0;
1243 u32 cc_gc_shader_pipe_config = 0;
1246 u32 inactive_pipes, shader_pipe_config;
1247 u32 disabled_rb_mask;
1248 unsigned active_number;
1250 /* setup chip specs */
1251 rdev->config.rv770.tiling_group_size = 256;
1252 switch (rdev->family) {
1254 rdev->config.rv770.max_pipes = 4;
1255 rdev->config.rv770.max_tile_pipes = 8;
1256 rdev->config.rv770.max_simds = 10;
1257 rdev->config.rv770.max_backends = 4;
1258 rdev->config.rv770.max_gprs = 256;
1259 rdev->config.rv770.max_threads = 248;
1260 rdev->config.rv770.max_stack_entries = 512;
1261 rdev->config.rv770.max_hw_contexts = 8;
1262 rdev->config.rv770.max_gs_threads = 16 * 2;
1263 rdev->config.rv770.sx_max_export_size = 128;
1264 rdev->config.rv770.sx_max_export_pos_size = 16;
1265 rdev->config.rv770.sx_max_export_smx_size = 112;
1266 rdev->config.rv770.sq_num_cf_insts = 2;
1268 rdev->config.rv770.sx_num_of_sets = 7;
1269 rdev->config.rv770.sc_prim_fifo_size = 0xF9;
1270 rdev->config.rv770.sc_hiz_tile_fifo_size = 0x30;
1271 rdev->config.rv770.sc_earlyz_tile_fifo_fize = 0x130;
1274 rdev->config.rv770.max_pipes = 2;
1275 rdev->config.rv770.max_tile_pipes = 4;
1276 rdev->config.rv770.max_simds = 8;
1277 rdev->config.rv770.max_backends = 2;
1278 rdev->config.rv770.max_gprs = 128;
1279 rdev->config.rv770.max_threads = 248;
1280 rdev->config.rv770.max_stack_entries = 256;
1281 rdev->config.rv770.max_hw_contexts = 8;
1282 rdev->config.rv770.max_gs_threads = 16 * 2;
1283 rdev->config.rv770.sx_max_export_size = 256;
1284 rdev->config.rv770.sx_max_export_pos_size = 32;
1285 rdev->config.rv770.sx_max_export_smx_size = 224;
1286 rdev->config.rv770.sq_num_cf_insts = 2;
1288 rdev->config.rv770.sx_num_of_sets = 7;
1289 rdev->config.rv770.sc_prim_fifo_size = 0xf9;
1290 rdev->config.rv770.sc_hiz_tile_fifo_size = 0x30;
1291 rdev->config.rv770.sc_earlyz_tile_fifo_fize = 0x130;
1292 if (rdev->config.rv770.sx_max_export_pos_size > 16) {
1293 rdev->config.rv770.sx_max_export_pos_size -= 16;
1294 rdev->config.rv770.sx_max_export_smx_size += 16;
1298 rdev->config.rv770.max_pipes = 2;
1299 rdev->config.rv770.max_tile_pipes = 2;
1300 rdev->config.rv770.max_simds = 2;
1301 rdev->config.rv770.max_backends = 1;
1302 rdev->config.rv770.max_gprs = 256;
1303 rdev->config.rv770.max_threads = 192;
1304 rdev->config.rv770.max_stack_entries = 256;
1305 rdev->config.rv770.max_hw_contexts = 4;
1306 rdev->config.rv770.max_gs_threads = 8 * 2;
1307 rdev->config.rv770.sx_max_export_size = 128;
1308 rdev->config.rv770.sx_max_export_pos_size = 16;
1309 rdev->config.rv770.sx_max_export_smx_size = 112;
1310 rdev->config.rv770.sq_num_cf_insts = 1;
1312 rdev->config.rv770.sx_num_of_sets = 7;
1313 rdev->config.rv770.sc_prim_fifo_size = 0x40;
1314 rdev->config.rv770.sc_hiz_tile_fifo_size = 0x30;
1315 rdev->config.rv770.sc_earlyz_tile_fifo_fize = 0x130;
1318 rdev->config.rv770.max_pipes = 4;
1319 rdev->config.rv770.max_tile_pipes = 4;
1320 rdev->config.rv770.max_simds = 8;
1321 rdev->config.rv770.max_backends = 4;
1322 rdev->config.rv770.max_gprs = 256;
1323 rdev->config.rv770.max_threads = 248;
1324 rdev->config.rv770.max_stack_entries = 512;
1325 rdev->config.rv770.max_hw_contexts = 8;
1326 rdev->config.rv770.max_gs_threads = 16 * 2;
1327 rdev->config.rv770.sx_max_export_size = 256;
1328 rdev->config.rv770.sx_max_export_pos_size = 32;
1329 rdev->config.rv770.sx_max_export_smx_size = 224;
1330 rdev->config.rv770.sq_num_cf_insts = 2;
1332 rdev->config.rv770.sx_num_of_sets = 7;
1333 rdev->config.rv770.sc_prim_fifo_size = 0x100;
1334 rdev->config.rv770.sc_hiz_tile_fifo_size = 0x30;
1335 rdev->config.rv770.sc_earlyz_tile_fifo_fize = 0x130;
1337 if (rdev->config.rv770.sx_max_export_pos_size > 16) {
1338 rdev->config.rv770.sx_max_export_pos_size -= 16;
1339 rdev->config.rv770.sx_max_export_smx_size += 16;
1346 /* Initialize HDP */
1348 for (i = 0; i < 32; i++) {
1349 WREG32((0x2c14 + j), 0x00000000);
1350 WREG32((0x2c18 + j), 0x00000000);
1351 WREG32((0x2c1c + j), 0x00000000);
1352 WREG32((0x2c20 + j), 0x00000000);
1353 WREG32((0x2c24 + j), 0x00000000);
1357 WREG32(GRBM_CNTL, GRBM_READ_TIMEOUT(0xff));
1359 /* setup tiling, simd, pipe config */
1360 mc_arb_ramcfg = RREG32(MC_ARB_RAMCFG);
1362 shader_pipe_config = RREG32(CC_GC_SHADER_PIPE_CONFIG);
1363 inactive_pipes = (shader_pipe_config & INACTIVE_QD_PIPES_MASK) >> INACTIVE_QD_PIPES_SHIFT;
1364 for (i = 0, tmp = 1, active_number = 0; i < R7XX_MAX_PIPES; i++) {
1365 if (!(inactive_pipes & tmp)) {
1370 if (active_number == 1) {
1371 WREG32(SPI_CONFIG_CNTL, DISABLE_INTERP_1);
1373 WREG32(SPI_CONFIG_CNTL, 0);
1376 cc_rb_backend_disable = RREG32(CC_RB_BACKEND_DISABLE) & 0x00ff0000;
1377 tmp = R7XX_MAX_BACKENDS - r600_count_pipe_bits(cc_rb_backend_disable >> 16);
1378 if (tmp < rdev->config.rv770.max_backends) {
1379 rdev->config.rv770.max_backends = tmp;
1382 cc_gc_shader_pipe_config = RREG32(CC_GC_SHADER_PIPE_CONFIG) & 0xffffff00;
1383 tmp = R7XX_MAX_PIPES - r600_count_pipe_bits((cc_gc_shader_pipe_config >> 8) & R7XX_MAX_PIPES_MASK);
1384 if (tmp < rdev->config.rv770.max_pipes) {
1385 rdev->config.rv770.max_pipes = tmp;
1387 tmp = R7XX_MAX_SIMDS - r600_count_pipe_bits((cc_gc_shader_pipe_config >> 16) & R7XX_MAX_SIMDS_MASK);
1388 if (tmp < rdev->config.rv770.max_simds) {
1389 rdev->config.rv770.max_simds = tmp;
1392 switch (rdev->config.rv770.max_tile_pipes) {
1395 gb_tiling_config = PIPE_TILING(0);
1398 gb_tiling_config = PIPE_TILING(1);
1401 gb_tiling_config = PIPE_TILING(2);
1404 gb_tiling_config = PIPE_TILING(3);
1407 rdev->config.rv770.tiling_npipes = rdev->config.rv770.max_tile_pipes;
1409 disabled_rb_mask = (RREG32(CC_RB_BACKEND_DISABLE) >> 16) & R7XX_MAX_BACKENDS_MASK;
1410 tmp = (gb_tiling_config & PIPE_TILING__MASK) >> PIPE_TILING__SHIFT;
1411 tmp = r6xx_remap_render_backend(rdev, tmp, rdev->config.rv770.max_backends,
1412 R7XX_MAX_BACKENDS, disabled_rb_mask);
1413 gb_tiling_config |= tmp << 16;
1414 rdev->config.rv770.backend_map = tmp;
1416 if (rdev->family == CHIP_RV770)
1417 gb_tiling_config |= BANK_TILING(1);
1419 if ((mc_arb_ramcfg & NOOFBANK_MASK) >> NOOFBANK_SHIFT)
1420 gb_tiling_config |= BANK_TILING(1);
1422 gb_tiling_config |= BANK_TILING(0);
1424 rdev->config.rv770.tiling_nbanks = 4 << ((gb_tiling_config >> 4) & 0x3);
1425 gb_tiling_config |= GROUP_SIZE((mc_arb_ramcfg & BURSTLENGTH_MASK) >> BURSTLENGTH_SHIFT);
1426 if (((mc_arb_ramcfg & NOOFROWS_MASK) >> NOOFROWS_SHIFT) > 3) {
1427 gb_tiling_config |= ROW_TILING(3);
1428 gb_tiling_config |= SAMPLE_SPLIT(3);
1431 ROW_TILING(((mc_arb_ramcfg & NOOFROWS_MASK) >> NOOFROWS_SHIFT));
1433 SAMPLE_SPLIT(((mc_arb_ramcfg & NOOFROWS_MASK) >> NOOFROWS_SHIFT));
1436 gb_tiling_config |= BANK_SWAPS(1);
1437 rdev->config.rv770.tile_config = gb_tiling_config;
1439 WREG32(GB_TILING_CONFIG, gb_tiling_config);
1440 WREG32(DCP_TILING_CONFIG, (gb_tiling_config & 0xffff));
1441 WREG32(HDP_TILING_CONFIG, (gb_tiling_config & 0xffff));
1442 WREG32(DMA_TILING_CONFIG, (gb_tiling_config & 0xffff));
1443 WREG32(DMA_TILING_CONFIG2, (gb_tiling_config & 0xffff));
1444 if (rdev->family == CHIP_RV730) {
1445 WREG32(UVD_UDEC_DB_TILING_CONFIG, (gb_tiling_config & 0xffff));
1446 WREG32(UVD_UDEC_DBW_TILING_CONFIG, (gb_tiling_config & 0xffff));
1447 WREG32(UVD_UDEC_TILING_CONFIG, (gb_tiling_config & 0xffff));
1450 WREG32(CGTS_SYS_TCC_DISABLE, 0);
1451 WREG32(CGTS_TCC_DISABLE, 0);
1452 WREG32(CGTS_USER_SYS_TCC_DISABLE, 0);
1453 WREG32(CGTS_USER_TCC_DISABLE, 0);
1456 num_qd_pipes = R7XX_MAX_PIPES - r600_count_pipe_bits((cc_gc_shader_pipe_config & INACTIVE_QD_PIPES_MASK) >> 8);
1457 WREG32(VGT_OUT_DEALLOC_CNTL, (num_qd_pipes * 4) & DEALLOC_DIST_MASK);
1458 WREG32(VGT_VERTEX_REUSE_BLOCK_CNTL, ((num_qd_pipes * 4) - 2) & VTX_REUSE_DEPTH_MASK);
1460 /* set HW defaults for 3D engine */
1461 WREG32(CP_QUEUE_THRESHOLDS, (ROQ_IB1_START(0x16) |
1462 ROQ_IB2_START(0x2b)));
1464 WREG32(CP_MEQ_THRESHOLDS, STQ_SPLIT(0x30));
1466 ta_aux_cntl = RREG32(TA_CNTL_AUX);
1467 WREG32(TA_CNTL_AUX, ta_aux_cntl | DISABLE_CUBE_ANISO);
1469 sx_debug_1 = RREG32(SX_DEBUG_1);
1470 sx_debug_1 |= ENABLE_NEW_SMX_ADDRESS;
1471 WREG32(SX_DEBUG_1, sx_debug_1);
1473 smx_dc_ctl0 = RREG32(SMX_DC_CTL0);
1474 smx_dc_ctl0 &= ~CACHE_DEPTH(0x1ff);
1475 smx_dc_ctl0 |= CACHE_DEPTH((rdev->config.rv770.sx_num_of_sets * 64) - 1);
1476 WREG32(SMX_DC_CTL0, smx_dc_ctl0);
1478 if (rdev->family != CHIP_RV740)
1479 WREG32(SMX_EVENT_CTL, (ES_FLUSH_CTL(4) |
1484 if (rdev->family != CHIP_RV770)
1485 WREG32(SMX_SAR_CTL0, 0x00003f3f);
1487 db_debug3 = RREG32(DB_DEBUG3);
1488 db_debug3 &= ~DB_CLK_OFF_DELAY(0x1f);
1489 switch (rdev->family) {
1492 db_debug3 |= DB_CLK_OFF_DELAY(0x1f);
1497 db_debug3 |= DB_CLK_OFF_DELAY(2);
1500 WREG32(DB_DEBUG3, db_debug3);
1502 if (rdev->family != CHIP_RV770) {
1503 db_debug4 = RREG32(DB_DEBUG4);
1504 db_debug4 |= DISABLE_TILE_COVERED_FOR_PS_ITER;
1505 WREG32(DB_DEBUG4, db_debug4);
1508 WREG32(SX_EXPORT_BUFFER_SIZES, (COLOR_BUFFER_SIZE((rdev->config.rv770.sx_max_export_size / 4) - 1) |
1509 POSITION_BUFFER_SIZE((rdev->config.rv770.sx_max_export_pos_size / 4) - 1) |
1510 SMX_BUFFER_SIZE((rdev->config.rv770.sx_max_export_smx_size / 4) - 1)));
1512 WREG32(PA_SC_FIFO_SIZE, (SC_PRIM_FIFO_SIZE(rdev->config.rv770.sc_prim_fifo_size) |
1513 SC_HIZ_TILE_FIFO_SIZE(rdev->config.rv770.sc_hiz_tile_fifo_size) |
1514 SC_EARLYZ_TILE_FIFO_SIZE(rdev->config.rv770.sc_earlyz_tile_fifo_fize)));
1516 WREG32(PA_SC_MULTI_CHIP_CNTL, 0);
1518 WREG32(VGT_NUM_INSTANCES, 1);
1520 WREG32(SPI_CONFIG_CNTL_1, VTX_DONE_DELAY(4));
1522 WREG32(CP_PERFMON_CNTL, 0);
1524 sq_ms_fifo_sizes = (CACHE_FIFO_SIZE(16 * rdev->config.rv770.sq_num_cf_insts) |
1525 DONE_FIFO_HIWATER(0xe0) |
1526 ALU_UPDATE_FIFO_HIWATER(0x8));
1527 switch (rdev->family) {
1531 sq_ms_fifo_sizes |= FETCH_FIFO_HIWATER(0x1);
1535 sq_ms_fifo_sizes |= FETCH_FIFO_HIWATER(0x4);
1538 WREG32(SQ_MS_FIFO_SIZES, sq_ms_fifo_sizes);
1540 /* SQ_CONFIG, SQ_GPR_RESOURCE_MGMT, SQ_THREAD_RESOURCE_MGMT, SQ_STACK_RESOURCE_MGMT
1541 * should be adjusted as needed by the 2D/3D drivers. This just sets default values
1543 sq_config = RREG32(SQ_CONFIG);
1544 sq_config &= ~(PS_PRIO(3) |
1548 sq_config |= (DX9_CONSTS |
1555 if (rdev->family == CHIP_RV710)
1556 /* no vertex cache */
1557 sq_config &= ~VC_ENABLE;
1559 WREG32(SQ_CONFIG, sq_config);
1561 WREG32(SQ_GPR_RESOURCE_MGMT_1, (NUM_PS_GPRS((rdev->config.rv770.max_gprs * 24)/64) |
1562 NUM_VS_GPRS((rdev->config.rv770.max_gprs * 24)/64) |
1563 NUM_CLAUSE_TEMP_GPRS(((rdev->config.rv770.max_gprs * 24)/64)/2)));
1565 WREG32(SQ_GPR_RESOURCE_MGMT_2, (NUM_GS_GPRS((rdev->config.rv770.max_gprs * 7)/64) |
1566 NUM_ES_GPRS((rdev->config.rv770.max_gprs * 7)/64)));
1568 sq_thread_resource_mgmt = (NUM_PS_THREADS((rdev->config.rv770.max_threads * 4)/8) |
1569 NUM_VS_THREADS((rdev->config.rv770.max_threads * 2)/8) |
1570 NUM_ES_THREADS((rdev->config.rv770.max_threads * 1)/8));
1571 if (((rdev->config.rv770.max_threads * 1) / 8) > rdev->config.rv770.max_gs_threads)
1572 sq_thread_resource_mgmt |= NUM_GS_THREADS(rdev->config.rv770.max_gs_threads);
1574 sq_thread_resource_mgmt |= NUM_GS_THREADS((rdev->config.rv770.max_gs_threads * 1)/8);
1575 WREG32(SQ_THREAD_RESOURCE_MGMT, sq_thread_resource_mgmt);
1577 WREG32(SQ_STACK_RESOURCE_MGMT_1, (NUM_PS_STACK_ENTRIES((rdev->config.rv770.max_stack_entries * 1)/4) |
1578 NUM_VS_STACK_ENTRIES((rdev->config.rv770.max_stack_entries * 1)/4)));
1580 WREG32(SQ_STACK_RESOURCE_MGMT_2, (NUM_GS_STACK_ENTRIES((rdev->config.rv770.max_stack_entries * 1)/4) |
1581 NUM_ES_STACK_ENTRIES((rdev->config.rv770.max_stack_entries * 1)/4)));
1583 sq_dyn_gpr_size_simd_ab_0 = (SIMDA_RING0((rdev->config.rv770.max_gprs * 38)/64) |
1584 SIMDA_RING1((rdev->config.rv770.max_gprs * 38)/64) |
1585 SIMDB_RING0((rdev->config.rv770.max_gprs * 38)/64) |
1586 SIMDB_RING1((rdev->config.rv770.max_gprs * 38)/64));
1588 WREG32(SQ_DYN_GPR_SIZE_SIMD_AB_0, sq_dyn_gpr_size_simd_ab_0);
1589 WREG32(SQ_DYN_GPR_SIZE_SIMD_AB_1, sq_dyn_gpr_size_simd_ab_0);
1590 WREG32(SQ_DYN_GPR_SIZE_SIMD_AB_2, sq_dyn_gpr_size_simd_ab_0);
1591 WREG32(SQ_DYN_GPR_SIZE_SIMD_AB_3, sq_dyn_gpr_size_simd_ab_0);
1592 WREG32(SQ_DYN_GPR_SIZE_SIMD_AB_4, sq_dyn_gpr_size_simd_ab_0);
1593 WREG32(SQ_DYN_GPR_SIZE_SIMD_AB_5, sq_dyn_gpr_size_simd_ab_0);
1594 WREG32(SQ_DYN_GPR_SIZE_SIMD_AB_6, sq_dyn_gpr_size_simd_ab_0);
1595 WREG32(SQ_DYN_GPR_SIZE_SIMD_AB_7, sq_dyn_gpr_size_simd_ab_0);
1597 WREG32(PA_SC_FORCE_EOV_MAX_CNTS, (FORCE_EOV_MAX_CLK_CNT(4095) |
1598 FORCE_EOV_MAX_REZ_CNT(255)));
1600 if (rdev->family == CHIP_RV710)
1601 WREG32(VGT_CACHE_INVALIDATION, (CACHE_INVALIDATION(TC_ONLY) |
1602 AUTO_INVLD_EN(ES_AND_GS_AUTO)));
1604 WREG32(VGT_CACHE_INVALIDATION, (CACHE_INVALIDATION(VC_AND_TC) |
1605 AUTO_INVLD_EN(ES_AND_GS_AUTO)));
1607 switch (rdev->family) {
1611 gs_prim_buffer_depth = 384;
1614 gs_prim_buffer_depth = 128;
1620 num_gs_verts_per_thread = rdev->config.rv770.max_pipes * 16;
1621 vgt_gs_per_es = gs_prim_buffer_depth + num_gs_verts_per_thread;
1622 /* Max value for this is 256 */
1623 if (vgt_gs_per_es > 256)
1624 vgt_gs_per_es = 256;
1626 WREG32(VGT_ES_PER_GS, 128);
1627 WREG32(VGT_GS_PER_ES, vgt_gs_per_es);
1628 WREG32(VGT_GS_PER_VS, 2);
1630 /* more default values. 2D/3D driver should adjust as needed */
1631 WREG32(VGT_GS_VERTEX_REUSE, 16);
1632 WREG32(PA_SC_LINE_STIPPLE_STATE, 0);
1633 WREG32(VGT_STRMOUT_EN, 0);
1635 WREG32(PA_SC_MODE_CNTL, 0);
1636 WREG32(PA_SC_EDGERULE, 0xaaaaaaaa);
1637 WREG32(PA_SC_AA_CONFIG, 0);
1638 WREG32(PA_SC_CLIPRECT_RULE, 0xffff);
1639 WREG32(PA_SC_LINE_STIPPLE, 0);
1640 WREG32(SPI_INPUT_Z, 0);
1641 WREG32(SPI_PS_IN_CONTROL_0, NUM_INTERP(2));
1642 WREG32(CB_COLOR7_FRAG, 0);
1644 /* clear render buffer base addresses */
1645 WREG32(CB_COLOR0_BASE, 0);
1646 WREG32(CB_COLOR1_BASE, 0);
1647 WREG32(CB_COLOR2_BASE, 0);
1648 WREG32(CB_COLOR3_BASE, 0);
1649 WREG32(CB_COLOR4_BASE, 0);
1650 WREG32(CB_COLOR5_BASE, 0);
1651 WREG32(CB_COLOR6_BASE, 0);
1652 WREG32(CB_COLOR7_BASE, 0);
1654 WREG32(TCP_CNTL, 0);
1656 hdp_host_path_cntl = RREG32(HDP_HOST_PATH_CNTL);
1657 WREG32(HDP_HOST_PATH_CNTL, hdp_host_path_cntl);
1659 WREG32(PA_SC_MULTI_CHIP_CNTL, 0);
1661 WREG32(PA_CL_ENHANCE, (CLIP_VTX_REORDER_ENA |
1663 WREG32(VC_ENHANCE, 0);
1666 void r700_vram_gtt_location(struct radeon_device *rdev, struct radeon_mc *mc)
1668 u64 size_bf, size_af;
1670 if (mc->mc_vram_size > 0xE0000000) {
1671 /* leave room for at least 512M GTT */
1672 dev_warn(rdev->dev, "limiting VRAM\n");
1673 mc->real_vram_size = 0xE0000000;
1674 mc->mc_vram_size = 0xE0000000;
1676 if (rdev->flags & RADEON_IS_AGP) {
1677 size_bf = mc->gtt_start;
1678 size_af = mc->mc_mask - mc->gtt_end;
1679 if (size_bf > size_af) {
1680 if (mc->mc_vram_size > size_bf) {
1681 dev_warn(rdev->dev, "limiting VRAM\n");
1682 mc->real_vram_size = size_bf;
1683 mc->mc_vram_size = size_bf;
1685 mc->vram_start = mc->gtt_start - mc->mc_vram_size;
1687 if (mc->mc_vram_size > size_af) {
1688 dev_warn(rdev->dev, "limiting VRAM\n");
1689 mc->real_vram_size = size_af;
1690 mc->mc_vram_size = size_af;
1692 mc->vram_start = mc->gtt_end + 1;
1694 mc->vram_end = mc->vram_start + mc->mc_vram_size - 1;
1695 dev_info(rdev->dev, "VRAM: %lluM 0x%08llX - 0x%08llX (%lluM used)\n",
1696 mc->mc_vram_size >> 20, mc->vram_start,
1697 mc->vram_end, mc->real_vram_size >> 20);
1699 radeon_vram_location(rdev, &rdev->mc, 0);
1700 rdev->mc.gtt_base_align = 0;
1701 radeon_gtt_location(rdev, mc);
1705 static int rv770_mc_init(struct radeon_device *rdev)
1708 int chansize, numchan;
1710 /* Get VRAM informations */
1711 rdev->mc.vram_is_ddr = true;
1712 tmp = RREG32(MC_ARB_RAMCFG);
1713 if (tmp & CHANSIZE_OVERRIDE) {
1715 } else if (tmp & CHANSIZE_MASK) {
1720 tmp = RREG32(MC_SHARED_CHMAP);
1721 switch ((tmp & NOOFCHAN_MASK) >> NOOFCHAN_SHIFT) {
1736 rdev->mc.vram_width = numchan * chansize;
1737 /* Could aper size report 0 ? */
1738 rdev->mc.aper_base = pci_resource_start(rdev->pdev, 0);
1739 rdev->mc.aper_size = pci_resource_len(rdev->pdev, 0);
1740 /* Setup GPU memory space */
1741 rdev->mc.mc_vram_size = RREG32(CONFIG_MEMSIZE);
1742 rdev->mc.real_vram_size = RREG32(CONFIG_MEMSIZE);
1743 rdev->mc.visible_vram_size = rdev->mc.aper_size;
1744 r700_vram_gtt_location(rdev, &rdev->mc);
1745 radeon_update_bandwidth_info(rdev);
1751 * rv770_copy_dma - copy pages using the DMA engine
1753 * @rdev: radeon_device pointer
1754 * @src_offset: src GPU address
1755 * @dst_offset: dst GPU address
1756 * @num_gpu_pages: number of GPU pages to xfer
1757 * @fence: radeon fence object
1759 * Copy GPU paging using the DMA engine (r7xx).
1760 * Used by the radeon ttm implementation to move pages if
1761 * registered as the asic copy callback.
1763 int rv770_copy_dma(struct radeon_device *rdev,
1764 uint64_t src_offset, uint64_t dst_offset,
1765 unsigned num_gpu_pages,
1766 struct radeon_fence **fence)
1768 struct radeon_semaphore *sem = NULL;
1769 int ring_index = rdev->asic->copy.dma_ring_index;
1770 struct radeon_ring *ring = &rdev->ring[ring_index];
1771 u32 size_in_dw, cur_size_in_dw;
1775 r = radeon_semaphore_create(rdev, &sem);
1777 DRM_ERROR("radeon: moving bo (%d).\n", r);
1781 size_in_dw = (num_gpu_pages << RADEON_GPU_PAGE_SHIFT) / 4;
1782 num_loops = DIV_ROUND_UP(size_in_dw, 0xFFFF);
1783 r = radeon_ring_lock(rdev, ring, num_loops * 5 + 8);
1785 DRM_ERROR("radeon: moving bo (%d).\n", r);
1786 radeon_semaphore_free(rdev, &sem, NULL);
1790 if (radeon_fence_need_sync(*fence, ring->idx)) {
1791 radeon_semaphore_sync_rings(rdev, sem, (*fence)->ring,
1793 radeon_fence_note_sync(*fence, ring->idx);
1795 radeon_semaphore_free(rdev, &sem, NULL);
1798 for (i = 0; i < num_loops; i++) {
1799 cur_size_in_dw = size_in_dw;
1800 if (cur_size_in_dw > 0xFFFF)
1801 cur_size_in_dw = 0xFFFF;
1802 size_in_dw -= cur_size_in_dw;
1803 radeon_ring_write(ring, DMA_PACKET(DMA_PACKET_COPY, 0, 0, cur_size_in_dw));
1804 radeon_ring_write(ring, dst_offset & 0xfffffffc);
1805 radeon_ring_write(ring, src_offset & 0xfffffffc);
1806 radeon_ring_write(ring, upper_32_bits(dst_offset) & 0xff);
1807 radeon_ring_write(ring, upper_32_bits(src_offset) & 0xff);
1808 src_offset += cur_size_in_dw * 4;
1809 dst_offset += cur_size_in_dw * 4;
1812 r = radeon_fence_emit(rdev, fence, ring->idx);
1814 radeon_ring_unlock_undo(rdev, ring);
1818 radeon_ring_unlock_commit(rdev, ring);
1819 radeon_semaphore_free(rdev, &sem, *fence);
1824 static int rv770_startup(struct radeon_device *rdev)
1826 struct radeon_ring *ring;
1829 /* enable pcie gen2 link */
1830 rv770_pcie_gen2_enable(rdev);
1832 rv770_mc_program(rdev);
1834 if (!rdev->me_fw || !rdev->pfp_fw || !rdev->rlc_fw) {
1835 r = r600_init_microcode(rdev);
1837 DRM_ERROR("Failed to load firmware!\n");
1842 r = r600_vram_scratch_init(rdev);
1846 if (rdev->flags & RADEON_IS_AGP) {
1847 rv770_agp_enable(rdev);
1849 r = rv770_pcie_gart_enable(rdev);
1854 rv770_gpu_init(rdev);
1855 r = r600_blit_init(rdev);
1857 r600_blit_fini(rdev);
1858 rdev->asic->copy.copy = NULL;
1859 dev_warn(rdev->dev, "failed blitter (%d) falling back to memcpy\n", r);
1862 /* allocate wb buffer */
1863 r = radeon_wb_init(rdev);
1867 r = radeon_fence_driver_start_ring(rdev, RADEON_RING_TYPE_GFX_INDEX);
1869 dev_err(rdev->dev, "failed initializing CP fences (%d).\n", r);
1873 r = radeon_fence_driver_start_ring(rdev, R600_RING_TYPE_DMA_INDEX);
1875 dev_err(rdev->dev, "failed initializing DMA fences (%d).\n", r);
1879 r = rv770_uvd_resume(rdev);
1881 r = radeon_fence_driver_start_ring(rdev,
1882 R600_RING_TYPE_UVD_INDEX);
1884 dev_err(rdev->dev, "UVD fences init error (%d).\n", r);
1888 rdev->ring[R600_RING_TYPE_UVD_INDEX].ring_size = 0;
1891 if (!rdev->irq.installed) {
1892 r = radeon_irq_kms_init(rdev);
1897 r = r600_irq_init(rdev);
1899 DRM_ERROR("radeon: IH init failed (%d).\n", r);
1900 radeon_irq_kms_fini(rdev);
1905 ring = &rdev->ring[RADEON_RING_TYPE_GFX_INDEX];
1906 r = radeon_ring_init(rdev, ring, ring->ring_size, RADEON_WB_CP_RPTR_OFFSET,
1907 R600_CP_RB_RPTR, R600_CP_RB_WPTR,
1908 0, 0xfffff, RADEON_CP_PACKET2);
1912 ring = &rdev->ring[R600_RING_TYPE_DMA_INDEX];
1913 r = radeon_ring_init(rdev, ring, ring->ring_size, R600_WB_DMA_RPTR_OFFSET,
1914 DMA_RB_RPTR, DMA_RB_WPTR,
1915 2, 0x3fffc, DMA_PACKET(DMA_PACKET_NOP, 0, 0, 0));
1919 r = rv770_cp_load_microcode(rdev);
1922 r = r600_cp_resume(rdev);
1926 r = r600_dma_resume(rdev);
1930 ring = &rdev->ring[R600_RING_TYPE_UVD_INDEX];
1931 if (ring->ring_size) {
1932 r = radeon_ring_init(rdev, ring, ring->ring_size,
1933 R600_WB_UVD_RPTR_OFFSET,
1934 UVD_RBC_RB_RPTR, UVD_RBC_RB_WPTR,
1935 0, 0xfffff, RADEON_CP_PACKET2);
1937 r = r600_uvd_init(rdev);
1940 DRM_ERROR("radeon: failed initializing UVD (%d).\n", r);
1943 r = radeon_ib_pool_init(rdev);
1945 dev_err(rdev->dev, "IB initialization failed (%d).\n", r);
1949 r = r600_audio_init(rdev);
1951 DRM_ERROR("radeon: audio init failed\n");
1958 int rv770_resume(struct radeon_device *rdev)
1962 /* Do not reset GPU before posting, on rv770 hw unlike on r500 hw,
1963 * posting will perform necessary task to bring back GPU into good
1967 atom_asic_init(rdev->mode_info.atom_context);
1969 /* init golden registers */
1970 rv770_init_golden_registers(rdev);
1972 rdev->accel_working = true;
1973 r = rv770_startup(rdev);
1975 DRM_ERROR("r600 startup failed on resume\n");
1976 rdev->accel_working = false;
1984 int rv770_suspend(struct radeon_device *rdev)
1986 r600_audio_fini(rdev);
1987 r600_uvd_stop(rdev);
1988 radeon_uvd_suspend(rdev);
1990 r600_dma_stop(rdev);
1991 r600_irq_suspend(rdev);
1992 radeon_wb_disable(rdev);
1993 rv770_pcie_gart_disable(rdev);
1998 /* Plan is to move initialization in that function and use
1999 * helper function so that radeon_device_init pretty much
2000 * do nothing more than calling asic specific function. This
2001 * should also allow to remove a bunch of callback function
2004 int rv770_init(struct radeon_device *rdev)
2009 if (!radeon_get_bios(rdev)) {
2010 if (ASIC_IS_AVIVO(rdev))
2013 /* Must be an ATOMBIOS */
2014 if (!rdev->is_atom_bios) {
2015 dev_err(rdev->dev, "Expecting atombios for R600 GPU\n");
2018 r = radeon_atombios_init(rdev);
2021 /* Post card if necessary */
2022 if (!radeon_card_posted(rdev)) {
2024 dev_err(rdev->dev, "Card not posted and no BIOS - ignoring\n");
2027 DRM_INFO("GPU not posted. posting now...\n");
2028 atom_asic_init(rdev->mode_info.atom_context);
2030 /* init golden registers */
2031 rv770_init_golden_registers(rdev);
2032 /* Initialize scratch registers */
2033 r600_scratch_init(rdev);
2034 /* Initialize surface registers */
2035 radeon_surface_init(rdev);
2036 /* Initialize clocks */
2037 radeon_get_clock_info(rdev->ddev);
2039 r = radeon_fence_driver_init(rdev);
2042 /* initialize AGP */
2043 if (rdev->flags & RADEON_IS_AGP) {
2044 r = radeon_agp_init(rdev);
2046 radeon_agp_disable(rdev);
2048 r = rv770_mc_init(rdev);
2051 /* Memory manager */
2052 r = radeon_bo_init(rdev);
2056 rdev->ring[RADEON_RING_TYPE_GFX_INDEX].ring_obj = NULL;
2057 r600_ring_init(rdev, &rdev->ring[RADEON_RING_TYPE_GFX_INDEX], 1024 * 1024);
2059 rdev->ring[R600_RING_TYPE_DMA_INDEX].ring_obj = NULL;
2060 r600_ring_init(rdev, &rdev->ring[R600_RING_TYPE_DMA_INDEX], 64 * 1024);
2062 r = radeon_uvd_init(rdev);
2064 rdev->ring[R600_RING_TYPE_UVD_INDEX].ring_obj = NULL;
2065 r600_ring_init(rdev, &rdev->ring[R600_RING_TYPE_UVD_INDEX],
2069 rdev->ih.ring_obj = NULL;
2070 r600_ih_ring_init(rdev, 64 * 1024);
2072 r = r600_pcie_gart_init(rdev);
2076 rdev->accel_working = true;
2077 r = rv770_startup(rdev);
2079 dev_err(rdev->dev, "disabling GPU acceleration\n");
2081 r600_dma_fini(rdev);
2082 r600_irq_fini(rdev);
2083 radeon_wb_fini(rdev);
2084 radeon_ib_pool_fini(rdev);
2085 radeon_irq_kms_fini(rdev);
2086 rv770_pcie_gart_fini(rdev);
2087 rdev->accel_working = false;
2093 void rv770_fini(struct radeon_device *rdev)
2095 r600_blit_fini(rdev);
2097 r600_dma_fini(rdev);
2098 r600_irq_fini(rdev);
2099 radeon_wb_fini(rdev);
2100 radeon_ib_pool_fini(rdev);
2101 radeon_irq_kms_fini(rdev);
2102 rv770_pcie_gart_fini(rdev);
2103 r600_uvd_stop(rdev);
2104 radeon_uvd_fini(rdev);
2105 r600_vram_scratch_fini(rdev);
2106 radeon_gem_fini(rdev);
2107 radeon_fence_driver_fini(rdev);
2108 radeon_agp_fini(rdev);
2109 radeon_bo_fini(rdev);
2110 radeon_atombios_fini(rdev);
2115 static void rv770_pcie_gen2_enable(struct radeon_device *rdev)
2117 u32 link_width_cntl, lanes, speed_cntl, tmp;
2120 if (radeon_pcie_gen2 == 0)
2123 if (rdev->flags & RADEON_IS_IGP)
2126 if (!(rdev->flags & RADEON_IS_PCIE))
2129 /* x2 cards have a special sequence */
2130 if (ASIC_IS_X2(rdev))
2133 if ((rdev->pdev->bus->max_bus_speed != PCIE_SPEED_5_0GT) &&
2134 (rdev->pdev->bus->max_bus_speed != PCIE_SPEED_8_0GT))
2137 DRM_INFO("enabling PCIE gen 2 link speeds, disable with radeon.pcie_gen2=0\n");
2139 /* advertise upconfig capability */
2140 link_width_cntl = RREG32_PCIE_PORT(PCIE_LC_LINK_WIDTH_CNTL);
2141 link_width_cntl &= ~LC_UPCONFIGURE_DIS;
2142 WREG32_PCIE_PORT(PCIE_LC_LINK_WIDTH_CNTL, link_width_cntl);
2143 link_width_cntl = RREG32_PCIE_PORT(PCIE_LC_LINK_WIDTH_CNTL);
2144 if (link_width_cntl & LC_RENEGOTIATION_SUPPORT) {
2145 lanes = (link_width_cntl & LC_LINK_WIDTH_RD_MASK) >> LC_LINK_WIDTH_RD_SHIFT;
2146 link_width_cntl &= ~(LC_LINK_WIDTH_MASK |
2147 LC_RECONFIG_ARC_MISSING_ESCAPE);
2148 link_width_cntl |= lanes | LC_RECONFIG_NOW |
2149 LC_RENEGOTIATE_EN | LC_UPCONFIGURE_SUPPORT;
2150 WREG32_PCIE_PORT(PCIE_LC_LINK_WIDTH_CNTL, link_width_cntl);
2152 link_width_cntl |= LC_UPCONFIGURE_DIS;
2153 WREG32_PCIE_PORT(PCIE_LC_LINK_WIDTH_CNTL, link_width_cntl);
2156 speed_cntl = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
2157 if ((speed_cntl & LC_OTHER_SIDE_EVER_SENT_GEN2) &&
2158 (speed_cntl & LC_OTHER_SIDE_SUPPORTS_GEN2)) {
2160 tmp = RREG32(0x541c);
2161 WREG32(0x541c, tmp | 0x8);
2162 WREG32(MM_CFGREGS_CNTL, MM_WR_TO_CFG_EN);
2163 link_cntl2 = RREG16(0x4088);
2164 link_cntl2 &= ~TARGET_LINK_SPEED_MASK;
2166 WREG16(0x4088, link_cntl2);
2167 WREG32(MM_CFGREGS_CNTL, 0);
2169 speed_cntl = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
2170 speed_cntl &= ~LC_TARGET_LINK_SPEED_OVERRIDE_EN;
2171 WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, speed_cntl);
2173 speed_cntl = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
2174 speed_cntl |= LC_CLR_FAILED_SPD_CHANGE_CNT;
2175 WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, speed_cntl);
2177 speed_cntl = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
2178 speed_cntl &= ~LC_CLR_FAILED_SPD_CHANGE_CNT;
2179 WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, speed_cntl);
2181 speed_cntl = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
2182 speed_cntl |= LC_GEN2_EN_STRAP;
2183 WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, speed_cntl);
2186 link_width_cntl = RREG32_PCIE_PORT(PCIE_LC_LINK_WIDTH_CNTL);
2187 /* XXX: only disable it if gen1 bridge vendor == 0x111d or 0x1106 */
2189 link_width_cntl |= LC_UPCONFIGURE_DIS;
2191 link_width_cntl &= ~LC_UPCONFIGURE_DIS;
2192 WREG32_PCIE_PORT(PCIE_LC_LINK_WIDTH_CNTL, link_width_cntl);