blob: 7969c0c8ec200be015909a3dada502c0b09af024 [file] [log] [blame]
Alex Deucher0af62b02011-01-06 21:19:31 -05001/*
2 * Copyright 2010 Advanced Micro Devices, Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
21 *
22 * Authors: Alex Deucher
23 */
24#include <linux/firmware.h>
25#include <linux/platform_device.h>
26#include <linux/slab.h>
Paul Gortmakere0cd3602011-08-30 11:04:30 -040027#include <linux/module.h>
David Howells760285e2012-10-02 18:01:07 +010028#include <drm/drmP.h>
Alex Deucher0af62b02011-01-06 21:19:31 -050029#include "radeon.h"
30#include "radeon_asic.h"
David Howells760285e2012-10-02 18:01:07 +010031#include <drm/radeon_drm.h>
Alex Deucher0af62b02011-01-06 21:19:31 -050032#include "nid.h"
33#include "atom.h"
34#include "ni_reg.h"
Alex Deucher0c88a022011-03-02 20:07:31 -050035#include "cayman_blit_shaders.h"
Alex Deucher0af62b02011-01-06 21:19:31 -050036
Alex Deucher168757e2013-01-18 19:17:22 -050037extern bool evergreen_is_display_hung(struct radeon_device *rdev);
Alex Deucher187e3592013-01-18 14:51:38 -050038extern void evergreen_print_gpu_status_regs(struct radeon_device *rdev);
Alex Deucherb9952a82011-03-02 20:07:33 -050039extern void evergreen_mc_stop(struct radeon_device *rdev, struct evergreen_mc_save *save);
40extern void evergreen_mc_resume(struct radeon_device *rdev, struct evergreen_mc_save *save);
41extern int evergreen_mc_wait_for_idle(struct radeon_device *rdev);
Alex Deucher755d8192011-03-02 20:07:34 -050042extern void evergreen_mc_program(struct radeon_device *rdev);
43extern void evergreen_irq_suspend(struct radeon_device *rdev);
44extern int evergreen_mc_init(struct radeon_device *rdev);
Alex Deucherd054ac12011-09-01 17:46:15 +000045extern void evergreen_fix_pci_max_read_req_size(struct radeon_device *rdev);
Ilija Hadzicb07759b2011-09-20 10:22:58 -040046extern void evergreen_pcie_gen2_enable(struct radeon_device *rdev);
Alex Deucherc420c742012-03-20 17:18:39 -040047extern void si_rlc_fini(struct radeon_device *rdev);
48extern int si_rlc_init(struct radeon_device *rdev);
Alex Deucherb9952a82011-03-02 20:07:33 -050049
Alex Deucher0af62b02011-01-06 21:19:31 -050050#define EVERGREEN_PFP_UCODE_SIZE 1120
51#define EVERGREEN_PM4_UCODE_SIZE 1376
52#define EVERGREEN_RLC_UCODE_SIZE 768
53#define BTC_MC_UCODE_SIZE 6024
54
Alex Deucher9b8253c2011-03-02 20:07:28 -050055#define CAYMAN_PFP_UCODE_SIZE 2176
56#define CAYMAN_PM4_UCODE_SIZE 2176
57#define CAYMAN_RLC_UCODE_SIZE 1024
58#define CAYMAN_MC_UCODE_SIZE 6037
59
Alex Deucherc420c742012-03-20 17:18:39 -040060#define ARUBA_RLC_UCODE_SIZE 1536
61
Alex Deucher0af62b02011-01-06 21:19:31 -050062/* Firmware Names */
63MODULE_FIRMWARE("radeon/BARTS_pfp.bin");
64MODULE_FIRMWARE("radeon/BARTS_me.bin");
65MODULE_FIRMWARE("radeon/BARTS_mc.bin");
66MODULE_FIRMWARE("radeon/BTC_rlc.bin");
67MODULE_FIRMWARE("radeon/TURKS_pfp.bin");
68MODULE_FIRMWARE("radeon/TURKS_me.bin");
69MODULE_FIRMWARE("radeon/TURKS_mc.bin");
70MODULE_FIRMWARE("radeon/CAICOS_pfp.bin");
71MODULE_FIRMWARE("radeon/CAICOS_me.bin");
72MODULE_FIRMWARE("radeon/CAICOS_mc.bin");
Alex Deucher9b8253c2011-03-02 20:07:28 -050073MODULE_FIRMWARE("radeon/CAYMAN_pfp.bin");
74MODULE_FIRMWARE("radeon/CAYMAN_me.bin");
75MODULE_FIRMWARE("radeon/CAYMAN_mc.bin");
76MODULE_FIRMWARE("radeon/CAYMAN_rlc.bin");
Alex Deucherc420c742012-03-20 17:18:39 -040077MODULE_FIRMWARE("radeon/ARUBA_pfp.bin");
78MODULE_FIRMWARE("radeon/ARUBA_me.bin");
79MODULE_FIRMWARE("radeon/ARUBA_rlc.bin");
Alex Deucher0af62b02011-01-06 21:19:31 -050080
Alex Deuchera2c96a22013-02-28 17:58:36 -050081
82static const u32 cayman_golden_registers2[] =
83{
84 0x3e5c, 0xffffffff, 0x00000000,
85 0x3e48, 0xffffffff, 0x00000000,
86 0x3e4c, 0xffffffff, 0x00000000,
87 0x3e64, 0xffffffff, 0x00000000,
88 0x3e50, 0xffffffff, 0x00000000,
89 0x3e60, 0xffffffff, 0x00000000
90};
91
92static const u32 cayman_golden_registers[] =
93{
94 0x5eb4, 0xffffffff, 0x00000002,
95 0x5e78, 0x8f311ff1, 0x001000f0,
96 0x3f90, 0xffff0000, 0xff000000,
97 0x9148, 0xffff0000, 0xff000000,
98 0x3f94, 0xffff0000, 0xff000000,
99 0x914c, 0xffff0000, 0xff000000,
100 0xc78, 0x00000080, 0x00000080,
101 0xbd4, 0x70073777, 0x00011003,
102 0xd02c, 0xbfffff1f, 0x08421000,
103 0xd0b8, 0x73773777, 0x02011003,
104 0x5bc0, 0x00200000, 0x50100000,
105 0x98f8, 0x33773777, 0x02011003,
106 0x98fc, 0xffffffff, 0x76541032,
107 0x7030, 0x31000311, 0x00000011,
108 0x2f48, 0x33773777, 0x42010001,
109 0x6b28, 0x00000010, 0x00000012,
110 0x7728, 0x00000010, 0x00000012,
111 0x10328, 0x00000010, 0x00000012,
112 0x10f28, 0x00000010, 0x00000012,
113 0x11b28, 0x00000010, 0x00000012,
114 0x12728, 0x00000010, 0x00000012,
115 0x240c, 0x000007ff, 0x00000000,
116 0x8a14, 0xf000001f, 0x00000007,
117 0x8b24, 0x3fff3fff, 0x00ff0fff,
118 0x8b10, 0x0000ff0f, 0x00000000,
119 0x28a4c, 0x07ffffff, 0x06000000,
120 0x10c, 0x00000001, 0x00010003,
121 0xa02c, 0xffffffff, 0x0000009b,
122 0x913c, 0x0000010f, 0x01000100,
123 0x8c04, 0xf8ff00ff, 0x40600060,
124 0x28350, 0x00000f01, 0x00000000,
125 0x9508, 0x3700001f, 0x00000002,
126 0x960c, 0xffffffff, 0x54763210,
127 0x88c4, 0x001f3ae3, 0x00000082,
128 0x88d0, 0xffffffff, 0x0f40df40,
129 0x88d4, 0x0000001f, 0x00000010,
130 0x8974, 0xffffffff, 0x00000000
131};
132
133static const u32 dvst_golden_registers2[] =
134{
135 0x8f8, 0xffffffff, 0,
136 0x8fc, 0x00380000, 0,
137 0x8f8, 0xffffffff, 1,
138 0x8fc, 0x0e000000, 0
139};
140
141static const u32 dvst_golden_registers[] =
142{
143 0x690, 0x3fff3fff, 0x20c00033,
144 0x918c, 0x0fff0fff, 0x00010006,
145 0x91a8, 0x0fff0fff, 0x00010006,
146 0x9150, 0xffffdfff, 0x6e944040,
147 0x917c, 0x0fff0fff, 0x00030002,
148 0x9198, 0x0fff0fff, 0x00030002,
149 0x915c, 0x0fff0fff, 0x00010000,
150 0x3f90, 0xffff0001, 0xff000000,
151 0x9178, 0x0fff0fff, 0x00070000,
152 0x9194, 0x0fff0fff, 0x00070000,
153 0x9148, 0xffff0001, 0xff000000,
154 0x9190, 0x0fff0fff, 0x00090008,
155 0x91ac, 0x0fff0fff, 0x00090008,
156 0x3f94, 0xffff0000, 0xff000000,
157 0x914c, 0xffff0000, 0xff000000,
158 0x929c, 0x00000fff, 0x00000001,
159 0x55e4, 0xff607fff, 0xfc000100,
160 0x8a18, 0xff000fff, 0x00000100,
161 0x8b28, 0xff000fff, 0x00000100,
162 0x9144, 0xfffc0fff, 0x00000100,
163 0x6ed8, 0x00010101, 0x00010000,
164 0x9830, 0xffffffff, 0x00000000,
165 0x9834, 0xf00fffff, 0x00000400,
166 0x9838, 0xfffffffe, 0x00000000,
167 0xd0c0, 0xff000fff, 0x00000100,
168 0xd02c, 0xbfffff1f, 0x08421000,
169 0xd0b8, 0x73773777, 0x12010001,
170 0x5bb0, 0x000000f0, 0x00000070,
171 0x98f8, 0x73773777, 0x12010001,
172 0x98fc, 0xffffffff, 0x00000010,
173 0x9b7c, 0x00ff0000, 0x00fc0000,
174 0x8030, 0x00001f0f, 0x0000100a,
175 0x2f48, 0x73773777, 0x12010001,
176 0x2408, 0x00030000, 0x000c007f,
177 0x8a14, 0xf000003f, 0x00000007,
178 0x8b24, 0x3fff3fff, 0x00ff0fff,
179 0x8b10, 0x0000ff0f, 0x00000000,
180 0x28a4c, 0x07ffffff, 0x06000000,
181 0x4d8, 0x00000fff, 0x00000100,
182 0xa008, 0xffffffff, 0x00010000,
183 0x913c, 0xffff03ff, 0x01000100,
184 0x8c00, 0x000000ff, 0x00000003,
185 0x8c04, 0xf8ff00ff, 0x40600060,
186 0x8cf0, 0x1fff1fff, 0x08e00410,
187 0x28350, 0x00000f01, 0x00000000,
188 0x9508, 0xf700071f, 0x00000002,
189 0x960c, 0xffffffff, 0x54763210,
190 0x20ef8, 0x01ff01ff, 0x00000002,
191 0x20e98, 0xfffffbff, 0x00200000,
192 0x2015c, 0xffffffff, 0x00000f40,
193 0x88c4, 0x001f3ae3, 0x00000082,
194 0x8978, 0x3fffffff, 0x04050140,
195 0x88d4, 0x0000001f, 0x00000010,
196 0x8974, 0xffffffff, 0x00000000
197};
198
199static const u32 scrapper_golden_registers[] =
200{
201 0x690, 0x3fff3fff, 0x20c00033,
202 0x918c, 0x0fff0fff, 0x00010006,
203 0x918c, 0x0fff0fff, 0x00010006,
204 0x91a8, 0x0fff0fff, 0x00010006,
205 0x91a8, 0x0fff0fff, 0x00010006,
206 0x9150, 0xffffdfff, 0x6e944040,
207 0x9150, 0xffffdfff, 0x6e944040,
208 0x917c, 0x0fff0fff, 0x00030002,
209 0x917c, 0x0fff0fff, 0x00030002,
210 0x9198, 0x0fff0fff, 0x00030002,
211 0x9198, 0x0fff0fff, 0x00030002,
212 0x915c, 0x0fff0fff, 0x00010000,
213 0x915c, 0x0fff0fff, 0x00010000,
214 0x3f90, 0xffff0001, 0xff000000,
215 0x3f90, 0xffff0001, 0xff000000,
216 0x9178, 0x0fff0fff, 0x00070000,
217 0x9178, 0x0fff0fff, 0x00070000,
218 0x9194, 0x0fff0fff, 0x00070000,
219 0x9194, 0x0fff0fff, 0x00070000,
220 0x9148, 0xffff0001, 0xff000000,
221 0x9148, 0xffff0001, 0xff000000,
222 0x9190, 0x0fff0fff, 0x00090008,
223 0x9190, 0x0fff0fff, 0x00090008,
224 0x91ac, 0x0fff0fff, 0x00090008,
225 0x91ac, 0x0fff0fff, 0x00090008,
226 0x3f94, 0xffff0000, 0xff000000,
227 0x3f94, 0xffff0000, 0xff000000,
228 0x914c, 0xffff0000, 0xff000000,
229 0x914c, 0xffff0000, 0xff000000,
230 0x929c, 0x00000fff, 0x00000001,
231 0x929c, 0x00000fff, 0x00000001,
232 0x55e4, 0xff607fff, 0xfc000100,
233 0x8a18, 0xff000fff, 0x00000100,
234 0x8a18, 0xff000fff, 0x00000100,
235 0x8b28, 0xff000fff, 0x00000100,
236 0x8b28, 0xff000fff, 0x00000100,
237 0x9144, 0xfffc0fff, 0x00000100,
238 0x9144, 0xfffc0fff, 0x00000100,
239 0x6ed8, 0x00010101, 0x00010000,
240 0x9830, 0xffffffff, 0x00000000,
241 0x9830, 0xffffffff, 0x00000000,
242 0x9834, 0xf00fffff, 0x00000400,
243 0x9834, 0xf00fffff, 0x00000400,
244 0x9838, 0xfffffffe, 0x00000000,
245 0x9838, 0xfffffffe, 0x00000000,
246 0xd0c0, 0xff000fff, 0x00000100,
247 0xd02c, 0xbfffff1f, 0x08421000,
248 0xd02c, 0xbfffff1f, 0x08421000,
249 0xd0b8, 0x73773777, 0x12010001,
250 0xd0b8, 0x73773777, 0x12010001,
251 0x5bb0, 0x000000f0, 0x00000070,
252 0x98f8, 0x73773777, 0x12010001,
253 0x98f8, 0x73773777, 0x12010001,
254 0x98fc, 0xffffffff, 0x00000010,
255 0x98fc, 0xffffffff, 0x00000010,
256 0x9b7c, 0x00ff0000, 0x00fc0000,
257 0x9b7c, 0x00ff0000, 0x00fc0000,
258 0x8030, 0x00001f0f, 0x0000100a,
259 0x8030, 0x00001f0f, 0x0000100a,
260 0x2f48, 0x73773777, 0x12010001,
261 0x2f48, 0x73773777, 0x12010001,
262 0x2408, 0x00030000, 0x000c007f,
263 0x8a14, 0xf000003f, 0x00000007,
264 0x8a14, 0xf000003f, 0x00000007,
265 0x8b24, 0x3fff3fff, 0x00ff0fff,
266 0x8b24, 0x3fff3fff, 0x00ff0fff,
267 0x8b10, 0x0000ff0f, 0x00000000,
268 0x8b10, 0x0000ff0f, 0x00000000,
269 0x28a4c, 0x07ffffff, 0x06000000,
270 0x28a4c, 0x07ffffff, 0x06000000,
271 0x4d8, 0x00000fff, 0x00000100,
272 0x4d8, 0x00000fff, 0x00000100,
273 0xa008, 0xffffffff, 0x00010000,
274 0xa008, 0xffffffff, 0x00010000,
275 0x913c, 0xffff03ff, 0x01000100,
276 0x913c, 0xffff03ff, 0x01000100,
277 0x90e8, 0x001fffff, 0x010400c0,
278 0x8c00, 0x000000ff, 0x00000003,
279 0x8c00, 0x000000ff, 0x00000003,
280 0x8c04, 0xf8ff00ff, 0x40600060,
281 0x8c04, 0xf8ff00ff, 0x40600060,
282 0x8c30, 0x0000000f, 0x00040005,
283 0x8cf0, 0x1fff1fff, 0x08e00410,
284 0x8cf0, 0x1fff1fff, 0x08e00410,
285 0x900c, 0x00ffffff, 0x0017071f,
286 0x28350, 0x00000f01, 0x00000000,
287 0x28350, 0x00000f01, 0x00000000,
288 0x9508, 0xf700071f, 0x00000002,
289 0x9508, 0xf700071f, 0x00000002,
290 0x9688, 0x00300000, 0x0017000f,
291 0x960c, 0xffffffff, 0x54763210,
292 0x960c, 0xffffffff, 0x54763210,
293 0x20ef8, 0x01ff01ff, 0x00000002,
294 0x20e98, 0xfffffbff, 0x00200000,
295 0x2015c, 0xffffffff, 0x00000f40,
296 0x88c4, 0x001f3ae3, 0x00000082,
297 0x88c4, 0x001f3ae3, 0x00000082,
298 0x8978, 0x3fffffff, 0x04050140,
299 0x8978, 0x3fffffff, 0x04050140,
300 0x88d4, 0x0000001f, 0x00000010,
301 0x88d4, 0x0000001f, 0x00000010,
302 0x8974, 0xffffffff, 0x00000000,
303 0x8974, 0xffffffff, 0x00000000
304};
305
306static void ni_init_golden_registers(struct radeon_device *rdev)
307{
308 switch (rdev->family) {
309 case CHIP_CAYMAN:
310 radeon_program_register_sequence(rdev,
311 cayman_golden_registers,
312 (const u32)ARRAY_SIZE(cayman_golden_registers));
313 radeon_program_register_sequence(rdev,
314 cayman_golden_registers2,
315 (const u32)ARRAY_SIZE(cayman_golden_registers2));
316 break;
317 case CHIP_ARUBA:
318 if ((rdev->pdev->device == 0x9900) ||
319 (rdev->pdev->device == 0x9901) ||
320 (rdev->pdev->device == 0x9903) ||
321 (rdev->pdev->device == 0x9904) ||
322 (rdev->pdev->device == 0x9905) ||
323 (rdev->pdev->device == 0x9906) ||
324 (rdev->pdev->device == 0x9907) ||
325 (rdev->pdev->device == 0x9908) ||
326 (rdev->pdev->device == 0x9909) ||
327 (rdev->pdev->device == 0x990A) ||
328 (rdev->pdev->device == 0x990B) ||
329 (rdev->pdev->device == 0x990C) ||
330 (rdev->pdev->device == 0x990D) ||
331 (rdev->pdev->device == 0x990E) ||
332 (rdev->pdev->device == 0x990F) ||
333 (rdev->pdev->device == 0x9910) ||
334 (rdev->pdev->device == 0x9913) ||
335 (rdev->pdev->device == 0x9917) ||
336 (rdev->pdev->device == 0x9918)) {
337 radeon_program_register_sequence(rdev,
338 dvst_golden_registers,
339 (const u32)ARRAY_SIZE(dvst_golden_registers));
340 radeon_program_register_sequence(rdev,
341 dvst_golden_registers2,
342 (const u32)ARRAY_SIZE(dvst_golden_registers2));
343 } else {
344 radeon_program_register_sequence(rdev,
345 scrapper_golden_registers,
346 (const u32)ARRAY_SIZE(scrapper_golden_registers));
347 radeon_program_register_sequence(rdev,
348 dvst_golden_registers2,
349 (const u32)ARRAY_SIZE(dvst_golden_registers2));
350 }
351 break;
352 default:
353 break;
354 }
355}
356
Alex Deucher0af62b02011-01-06 21:19:31 -0500357#define BTC_IO_MC_REGS_SIZE 29
358
359static const u32 barts_io_mc_regs[BTC_IO_MC_REGS_SIZE][2] = {
360 {0x00000077, 0xff010100},
361 {0x00000078, 0x00000000},
362 {0x00000079, 0x00001434},
363 {0x0000007a, 0xcc08ec08},
364 {0x0000007b, 0x00040000},
365 {0x0000007c, 0x000080c0},
366 {0x0000007d, 0x09000000},
367 {0x0000007e, 0x00210404},
368 {0x00000081, 0x08a8e800},
369 {0x00000082, 0x00030444},
370 {0x00000083, 0x00000000},
371 {0x00000085, 0x00000001},
372 {0x00000086, 0x00000002},
373 {0x00000087, 0x48490000},
374 {0x00000088, 0x20244647},
375 {0x00000089, 0x00000005},
376 {0x0000008b, 0x66030000},
377 {0x0000008c, 0x00006603},
378 {0x0000008d, 0x00000100},
379 {0x0000008f, 0x00001c0a},
380 {0x00000090, 0xff000001},
381 {0x00000094, 0x00101101},
382 {0x00000095, 0x00000fff},
383 {0x00000096, 0x00116fff},
384 {0x00000097, 0x60010000},
385 {0x00000098, 0x10010000},
386 {0x00000099, 0x00006000},
387 {0x0000009a, 0x00001000},
388 {0x0000009f, 0x00946a00}
389};
390
391static const u32 turks_io_mc_regs[BTC_IO_MC_REGS_SIZE][2] = {
392 {0x00000077, 0xff010100},
393 {0x00000078, 0x00000000},
394 {0x00000079, 0x00001434},
395 {0x0000007a, 0xcc08ec08},
396 {0x0000007b, 0x00040000},
397 {0x0000007c, 0x000080c0},
398 {0x0000007d, 0x09000000},
399 {0x0000007e, 0x00210404},
400 {0x00000081, 0x08a8e800},
401 {0x00000082, 0x00030444},
402 {0x00000083, 0x00000000},
403 {0x00000085, 0x00000001},
404 {0x00000086, 0x00000002},
405 {0x00000087, 0x48490000},
406 {0x00000088, 0x20244647},
407 {0x00000089, 0x00000005},
408 {0x0000008b, 0x66030000},
409 {0x0000008c, 0x00006603},
410 {0x0000008d, 0x00000100},
411 {0x0000008f, 0x00001c0a},
412 {0x00000090, 0xff000001},
413 {0x00000094, 0x00101101},
414 {0x00000095, 0x00000fff},
415 {0x00000096, 0x00116fff},
416 {0x00000097, 0x60010000},
417 {0x00000098, 0x10010000},
418 {0x00000099, 0x00006000},
419 {0x0000009a, 0x00001000},
420 {0x0000009f, 0x00936a00}
421};
422
423static const u32 caicos_io_mc_regs[BTC_IO_MC_REGS_SIZE][2] = {
424 {0x00000077, 0xff010100},
425 {0x00000078, 0x00000000},
426 {0x00000079, 0x00001434},
427 {0x0000007a, 0xcc08ec08},
428 {0x0000007b, 0x00040000},
429 {0x0000007c, 0x000080c0},
430 {0x0000007d, 0x09000000},
431 {0x0000007e, 0x00210404},
432 {0x00000081, 0x08a8e800},
433 {0x00000082, 0x00030444},
434 {0x00000083, 0x00000000},
435 {0x00000085, 0x00000001},
436 {0x00000086, 0x00000002},
437 {0x00000087, 0x48490000},
438 {0x00000088, 0x20244647},
439 {0x00000089, 0x00000005},
440 {0x0000008b, 0x66030000},
441 {0x0000008c, 0x00006603},
442 {0x0000008d, 0x00000100},
443 {0x0000008f, 0x00001c0a},
444 {0x00000090, 0xff000001},
445 {0x00000094, 0x00101101},
446 {0x00000095, 0x00000fff},
447 {0x00000096, 0x00116fff},
448 {0x00000097, 0x60010000},
449 {0x00000098, 0x10010000},
450 {0x00000099, 0x00006000},
451 {0x0000009a, 0x00001000},
452 {0x0000009f, 0x00916a00}
453};
454
Alex Deucher9b8253c2011-03-02 20:07:28 -0500455static const u32 cayman_io_mc_regs[BTC_IO_MC_REGS_SIZE][2] = {
456 {0x00000077, 0xff010100},
457 {0x00000078, 0x00000000},
458 {0x00000079, 0x00001434},
459 {0x0000007a, 0xcc08ec08},
460 {0x0000007b, 0x00040000},
461 {0x0000007c, 0x000080c0},
462 {0x0000007d, 0x09000000},
463 {0x0000007e, 0x00210404},
464 {0x00000081, 0x08a8e800},
465 {0x00000082, 0x00030444},
466 {0x00000083, 0x00000000},
467 {0x00000085, 0x00000001},
468 {0x00000086, 0x00000002},
469 {0x00000087, 0x48490000},
470 {0x00000088, 0x20244647},
471 {0x00000089, 0x00000005},
472 {0x0000008b, 0x66030000},
473 {0x0000008c, 0x00006603},
474 {0x0000008d, 0x00000100},
475 {0x0000008f, 0x00001c0a},
476 {0x00000090, 0xff000001},
477 {0x00000094, 0x00101101},
478 {0x00000095, 0x00000fff},
479 {0x00000096, 0x00116fff},
480 {0x00000097, 0x60010000},
481 {0x00000098, 0x10010000},
482 {0x00000099, 0x00006000},
483 {0x0000009a, 0x00001000},
484 {0x0000009f, 0x00976b00}
485};
486
Alex Deucher755d8192011-03-02 20:07:34 -0500487int ni_mc_load_microcode(struct radeon_device *rdev)
Alex Deucher0af62b02011-01-06 21:19:31 -0500488{
489 const __be32 *fw_data;
490 u32 mem_type, running, blackout = 0;
491 u32 *io_mc_regs;
Alex Deucher9b8253c2011-03-02 20:07:28 -0500492 int i, ucode_size, regs_size;
Alex Deucher0af62b02011-01-06 21:19:31 -0500493
494 if (!rdev->mc_fw)
495 return -EINVAL;
496
497 switch (rdev->family) {
498 case CHIP_BARTS:
499 io_mc_regs = (u32 *)&barts_io_mc_regs;
Alex Deucher9b8253c2011-03-02 20:07:28 -0500500 ucode_size = BTC_MC_UCODE_SIZE;
501 regs_size = BTC_IO_MC_REGS_SIZE;
Alex Deucher0af62b02011-01-06 21:19:31 -0500502 break;
503 case CHIP_TURKS:
504 io_mc_regs = (u32 *)&turks_io_mc_regs;
Alex Deucher9b8253c2011-03-02 20:07:28 -0500505 ucode_size = BTC_MC_UCODE_SIZE;
506 regs_size = BTC_IO_MC_REGS_SIZE;
Alex Deucher0af62b02011-01-06 21:19:31 -0500507 break;
508 case CHIP_CAICOS:
509 default:
510 io_mc_regs = (u32 *)&caicos_io_mc_regs;
Alex Deucher9b8253c2011-03-02 20:07:28 -0500511 ucode_size = BTC_MC_UCODE_SIZE;
512 regs_size = BTC_IO_MC_REGS_SIZE;
513 break;
514 case CHIP_CAYMAN:
515 io_mc_regs = (u32 *)&cayman_io_mc_regs;
516 ucode_size = CAYMAN_MC_UCODE_SIZE;
517 regs_size = BTC_IO_MC_REGS_SIZE;
Alex Deucher0af62b02011-01-06 21:19:31 -0500518 break;
519 }
520
521 mem_type = (RREG32(MC_SEQ_MISC0) & MC_SEQ_MISC0_GDDR5_MASK) >> MC_SEQ_MISC0_GDDR5_SHIFT;
522 running = RREG32(MC_SEQ_SUP_CNTL) & RUN_MASK;
523
524 if ((mem_type == MC_SEQ_MISC0_GDDR5_VALUE) && (running == 0)) {
525 if (running) {
526 blackout = RREG32(MC_SHARED_BLACKOUT_CNTL);
527 WREG32(MC_SHARED_BLACKOUT_CNTL, 1);
528 }
529
530 /* reset the engine and set to writable */
531 WREG32(MC_SEQ_SUP_CNTL, 0x00000008);
532 WREG32(MC_SEQ_SUP_CNTL, 0x00000010);
533
534 /* load mc io regs */
Alex Deucher9b8253c2011-03-02 20:07:28 -0500535 for (i = 0; i < regs_size; i++) {
Alex Deucher0af62b02011-01-06 21:19:31 -0500536 WREG32(MC_SEQ_IO_DEBUG_INDEX, io_mc_regs[(i << 1)]);
537 WREG32(MC_SEQ_IO_DEBUG_DATA, io_mc_regs[(i << 1) + 1]);
538 }
539 /* load the MC ucode */
540 fw_data = (const __be32 *)rdev->mc_fw->data;
Alex Deucher9b8253c2011-03-02 20:07:28 -0500541 for (i = 0; i < ucode_size; i++)
Alex Deucher0af62b02011-01-06 21:19:31 -0500542 WREG32(MC_SEQ_SUP_PGM, be32_to_cpup(fw_data++));
543
544 /* put the engine back into the active state */
545 WREG32(MC_SEQ_SUP_CNTL, 0x00000008);
546 WREG32(MC_SEQ_SUP_CNTL, 0x00000004);
547 WREG32(MC_SEQ_SUP_CNTL, 0x00000001);
548
549 /* wait for training to complete */
Alex Deucher0e2c9782011-11-02 18:08:25 -0400550 for (i = 0; i < rdev->usec_timeout; i++) {
551 if (RREG32(MC_IO_PAD_CNTL_D0) & MEM_FALL_OUT_CMD)
552 break;
553 udelay(1);
554 }
Alex Deucher0af62b02011-01-06 21:19:31 -0500555
556 if (running)
557 WREG32(MC_SHARED_BLACKOUT_CNTL, blackout);
558 }
559
560 return 0;
561}
562
563int ni_init_microcode(struct radeon_device *rdev)
564{
565 struct platform_device *pdev;
566 const char *chip_name;
567 const char *rlc_chip_name;
568 size_t pfp_req_size, me_req_size, rlc_req_size, mc_req_size;
569 char fw_name[30];
570 int err;
571
572 DRM_DEBUG("\n");
573
574 pdev = platform_device_register_simple("radeon_cp", 0, NULL, 0);
575 err = IS_ERR(pdev);
576 if (err) {
577 printk(KERN_ERR "radeon_cp: Failed to register firmware\n");
578 return -EINVAL;
579 }
580
581 switch (rdev->family) {
582 case CHIP_BARTS:
583 chip_name = "BARTS";
584 rlc_chip_name = "BTC";
Alex Deucher9b8253c2011-03-02 20:07:28 -0500585 pfp_req_size = EVERGREEN_PFP_UCODE_SIZE * 4;
586 me_req_size = EVERGREEN_PM4_UCODE_SIZE * 4;
587 rlc_req_size = EVERGREEN_RLC_UCODE_SIZE * 4;
588 mc_req_size = BTC_MC_UCODE_SIZE * 4;
Alex Deucher0af62b02011-01-06 21:19:31 -0500589 break;
590 case CHIP_TURKS:
591 chip_name = "TURKS";
592 rlc_chip_name = "BTC";
Alex Deucher9b8253c2011-03-02 20:07:28 -0500593 pfp_req_size = EVERGREEN_PFP_UCODE_SIZE * 4;
594 me_req_size = EVERGREEN_PM4_UCODE_SIZE * 4;
595 rlc_req_size = EVERGREEN_RLC_UCODE_SIZE * 4;
596 mc_req_size = BTC_MC_UCODE_SIZE * 4;
Alex Deucher0af62b02011-01-06 21:19:31 -0500597 break;
598 case CHIP_CAICOS:
599 chip_name = "CAICOS";
600 rlc_chip_name = "BTC";
Alex Deucher9b8253c2011-03-02 20:07:28 -0500601 pfp_req_size = EVERGREEN_PFP_UCODE_SIZE * 4;
602 me_req_size = EVERGREEN_PM4_UCODE_SIZE * 4;
603 rlc_req_size = EVERGREEN_RLC_UCODE_SIZE * 4;
604 mc_req_size = BTC_MC_UCODE_SIZE * 4;
605 break;
606 case CHIP_CAYMAN:
607 chip_name = "CAYMAN";
608 rlc_chip_name = "CAYMAN";
609 pfp_req_size = CAYMAN_PFP_UCODE_SIZE * 4;
610 me_req_size = CAYMAN_PM4_UCODE_SIZE * 4;
611 rlc_req_size = CAYMAN_RLC_UCODE_SIZE * 4;
612 mc_req_size = CAYMAN_MC_UCODE_SIZE * 4;
Alex Deucher0af62b02011-01-06 21:19:31 -0500613 break;
Alex Deucherc420c742012-03-20 17:18:39 -0400614 case CHIP_ARUBA:
615 chip_name = "ARUBA";
616 rlc_chip_name = "ARUBA";
617 /* pfp/me same size as CAYMAN */
618 pfp_req_size = CAYMAN_PFP_UCODE_SIZE * 4;
619 me_req_size = CAYMAN_PM4_UCODE_SIZE * 4;
620 rlc_req_size = ARUBA_RLC_UCODE_SIZE * 4;
621 mc_req_size = 0;
622 break;
Alex Deucher0af62b02011-01-06 21:19:31 -0500623 default: BUG();
624 }
625
Alex Deucher0af62b02011-01-06 21:19:31 -0500626 DRM_INFO("Loading %s Microcode\n", chip_name);
627
628 snprintf(fw_name, sizeof(fw_name), "radeon/%s_pfp.bin", chip_name);
629 err = request_firmware(&rdev->pfp_fw, fw_name, &pdev->dev);
630 if (err)
631 goto out;
632 if (rdev->pfp_fw->size != pfp_req_size) {
633 printk(KERN_ERR
634 "ni_cp: Bogus length %zu in firmware \"%s\"\n",
635 rdev->pfp_fw->size, fw_name);
636 err = -EINVAL;
637 goto out;
638 }
639
640 snprintf(fw_name, sizeof(fw_name), "radeon/%s_me.bin", chip_name);
641 err = request_firmware(&rdev->me_fw, fw_name, &pdev->dev);
642 if (err)
643 goto out;
644 if (rdev->me_fw->size != me_req_size) {
645 printk(KERN_ERR
646 "ni_cp: Bogus length %zu in firmware \"%s\"\n",
647 rdev->me_fw->size, fw_name);
648 err = -EINVAL;
649 }
650
651 snprintf(fw_name, sizeof(fw_name), "radeon/%s_rlc.bin", rlc_chip_name);
652 err = request_firmware(&rdev->rlc_fw, fw_name, &pdev->dev);
653 if (err)
654 goto out;
655 if (rdev->rlc_fw->size != rlc_req_size) {
656 printk(KERN_ERR
657 "ni_rlc: Bogus length %zu in firmware \"%s\"\n",
658 rdev->rlc_fw->size, fw_name);
659 err = -EINVAL;
660 }
661
Alex Deucherc420c742012-03-20 17:18:39 -0400662 /* no MC ucode on TN */
663 if (!(rdev->flags & RADEON_IS_IGP)) {
664 snprintf(fw_name, sizeof(fw_name), "radeon/%s_mc.bin", chip_name);
665 err = request_firmware(&rdev->mc_fw, fw_name, &pdev->dev);
666 if (err)
667 goto out;
668 if (rdev->mc_fw->size != mc_req_size) {
669 printk(KERN_ERR
670 "ni_mc: Bogus length %zu in firmware \"%s\"\n",
671 rdev->mc_fw->size, fw_name);
672 err = -EINVAL;
673 }
Alex Deucher0af62b02011-01-06 21:19:31 -0500674 }
675out:
676 platform_device_unregister(pdev);
677
678 if (err) {
679 if (err != -EINVAL)
680 printk(KERN_ERR
681 "ni_cp: Failed to load firmware \"%s\"\n",
682 fw_name);
683 release_firmware(rdev->pfp_fw);
684 rdev->pfp_fw = NULL;
685 release_firmware(rdev->me_fw);
686 rdev->me_fw = NULL;
687 release_firmware(rdev->rlc_fw);
688 rdev->rlc_fw = NULL;
689 release_firmware(rdev->mc_fw);
690 rdev->mc_fw = NULL;
691 }
692 return err;
693}
694
Alex Deucherfecf1d02011-03-02 20:07:29 -0500695/*
696 * Core functions
697 */
Alex Deucherfecf1d02011-03-02 20:07:29 -0500698static void cayman_gpu_init(struct radeon_device *rdev)
699{
Alex Deucherfecf1d02011-03-02 20:07:29 -0500700 u32 gb_addr_config = 0;
701 u32 mc_shared_chmap, mc_arb_ramcfg;
Alex Deucherfecf1d02011-03-02 20:07:29 -0500702 u32 cgts_tcc_disable;
703 u32 sx_debug_1;
704 u32 smx_dc_ctl0;
Alex Deucherfecf1d02011-03-02 20:07:29 -0500705 u32 cgts_sm_ctrl_reg;
706 u32 hdp_host_path_cntl;
707 u32 tmp;
Alex Deucher416a2bd2012-05-31 19:00:25 -0400708 u32 disabled_rb_mask;
Alex Deucherfecf1d02011-03-02 20:07:29 -0500709 int i, j;
710
711 switch (rdev->family) {
712 case CHIP_CAYMAN:
Alex Deucherfecf1d02011-03-02 20:07:29 -0500713 rdev->config.cayman.max_shader_engines = 2;
714 rdev->config.cayman.max_pipes_per_simd = 4;
715 rdev->config.cayman.max_tile_pipes = 8;
716 rdev->config.cayman.max_simds_per_se = 12;
717 rdev->config.cayman.max_backends_per_se = 4;
718 rdev->config.cayman.max_texture_channel_caches = 8;
719 rdev->config.cayman.max_gprs = 256;
720 rdev->config.cayman.max_threads = 256;
721 rdev->config.cayman.max_gs_threads = 32;
722 rdev->config.cayman.max_stack_entries = 512;
723 rdev->config.cayman.sx_num_of_sets = 8;
724 rdev->config.cayman.sx_max_export_size = 256;
725 rdev->config.cayman.sx_max_export_pos_size = 64;
726 rdev->config.cayman.sx_max_export_smx_size = 192;
727 rdev->config.cayman.max_hw_contexts = 8;
728 rdev->config.cayman.sq_num_cf_insts = 2;
729
730 rdev->config.cayman.sc_prim_fifo_size = 0x100;
731 rdev->config.cayman.sc_hiz_tile_fifo_size = 0x30;
732 rdev->config.cayman.sc_earlyz_tile_fifo_size = 0x130;
Alex Deucher416a2bd2012-05-31 19:00:25 -0400733 gb_addr_config = CAYMAN_GB_ADDR_CONFIG_GOLDEN;
Alex Deucherfecf1d02011-03-02 20:07:29 -0500734 break;
Alex Deucher7b76e472012-03-20 17:18:36 -0400735 case CHIP_ARUBA:
736 default:
737 rdev->config.cayman.max_shader_engines = 1;
738 rdev->config.cayman.max_pipes_per_simd = 4;
739 rdev->config.cayman.max_tile_pipes = 2;
740 if ((rdev->pdev->device == 0x9900) ||
Alex Deucherd430f7d2012-06-05 09:50:28 -0400741 (rdev->pdev->device == 0x9901) ||
742 (rdev->pdev->device == 0x9905) ||
743 (rdev->pdev->device == 0x9906) ||
744 (rdev->pdev->device == 0x9907) ||
745 (rdev->pdev->device == 0x9908) ||
746 (rdev->pdev->device == 0x9909) ||
Alex Deuchere4d17062013-03-08 13:44:15 -0500747 (rdev->pdev->device == 0x990B) ||
748 (rdev->pdev->device == 0x990C) ||
749 (rdev->pdev->device == 0x990F) ||
Alex Deucherd430f7d2012-06-05 09:50:28 -0400750 (rdev->pdev->device == 0x9910) ||
Alex Deuchere4d17062013-03-08 13:44:15 -0500751 (rdev->pdev->device == 0x9917) ||
Alex Deucher62d1f922013-04-25 14:06:05 -0400752 (rdev->pdev->device == 0x9999) ||
753 (rdev->pdev->device == 0x999C)) {
Alex Deucher7b76e472012-03-20 17:18:36 -0400754 rdev->config.cayman.max_simds_per_se = 6;
755 rdev->config.cayman.max_backends_per_se = 2;
756 } else if ((rdev->pdev->device == 0x9903) ||
Alex Deucherd430f7d2012-06-05 09:50:28 -0400757 (rdev->pdev->device == 0x9904) ||
758 (rdev->pdev->device == 0x990A) ||
Alex Deuchere4d17062013-03-08 13:44:15 -0500759 (rdev->pdev->device == 0x990D) ||
760 (rdev->pdev->device == 0x990E) ||
Alex Deucherd430f7d2012-06-05 09:50:28 -0400761 (rdev->pdev->device == 0x9913) ||
Alex Deucher62d1f922013-04-25 14:06:05 -0400762 (rdev->pdev->device == 0x9918) ||
763 (rdev->pdev->device == 0x999D)) {
Alex Deucher7b76e472012-03-20 17:18:36 -0400764 rdev->config.cayman.max_simds_per_se = 4;
765 rdev->config.cayman.max_backends_per_se = 2;
Alex Deucherd430f7d2012-06-05 09:50:28 -0400766 } else if ((rdev->pdev->device == 0x9919) ||
767 (rdev->pdev->device == 0x9990) ||
768 (rdev->pdev->device == 0x9991) ||
769 (rdev->pdev->device == 0x9994) ||
Alex Deuchere4d17062013-03-08 13:44:15 -0500770 (rdev->pdev->device == 0x9995) ||
771 (rdev->pdev->device == 0x9996) ||
772 (rdev->pdev->device == 0x999A) ||
Alex Deucherd430f7d2012-06-05 09:50:28 -0400773 (rdev->pdev->device == 0x99A0)) {
Alex Deucher7b76e472012-03-20 17:18:36 -0400774 rdev->config.cayman.max_simds_per_se = 3;
775 rdev->config.cayman.max_backends_per_se = 1;
776 } else {
777 rdev->config.cayman.max_simds_per_se = 2;
778 rdev->config.cayman.max_backends_per_se = 1;
779 }
780 rdev->config.cayman.max_texture_channel_caches = 2;
781 rdev->config.cayman.max_gprs = 256;
782 rdev->config.cayman.max_threads = 256;
783 rdev->config.cayman.max_gs_threads = 32;
784 rdev->config.cayman.max_stack_entries = 512;
785 rdev->config.cayman.sx_num_of_sets = 8;
786 rdev->config.cayman.sx_max_export_size = 256;
787 rdev->config.cayman.sx_max_export_pos_size = 64;
788 rdev->config.cayman.sx_max_export_smx_size = 192;
789 rdev->config.cayman.max_hw_contexts = 8;
790 rdev->config.cayman.sq_num_cf_insts = 2;
791
792 rdev->config.cayman.sc_prim_fifo_size = 0x40;
793 rdev->config.cayman.sc_hiz_tile_fifo_size = 0x30;
794 rdev->config.cayman.sc_earlyz_tile_fifo_size = 0x130;
Alex Deucher416a2bd2012-05-31 19:00:25 -0400795 gb_addr_config = ARUBA_GB_ADDR_CONFIG_GOLDEN;
Alex Deucher7b76e472012-03-20 17:18:36 -0400796 break;
Alex Deucherfecf1d02011-03-02 20:07:29 -0500797 }
798
799 /* Initialize HDP */
800 for (i = 0, j = 0; i < 32; i++, j += 0x18) {
801 WREG32((0x2c14 + j), 0x00000000);
802 WREG32((0x2c18 + j), 0x00000000);
803 WREG32((0x2c1c + j), 0x00000000);
804 WREG32((0x2c20 + j), 0x00000000);
805 WREG32((0x2c24 + j), 0x00000000);
806 }
807
808 WREG32(GRBM_CNTL, GRBM_READ_TIMEOUT(0xff));
809
Alex Deucherd054ac12011-09-01 17:46:15 +0000810 evergreen_fix_pci_max_read_req_size(rdev);
811
Alex Deucherfecf1d02011-03-02 20:07:29 -0500812 mc_shared_chmap = RREG32(MC_SHARED_CHMAP);
813 mc_arb_ramcfg = RREG32(MC_ARB_RAMCFG);
814
Alex Deucherfecf1d02011-03-02 20:07:29 -0500815 tmp = (mc_arb_ramcfg & NOOFCOLS_MASK) >> NOOFCOLS_SHIFT;
816 rdev->config.cayman.mem_row_size_in_kb = (4 * (1 << (8 + tmp))) / 1024;
817 if (rdev->config.cayman.mem_row_size_in_kb > 4)
818 rdev->config.cayman.mem_row_size_in_kb = 4;
819 /* XXX use MC settings? */
820 rdev->config.cayman.shader_engine_tile_size = 32;
821 rdev->config.cayman.num_gpus = 1;
822 rdev->config.cayman.multi_gpu_tile_size = 64;
823
Alex Deucherfecf1d02011-03-02 20:07:29 -0500824 tmp = (gb_addr_config & NUM_PIPES_MASK) >> NUM_PIPES_SHIFT;
825 rdev->config.cayman.num_tile_pipes = (1 << tmp);
826 tmp = (gb_addr_config & PIPE_INTERLEAVE_SIZE_MASK) >> PIPE_INTERLEAVE_SIZE_SHIFT;
827 rdev->config.cayman.mem_max_burst_length_bytes = (tmp + 1) * 256;
828 tmp = (gb_addr_config & NUM_SHADER_ENGINES_MASK) >> NUM_SHADER_ENGINES_SHIFT;
829 rdev->config.cayman.num_shader_engines = tmp + 1;
830 tmp = (gb_addr_config & NUM_GPUS_MASK) >> NUM_GPUS_SHIFT;
831 rdev->config.cayman.num_gpus = tmp + 1;
832 tmp = (gb_addr_config & MULTI_GPU_TILE_SIZE_MASK) >> MULTI_GPU_TILE_SIZE_SHIFT;
833 rdev->config.cayman.multi_gpu_tile_size = 1 << tmp;
834 tmp = (gb_addr_config & ROW_SIZE_MASK) >> ROW_SIZE_SHIFT;
835 rdev->config.cayman.mem_row_size_in_kb = 1 << tmp;
836
Alex Deucher416a2bd2012-05-31 19:00:25 -0400837
Alex Deucherfecf1d02011-03-02 20:07:29 -0500838 /* setup tiling info dword. gb_addr_config is not adequate since it does
839 * not have bank info, so create a custom tiling dword.
840 * bits 3:0 num_pipes
841 * bits 7:4 num_banks
842 * bits 11:8 group_size
843 * bits 15:12 row_size
844 */
845 rdev->config.cayman.tile_config = 0;
846 switch (rdev->config.cayman.num_tile_pipes) {
847 case 1:
848 default:
849 rdev->config.cayman.tile_config |= (0 << 0);
850 break;
851 case 2:
852 rdev->config.cayman.tile_config |= (1 << 0);
853 break;
854 case 4:
855 rdev->config.cayman.tile_config |= (2 << 0);
856 break;
857 case 8:
858 rdev->config.cayman.tile_config |= (3 << 0);
859 break;
860 }
Alex Deucher7b76e472012-03-20 17:18:36 -0400861
862 /* num banks is 8 on all fusion asics. 0 = 4, 1 = 8, 2 = 16 */
863 if (rdev->flags & RADEON_IS_IGP)
Alex Deucher1f73cca2012-05-24 22:55:15 -0400864 rdev->config.cayman.tile_config |= 1 << 4;
Alex Deucher29d65402012-05-31 18:53:36 -0400865 else {
Alex Deucher5b23c902012-07-31 11:05:11 -0400866 switch ((mc_arb_ramcfg & NOOFBANK_MASK) >> NOOFBANK_SHIFT) {
867 case 0: /* four banks */
Alex Deucher29d65402012-05-31 18:53:36 -0400868 rdev->config.cayman.tile_config |= 0 << 4;
Alex Deucher5b23c902012-07-31 11:05:11 -0400869 break;
870 case 1: /* eight banks */
871 rdev->config.cayman.tile_config |= 1 << 4;
872 break;
873 case 2: /* sixteen banks */
874 default:
875 rdev->config.cayman.tile_config |= 2 << 4;
876 break;
877 }
Alex Deucher29d65402012-05-31 18:53:36 -0400878 }
Alex Deucherfecf1d02011-03-02 20:07:29 -0500879 rdev->config.cayman.tile_config |=
Dave Airliecde50832011-05-19 14:14:41 +1000880 ((gb_addr_config & PIPE_INTERLEAVE_SIZE_MASK) >> PIPE_INTERLEAVE_SIZE_SHIFT) << 8;
Alex Deucherfecf1d02011-03-02 20:07:29 -0500881 rdev->config.cayman.tile_config |=
882 ((gb_addr_config & ROW_SIZE_MASK) >> ROW_SIZE_SHIFT) << 12;
883
Alex Deucher416a2bd2012-05-31 19:00:25 -0400884 tmp = 0;
885 for (i = (rdev->config.cayman.max_shader_engines - 1); i >= 0; i--) {
886 u32 rb_disable_bitmap;
887
888 WREG32(GRBM_GFX_INDEX, INSTANCE_BROADCAST_WRITES | SE_INDEX(i));
889 WREG32(RLC_GFX_INDEX, INSTANCE_BROADCAST_WRITES | SE_INDEX(i));
890 rb_disable_bitmap = (RREG32(CC_RB_BACKEND_DISABLE) & 0x00ff0000) >> 16;
891 tmp <<= 4;
892 tmp |= rb_disable_bitmap;
893 }
894 /* enabled rb are just the one not disabled :) */
895 disabled_rb_mask = tmp;
Alex Deuchercedb6552013-04-09 10:13:22 -0400896 tmp = 0;
897 for (i = 0; i < (rdev->config.cayman.max_backends_per_se * rdev->config.cayman.max_shader_engines); i++)
898 tmp |= (1 << i);
899 /* if all the backends are disabled, fix it up here */
900 if ((disabled_rb_mask & tmp) == tmp) {
901 for (i = 0; i < (rdev->config.cayman.max_backends_per_se * rdev->config.cayman.max_shader_engines); i++)
902 disabled_rb_mask &= ~(1 << i);
903 }
Alex Deucher416a2bd2012-05-31 19:00:25 -0400904
905 WREG32(GRBM_GFX_INDEX, INSTANCE_BROADCAST_WRITES | SE_BROADCAST_WRITES);
906 WREG32(RLC_GFX_INDEX, INSTANCE_BROADCAST_WRITES | SE_BROADCAST_WRITES);
907
Alex Deucherfecf1d02011-03-02 20:07:29 -0500908 WREG32(GB_ADDR_CONFIG, gb_addr_config);
909 WREG32(DMIF_ADDR_CONFIG, gb_addr_config);
Alex Deucher7c1c7c12013-04-05 10:28:08 -0400910 if (ASIC_IS_DCE6(rdev))
911 WREG32(DMIF_ADDR_CALC, gb_addr_config);
Alex Deucherfecf1d02011-03-02 20:07:29 -0500912 WREG32(HDP_ADDR_CONFIG, gb_addr_config);
Alex Deucherf60cbd12012-12-04 15:27:33 -0500913 WREG32(DMA_TILING_CONFIG + DMA0_REGISTER_OFFSET, gb_addr_config);
914 WREG32(DMA_TILING_CONFIG + DMA1_REGISTER_OFFSET, gb_addr_config);
Christian König9a210592013-04-08 12:41:37 +0200915 WREG32(UVD_UDEC_ADDR_CONFIG, gb_addr_config);
916 WREG32(UVD_UDEC_DB_ADDR_CONFIG, gb_addr_config);
917 WREG32(UVD_UDEC_DBW_ADDR_CONFIG, gb_addr_config);
Alex Deucherfecf1d02011-03-02 20:07:29 -0500918
Alex Deucher8f612b22013-03-11 19:28:39 -0400919 if ((rdev->config.cayman.max_backends_per_se == 1) &&
920 (rdev->flags & RADEON_IS_IGP)) {
921 if ((disabled_rb_mask & 3) == 1) {
922 /* RB0 disabled, RB1 enabled */
923 tmp = 0x11111111;
924 } else {
925 /* RB1 disabled, RB0 enabled */
926 tmp = 0x00000000;
927 }
928 } else {
929 tmp = gb_addr_config & NUM_PIPES_MASK;
930 tmp = r6xx_remap_render_backend(rdev, tmp,
931 rdev->config.cayman.max_backends_per_se *
932 rdev->config.cayman.max_shader_engines,
933 CAYMAN_MAX_BACKENDS, disabled_rb_mask);
934 }
Alex Deucher416a2bd2012-05-31 19:00:25 -0400935 WREG32(GB_BACKEND_MAP, tmp);
Alex Deucherfecf1d02011-03-02 20:07:29 -0500936
Alex Deucher416a2bd2012-05-31 19:00:25 -0400937 cgts_tcc_disable = 0xffff0000;
938 for (i = 0; i < rdev->config.cayman.max_texture_channel_caches; i++)
939 cgts_tcc_disable &= ~(1 << (16 + i));
Alex Deucherfecf1d02011-03-02 20:07:29 -0500940 WREG32(CGTS_TCC_DISABLE, cgts_tcc_disable);
941 WREG32(CGTS_SYS_TCC_DISABLE, cgts_tcc_disable);
Alex Deucherfecf1d02011-03-02 20:07:29 -0500942 WREG32(CGTS_USER_SYS_TCC_DISABLE, cgts_tcc_disable);
943 WREG32(CGTS_USER_TCC_DISABLE, cgts_tcc_disable);
944
945 /* reprogram the shader complex */
946 cgts_sm_ctrl_reg = RREG32(CGTS_SM_CTRL_REG);
947 for (i = 0; i < 16; i++)
948 WREG32(CGTS_SM_CTRL_REG, OVERRIDE);
949 WREG32(CGTS_SM_CTRL_REG, cgts_sm_ctrl_reg);
950
951 /* set HW defaults for 3D engine */
952 WREG32(CP_MEQ_THRESHOLDS, MEQ1_START(0x30) | MEQ2_START(0x60));
953
954 sx_debug_1 = RREG32(SX_DEBUG_1);
955 sx_debug_1 |= ENABLE_NEW_SMX_ADDRESS;
956 WREG32(SX_DEBUG_1, sx_debug_1);
957
958 smx_dc_ctl0 = RREG32(SMX_DC_CTL0);
959 smx_dc_ctl0 &= ~NUMBER_OF_SETS(0x1ff);
Dave Airlie285e0422011-05-09 14:54:33 +1000960 smx_dc_ctl0 |= NUMBER_OF_SETS(rdev->config.cayman.sx_num_of_sets);
Alex Deucherfecf1d02011-03-02 20:07:29 -0500961 WREG32(SMX_DC_CTL0, smx_dc_ctl0);
962
963 WREG32(SPI_CONFIG_CNTL_1, VTX_DONE_DELAY(4) | CRC_SIMD_ID_WADDR_DISABLE);
964
965 /* need to be explicitly zero-ed */
966 WREG32(VGT_OFFCHIP_LDS_BASE, 0);
967 WREG32(SQ_LSTMP_RING_BASE, 0);
968 WREG32(SQ_HSTMP_RING_BASE, 0);
969 WREG32(SQ_ESTMP_RING_BASE, 0);
970 WREG32(SQ_GSTMP_RING_BASE, 0);
971 WREG32(SQ_VSTMP_RING_BASE, 0);
972 WREG32(SQ_PSTMP_RING_BASE, 0);
973
974 WREG32(TA_CNTL_AUX, DISABLE_CUBE_ANISO);
975
Dave Airlie285e0422011-05-09 14:54:33 +1000976 WREG32(SX_EXPORT_BUFFER_SIZES, (COLOR_BUFFER_SIZE((rdev->config.cayman.sx_max_export_size / 4) - 1) |
977 POSITION_BUFFER_SIZE((rdev->config.cayman.sx_max_export_pos_size / 4) - 1) |
978 SMX_BUFFER_SIZE((rdev->config.cayman.sx_max_export_smx_size / 4) - 1)));
Alex Deucherfecf1d02011-03-02 20:07:29 -0500979
Dave Airlie285e0422011-05-09 14:54:33 +1000980 WREG32(PA_SC_FIFO_SIZE, (SC_PRIM_FIFO_SIZE(rdev->config.cayman.sc_prim_fifo_size) |
981 SC_HIZ_TILE_FIFO_SIZE(rdev->config.cayman.sc_hiz_tile_fifo_size) |
982 SC_EARLYZ_TILE_FIFO_SIZE(rdev->config.cayman.sc_earlyz_tile_fifo_size)));
Alex Deucherfecf1d02011-03-02 20:07:29 -0500983
984
985 WREG32(VGT_NUM_INSTANCES, 1);
986
987 WREG32(CP_PERFMON_CNTL, 0);
988
Dave Airlie285e0422011-05-09 14:54:33 +1000989 WREG32(SQ_MS_FIFO_SIZES, (CACHE_FIFO_SIZE(16 * rdev->config.cayman.sq_num_cf_insts) |
Alex Deucherfecf1d02011-03-02 20:07:29 -0500990 FETCH_FIFO_HIWATER(0x4) |
991 DONE_FIFO_HIWATER(0xe0) |
992 ALU_UPDATE_FIFO_HIWATER(0x8)));
993
994 WREG32(SQ_GPR_RESOURCE_MGMT_1, NUM_CLAUSE_TEMP_GPRS(4));
995 WREG32(SQ_CONFIG, (VC_ENABLE |
996 EXPORT_SRC_C |
997 GFX_PRIO(0) |
998 CS1_PRIO(0) |
999 CS2_PRIO(1)));
1000 WREG32(SQ_DYN_GPR_CNTL_PS_FLUSH_REQ, DYN_GPR_ENABLE);
1001
1002 WREG32(PA_SC_FORCE_EOV_MAX_CNTS, (FORCE_EOV_MAX_CLK_CNT(4095) |
1003 FORCE_EOV_MAX_REZ_CNT(255)));
1004
1005 WREG32(VGT_CACHE_INVALIDATION, CACHE_INVALIDATION(VC_AND_TC) |
1006 AUTO_INVLD_EN(ES_AND_GS_AUTO));
1007
1008 WREG32(VGT_GS_VERTEX_REUSE, 16);
1009 WREG32(PA_SC_LINE_STIPPLE_STATE, 0);
1010
1011 WREG32(CB_PERF_CTR0_SEL_0, 0);
1012 WREG32(CB_PERF_CTR0_SEL_1, 0);
1013 WREG32(CB_PERF_CTR1_SEL_0, 0);
1014 WREG32(CB_PERF_CTR1_SEL_1, 0);
1015 WREG32(CB_PERF_CTR2_SEL_0, 0);
1016 WREG32(CB_PERF_CTR2_SEL_1, 0);
1017 WREG32(CB_PERF_CTR3_SEL_0, 0);
1018 WREG32(CB_PERF_CTR3_SEL_1, 0);
1019
Dave Airlie0b65f832011-05-19 14:14:42 +10001020 tmp = RREG32(HDP_MISC_CNTL);
1021 tmp |= HDP_FLUSH_INVALIDATE_CACHE;
1022 WREG32(HDP_MISC_CNTL, tmp);
1023
Alex Deucherfecf1d02011-03-02 20:07:29 -05001024 hdp_host_path_cntl = RREG32(HDP_HOST_PATH_CNTL);
1025 WREG32(HDP_HOST_PATH_CNTL, hdp_host_path_cntl);
1026
1027 WREG32(PA_CL_ENHANCE, CLIP_VTX_REORDER_ENA | NUM_CLIP_SEQ(3));
1028
1029 udelay(50);
1030}
1031
Alex Deucherfa8198e2011-03-02 20:07:30 -05001032/*
1033 * GART
1034 */
1035void cayman_pcie_gart_tlb_flush(struct radeon_device *rdev)
1036{
1037 /* flush hdp cache */
1038 WREG32(HDP_MEM_COHERENCY_FLUSH_CNTL, 0x1);
1039
1040 /* bits 0-7 are the VM contexts0-7 */
1041 WREG32(VM_INVALIDATE_REQUEST, 1);
1042}
1043
Lauri Kasanen1109ca02012-08-31 13:43:50 -04001044static int cayman_pcie_gart_enable(struct radeon_device *rdev)
Alex Deucherfa8198e2011-03-02 20:07:30 -05001045{
Jerome Glisse721604a2012-01-05 22:11:05 -05001046 int i, r;
Alex Deucherfa8198e2011-03-02 20:07:30 -05001047
Jerome Glissec9a1be92011-11-03 11:16:49 -04001048 if (rdev->gart.robj == NULL) {
Alex Deucherfa8198e2011-03-02 20:07:30 -05001049 dev_err(rdev->dev, "No VRAM object for PCIE GART.\n");
1050 return -EINVAL;
1051 }
1052 r = radeon_gart_table_vram_pin(rdev);
1053 if (r)
1054 return r;
1055 radeon_gart_restore(rdev);
1056 /* Setup TLB control */
Jerome Glisse721604a2012-01-05 22:11:05 -05001057 WREG32(MC_VM_MX_L1_TLB_CNTL,
1058 (0xA << 7) |
1059 ENABLE_L1_TLB |
Alex Deucherfa8198e2011-03-02 20:07:30 -05001060 ENABLE_L1_FRAGMENT_PROCESSING |
1061 SYSTEM_ACCESS_MODE_NOT_IN_SYS |
Jerome Glisse721604a2012-01-05 22:11:05 -05001062 ENABLE_ADVANCED_DRIVER_MODEL |
Alex Deucherfa8198e2011-03-02 20:07:30 -05001063 SYSTEM_APERTURE_UNMAPPED_ACCESS_PASS_THRU);
1064 /* Setup L2 cache */
1065 WREG32(VM_L2_CNTL, ENABLE_L2_CACHE |
1066 ENABLE_L2_PTE_CACHE_LRU_UPDATE_BY_WRITE |
1067 ENABLE_L2_PDE0_CACHE_LRU_UPDATE_BY_WRITE |
1068 EFFECTIVE_L2_QUEUE_SIZE(7) |
1069 CONTEXT1_IDENTITY_ACCESS_MODE(1));
1070 WREG32(VM_L2_CNTL2, INVALIDATE_ALL_L1_TLBS | INVALIDATE_L2_CACHE);
1071 WREG32(VM_L2_CNTL3, L2_CACHE_BIGK_ASSOCIATIVITY |
1072 L2_CACHE_BIGK_FRAGMENT_SIZE(6));
1073 /* setup context0 */
1074 WREG32(VM_CONTEXT0_PAGE_TABLE_START_ADDR, rdev->mc.gtt_start >> 12);
1075 WREG32(VM_CONTEXT0_PAGE_TABLE_END_ADDR, rdev->mc.gtt_end >> 12);
1076 WREG32(VM_CONTEXT0_PAGE_TABLE_BASE_ADDR, rdev->gart.table_addr >> 12);
1077 WREG32(VM_CONTEXT0_PROTECTION_FAULT_DEFAULT_ADDR,
1078 (u32)(rdev->dummy_page.addr >> 12));
1079 WREG32(VM_CONTEXT0_CNTL2, 0);
1080 WREG32(VM_CONTEXT0_CNTL, ENABLE_CONTEXT | PAGE_TABLE_DEPTH(0) |
1081 RANGE_PROTECTION_FAULT_ENABLE_DEFAULT);
Jerome Glisse721604a2012-01-05 22:11:05 -05001082
1083 WREG32(0x15D4, 0);
1084 WREG32(0x15D8, 0);
1085 WREG32(0x15DC, 0);
1086
1087 /* empty context1-7 */
Alex Deucher23d4f1f2012-10-08 09:45:46 -04001088 /* Assign the pt base to something valid for now; the pts used for
1089 * the VMs are determined by the application and setup and assigned
1090 * on the fly in the vm part of radeon_gart.c
1091 */
Jerome Glisse721604a2012-01-05 22:11:05 -05001092 for (i = 1; i < 8; i++) {
1093 WREG32(VM_CONTEXT0_PAGE_TABLE_START_ADDR + (i << 2), 0);
Alex Deucherc1a7ca02012-10-08 12:15:13 -04001094 WREG32(VM_CONTEXT0_PAGE_TABLE_END_ADDR + (i << 2), rdev->vm_manager.max_pfn);
Jerome Glisse721604a2012-01-05 22:11:05 -05001095 WREG32(VM_CONTEXT0_PAGE_TABLE_BASE_ADDR + (i << 2),
1096 rdev->gart.table_addr >> 12);
1097 }
1098
1099 /* enable context1-7 */
1100 WREG32(VM_CONTEXT1_PROTECTION_FAULT_DEFAULT_ADDR,
1101 (u32)(rdev->dummy_page.addr >> 12));
Christian Königae133a12012-09-18 15:30:44 -04001102 WREG32(VM_CONTEXT1_CNTL2, 4);
Dmitry Cherkasovfa87e622012-09-17 19:36:19 +02001103 WREG32(VM_CONTEXT1_CNTL, ENABLE_CONTEXT | PAGE_TABLE_DEPTH(1) |
Christian Königae133a12012-09-18 15:30:44 -04001104 RANGE_PROTECTION_FAULT_ENABLE_INTERRUPT |
1105 RANGE_PROTECTION_FAULT_ENABLE_DEFAULT |
1106 DUMMY_PAGE_PROTECTION_FAULT_ENABLE_INTERRUPT |
1107 DUMMY_PAGE_PROTECTION_FAULT_ENABLE_DEFAULT |
1108 PDE0_PROTECTION_FAULT_ENABLE_INTERRUPT |
1109 PDE0_PROTECTION_FAULT_ENABLE_DEFAULT |
1110 VALID_PROTECTION_FAULT_ENABLE_INTERRUPT |
1111 VALID_PROTECTION_FAULT_ENABLE_DEFAULT |
1112 READ_PROTECTION_FAULT_ENABLE_INTERRUPT |
1113 READ_PROTECTION_FAULT_ENABLE_DEFAULT |
1114 WRITE_PROTECTION_FAULT_ENABLE_INTERRUPT |
1115 WRITE_PROTECTION_FAULT_ENABLE_DEFAULT);
Alex Deucherfa8198e2011-03-02 20:07:30 -05001116
1117 cayman_pcie_gart_tlb_flush(rdev);
Tormod Voldenfcf4de52011-08-31 21:54:07 +00001118 DRM_INFO("PCIE GART of %uM enabled (table at 0x%016llX).\n",
1119 (unsigned)(rdev->mc.gtt_size >> 20),
1120 (unsigned long long)rdev->gart.table_addr);
Alex Deucherfa8198e2011-03-02 20:07:30 -05001121 rdev->gart.ready = true;
1122 return 0;
1123}
1124
Lauri Kasanen1109ca02012-08-31 13:43:50 -04001125static void cayman_pcie_gart_disable(struct radeon_device *rdev)
Alex Deucherfa8198e2011-03-02 20:07:30 -05001126{
Alex Deucherfa8198e2011-03-02 20:07:30 -05001127 /* Disable all tables */
1128 WREG32(VM_CONTEXT0_CNTL, 0);
1129 WREG32(VM_CONTEXT1_CNTL, 0);
1130 /* Setup TLB control */
1131 WREG32(MC_VM_MX_L1_TLB_CNTL, ENABLE_L1_FRAGMENT_PROCESSING |
1132 SYSTEM_ACCESS_MODE_NOT_IN_SYS |
1133 SYSTEM_APERTURE_UNMAPPED_ACCESS_PASS_THRU);
1134 /* Setup L2 cache */
1135 WREG32(VM_L2_CNTL, ENABLE_L2_PTE_CACHE_LRU_UPDATE_BY_WRITE |
1136 ENABLE_L2_PDE0_CACHE_LRU_UPDATE_BY_WRITE |
1137 EFFECTIVE_L2_QUEUE_SIZE(7) |
1138 CONTEXT1_IDENTITY_ACCESS_MODE(1));
1139 WREG32(VM_L2_CNTL2, 0);
1140 WREG32(VM_L2_CNTL3, L2_CACHE_BIGK_ASSOCIATIVITY |
1141 L2_CACHE_BIGK_FRAGMENT_SIZE(6));
Jerome Glissec9a1be92011-11-03 11:16:49 -04001142 radeon_gart_table_vram_unpin(rdev);
Alex Deucherfa8198e2011-03-02 20:07:30 -05001143}
1144
Lauri Kasanen1109ca02012-08-31 13:43:50 -04001145static void cayman_pcie_gart_fini(struct radeon_device *rdev)
Alex Deucherfa8198e2011-03-02 20:07:30 -05001146{
1147 cayman_pcie_gart_disable(rdev);
1148 radeon_gart_table_vram_free(rdev);
1149 radeon_gart_fini(rdev);
1150}
1151
Alex Deucher1b370782011-11-17 20:13:28 -05001152void cayman_cp_int_cntl_setup(struct radeon_device *rdev,
1153 int ring, u32 cp_int_cntl)
1154{
1155 u32 srbm_gfx_cntl = RREG32(SRBM_GFX_CNTL) & ~3;
1156
1157 WREG32(SRBM_GFX_CNTL, srbm_gfx_cntl | (ring & 3));
1158 WREG32(CP_INT_CNTL, cp_int_cntl);
1159}
1160
Alex Deucher0c88a022011-03-02 20:07:31 -05001161/*
1162 * CP.
1163 */
Alex Deucherb40e7e12011-11-17 14:57:50 -05001164void cayman_fence_ring_emit(struct radeon_device *rdev,
1165 struct radeon_fence *fence)
1166{
1167 struct radeon_ring *ring = &rdev->ring[fence->ring];
1168 u64 addr = rdev->fence_drv[fence->ring].gpu_addr;
1169
Jerome Glisse721604a2012-01-05 22:11:05 -05001170 /* flush read cache over gart for this vmid */
1171 radeon_ring_write(ring, PACKET3(PACKET3_SET_CONFIG_REG, 1));
1172 radeon_ring_write(ring, (CP_COHER_CNTL2 - PACKET3_SET_CONFIG_REG_START) >> 2);
1173 radeon_ring_write(ring, 0);
Alex Deucherb40e7e12011-11-17 14:57:50 -05001174 radeon_ring_write(ring, PACKET3(PACKET3_SURFACE_SYNC, 3));
1175 radeon_ring_write(ring, PACKET3_TC_ACTION_ENA | PACKET3_SH_ACTION_ENA);
1176 radeon_ring_write(ring, 0xFFFFFFFF);
1177 radeon_ring_write(ring, 0);
1178 radeon_ring_write(ring, 10); /* poll interval */
1179 /* EVENT_WRITE_EOP - flush caches, send int */
1180 radeon_ring_write(ring, PACKET3(PACKET3_EVENT_WRITE_EOP, 4));
1181 radeon_ring_write(ring, EVENT_TYPE(CACHE_FLUSH_AND_INV_EVENT_TS) | EVENT_INDEX(5));
1182 radeon_ring_write(ring, addr & 0xffffffff);
1183 radeon_ring_write(ring, (upper_32_bits(addr) & 0xff) | DATA_SEL(1) | INT_SEL(2));
1184 radeon_ring_write(ring, fence->seq);
1185 radeon_ring_write(ring, 0);
1186}
1187
Jerome Glisse721604a2012-01-05 22:11:05 -05001188void cayman_ring_ib_execute(struct radeon_device *rdev, struct radeon_ib *ib)
1189{
Christian König876dc9f2012-05-08 14:24:01 +02001190 struct radeon_ring *ring = &rdev->ring[ib->ring];
Jerome Glisse721604a2012-01-05 22:11:05 -05001191
1192 /* set to DX10/11 mode */
1193 radeon_ring_write(ring, PACKET3(PACKET3_MODE_CONTROL, 0));
1194 radeon_ring_write(ring, 1);
Christian König45df6802012-07-06 16:22:55 +02001195
1196 if (ring->rptr_save_reg) {
1197 uint32_t next_rptr = ring->wptr + 3 + 4 + 8;
1198 radeon_ring_write(ring, PACKET3(PACKET3_SET_CONFIG_REG, 1));
1199 radeon_ring_write(ring, ((ring->rptr_save_reg -
1200 PACKET3_SET_CONFIG_REG_START) >> 2));
1201 radeon_ring_write(ring, next_rptr);
1202 }
1203
Jerome Glisse721604a2012-01-05 22:11:05 -05001204 radeon_ring_write(ring, PACKET3(PACKET3_INDIRECT_BUFFER, 2));
1205 radeon_ring_write(ring,
1206#ifdef __BIG_ENDIAN
1207 (2 << 0) |
1208#endif
1209 (ib->gpu_addr & 0xFFFFFFFC));
1210 radeon_ring_write(ring, upper_32_bits(ib->gpu_addr) & 0xFF);
Christian König4bf3dd92012-08-06 18:57:44 +02001211 radeon_ring_write(ring, ib->length_dw |
1212 (ib->vm ? (ib->vm->id << 24) : 0));
Jerome Glisse721604a2012-01-05 22:11:05 -05001213
1214 /* flush read cache over gart for this vmid */
1215 radeon_ring_write(ring, PACKET3(PACKET3_SET_CONFIG_REG, 1));
1216 radeon_ring_write(ring, (CP_COHER_CNTL2 - PACKET3_SET_CONFIG_REG_START) >> 2);
Christian König4bf3dd92012-08-06 18:57:44 +02001217 radeon_ring_write(ring, ib->vm ? ib->vm->id : 0);
Jerome Glisse721604a2012-01-05 22:11:05 -05001218 radeon_ring_write(ring, PACKET3(PACKET3_SURFACE_SYNC, 3));
1219 radeon_ring_write(ring, PACKET3_TC_ACTION_ENA | PACKET3_SH_ACTION_ENA);
1220 radeon_ring_write(ring, 0xFFFFFFFF);
1221 radeon_ring_write(ring, 0);
1222 radeon_ring_write(ring, 10); /* poll interval */
1223}
1224
Christian Königf2ba57b2013-04-08 12:41:29 +02001225void cayman_uvd_semaphore_emit(struct radeon_device *rdev,
1226 struct radeon_ring *ring,
1227 struct radeon_semaphore *semaphore,
1228 bool emit_wait)
1229{
1230 uint64_t addr = semaphore->gpu_addr;
1231
1232 radeon_ring_write(ring, PACKET0(UVD_SEMA_ADDR_LOW, 0));
1233 radeon_ring_write(ring, (addr >> 3) & 0x000FFFFF);
1234
1235 radeon_ring_write(ring, PACKET0(UVD_SEMA_ADDR_HIGH, 0));
1236 radeon_ring_write(ring, (addr >> 23) & 0x000FFFFF);
1237
1238 radeon_ring_write(ring, PACKET0(UVD_SEMA_CMD, 0));
1239 radeon_ring_write(ring, 0x80 | (emit_wait ? 1 : 0));
1240}
1241
Alex Deucher0c88a022011-03-02 20:07:31 -05001242static void cayman_cp_enable(struct radeon_device *rdev, bool enable)
1243{
1244 if (enable)
1245 WREG32(CP_ME_CNTL, 0);
1246 else {
Dave Airlie38f1cff2011-03-16 11:34:41 +10001247 radeon_ttm_set_active_vram_size(rdev, rdev->mc.visible_vram_size);
Alex Deucher0c88a022011-03-02 20:07:31 -05001248 WREG32(CP_ME_CNTL, (CP_ME_HALT | CP_PFP_HALT));
1249 WREG32(SCRATCH_UMSK, 0);
Alex Deucherf60cbd12012-12-04 15:27:33 -05001250 rdev->ring[RADEON_RING_TYPE_GFX_INDEX].ready = false;
Alex Deucher0c88a022011-03-02 20:07:31 -05001251 }
1252}
1253
1254static int cayman_cp_load_microcode(struct radeon_device *rdev)
1255{
1256 const __be32 *fw_data;
1257 int i;
1258
1259 if (!rdev->me_fw || !rdev->pfp_fw)
1260 return -EINVAL;
1261
1262 cayman_cp_enable(rdev, false);
1263
1264 fw_data = (const __be32 *)rdev->pfp_fw->data;
1265 WREG32(CP_PFP_UCODE_ADDR, 0);
1266 for (i = 0; i < CAYMAN_PFP_UCODE_SIZE; i++)
1267 WREG32(CP_PFP_UCODE_DATA, be32_to_cpup(fw_data++));
1268 WREG32(CP_PFP_UCODE_ADDR, 0);
1269
1270 fw_data = (const __be32 *)rdev->me_fw->data;
1271 WREG32(CP_ME_RAM_WADDR, 0);
1272 for (i = 0; i < CAYMAN_PM4_UCODE_SIZE; i++)
1273 WREG32(CP_ME_RAM_DATA, be32_to_cpup(fw_data++));
1274
1275 WREG32(CP_PFP_UCODE_ADDR, 0);
1276 WREG32(CP_ME_RAM_WADDR, 0);
1277 WREG32(CP_ME_RAM_RADDR, 0);
1278 return 0;
1279}
1280
1281static int cayman_cp_start(struct radeon_device *rdev)
1282{
Christian Könige32eb502011-10-23 12:56:27 +02001283 struct radeon_ring *ring = &rdev->ring[RADEON_RING_TYPE_GFX_INDEX];
Alex Deucher0c88a022011-03-02 20:07:31 -05001284 int r, i;
1285
Christian Könige32eb502011-10-23 12:56:27 +02001286 r = radeon_ring_lock(rdev, ring, 7);
Alex Deucher0c88a022011-03-02 20:07:31 -05001287 if (r) {
1288 DRM_ERROR("radeon: cp failed to lock ring (%d).\n", r);
1289 return r;
1290 }
Christian Könige32eb502011-10-23 12:56:27 +02001291 radeon_ring_write(ring, PACKET3(PACKET3_ME_INITIALIZE, 5));
1292 radeon_ring_write(ring, 0x1);
1293 radeon_ring_write(ring, 0x0);
1294 radeon_ring_write(ring, rdev->config.cayman.max_hw_contexts - 1);
1295 radeon_ring_write(ring, PACKET3_ME_INITIALIZE_DEVICE_ID(1));
1296 radeon_ring_write(ring, 0);
1297 radeon_ring_write(ring, 0);
1298 radeon_ring_unlock_commit(rdev, ring);
Alex Deucher0c88a022011-03-02 20:07:31 -05001299
1300 cayman_cp_enable(rdev, true);
1301
Christian Könige32eb502011-10-23 12:56:27 +02001302 r = radeon_ring_lock(rdev, ring, cayman_default_size + 19);
Alex Deucher0c88a022011-03-02 20:07:31 -05001303 if (r) {
1304 DRM_ERROR("radeon: cp failed to lock ring (%d).\n", r);
1305 return r;
1306 }
1307
1308 /* setup clear context state */
Christian Könige32eb502011-10-23 12:56:27 +02001309 radeon_ring_write(ring, PACKET3(PACKET3_PREAMBLE_CNTL, 0));
1310 radeon_ring_write(ring, PACKET3_PREAMBLE_BEGIN_CLEAR_STATE);
Alex Deucher0c88a022011-03-02 20:07:31 -05001311
1312 for (i = 0; i < cayman_default_size; i++)
Christian Könige32eb502011-10-23 12:56:27 +02001313 radeon_ring_write(ring, cayman_default_state[i]);
Alex Deucher0c88a022011-03-02 20:07:31 -05001314
Christian Könige32eb502011-10-23 12:56:27 +02001315 radeon_ring_write(ring, PACKET3(PACKET3_PREAMBLE_CNTL, 0));
1316 radeon_ring_write(ring, PACKET3_PREAMBLE_END_CLEAR_STATE);
Alex Deucher0c88a022011-03-02 20:07:31 -05001317
1318 /* set clear context state */
Christian Könige32eb502011-10-23 12:56:27 +02001319 radeon_ring_write(ring, PACKET3(PACKET3_CLEAR_STATE, 0));
1320 radeon_ring_write(ring, 0);
Alex Deucher0c88a022011-03-02 20:07:31 -05001321
1322 /* SQ_VTX_BASE_VTX_LOC */
Christian Könige32eb502011-10-23 12:56:27 +02001323 radeon_ring_write(ring, 0xc0026f00);
1324 radeon_ring_write(ring, 0x00000000);
1325 radeon_ring_write(ring, 0x00000000);
1326 radeon_ring_write(ring, 0x00000000);
Alex Deucher0c88a022011-03-02 20:07:31 -05001327
1328 /* Clear consts */
Christian Könige32eb502011-10-23 12:56:27 +02001329 radeon_ring_write(ring, 0xc0036f00);
1330 radeon_ring_write(ring, 0x00000bc4);
1331 radeon_ring_write(ring, 0xffffffff);
1332 radeon_ring_write(ring, 0xffffffff);
1333 radeon_ring_write(ring, 0xffffffff);
Alex Deucher0c88a022011-03-02 20:07:31 -05001334
Christian Könige32eb502011-10-23 12:56:27 +02001335 radeon_ring_write(ring, 0xc0026900);
1336 radeon_ring_write(ring, 0x00000316);
1337 radeon_ring_write(ring, 0x0000000e); /* VGT_VERTEX_REUSE_BLOCK_CNTL */
1338 radeon_ring_write(ring, 0x00000010); /* */
Alex Deucher9b91d182011-03-02 20:07:39 -05001339
Christian Könige32eb502011-10-23 12:56:27 +02001340 radeon_ring_unlock_commit(rdev, ring);
Alex Deucher0c88a022011-03-02 20:07:31 -05001341
1342 /* XXX init other rings */
1343
1344 return 0;
1345}
1346
Alex Deucher755d8192011-03-02 20:07:34 -05001347static void cayman_cp_fini(struct radeon_device *rdev)
1348{
Christian König45df6802012-07-06 16:22:55 +02001349 struct radeon_ring *ring = &rdev->ring[RADEON_RING_TYPE_GFX_INDEX];
Alex Deucher755d8192011-03-02 20:07:34 -05001350 cayman_cp_enable(rdev, false);
Christian König45df6802012-07-06 16:22:55 +02001351 radeon_ring_fini(rdev, ring);
1352 radeon_scratch_free(rdev, ring->rptr_save_reg);
Alex Deucher755d8192011-03-02 20:07:34 -05001353}
1354
Lauri Kasanen1109ca02012-08-31 13:43:50 -04001355static int cayman_cp_resume(struct radeon_device *rdev)
Alex Deucher0c88a022011-03-02 20:07:31 -05001356{
Christian Königb90ca982012-07-04 21:36:53 +02001357 static const int ridx[] = {
1358 RADEON_RING_TYPE_GFX_INDEX,
1359 CAYMAN_RING_TYPE_CP1_INDEX,
1360 CAYMAN_RING_TYPE_CP2_INDEX
1361 };
1362 static const unsigned cp_rb_cntl[] = {
1363 CP_RB0_CNTL,
1364 CP_RB1_CNTL,
1365 CP_RB2_CNTL,
1366 };
1367 static const unsigned cp_rb_rptr_addr[] = {
1368 CP_RB0_RPTR_ADDR,
1369 CP_RB1_RPTR_ADDR,
1370 CP_RB2_RPTR_ADDR
1371 };
1372 static const unsigned cp_rb_rptr_addr_hi[] = {
1373 CP_RB0_RPTR_ADDR_HI,
1374 CP_RB1_RPTR_ADDR_HI,
1375 CP_RB2_RPTR_ADDR_HI
1376 };
1377 static const unsigned cp_rb_base[] = {
1378 CP_RB0_BASE,
1379 CP_RB1_BASE,
1380 CP_RB2_BASE
1381 };
Christian Könige32eb502011-10-23 12:56:27 +02001382 struct radeon_ring *ring;
Christian Königb90ca982012-07-04 21:36:53 +02001383 int i, r;
Alex Deucher0c88a022011-03-02 20:07:31 -05001384
1385 /* Reset cp; if cp is reset, then PA, SH, VGT also need to be reset */
1386 WREG32(GRBM_SOFT_RESET, (SOFT_RESET_CP |
1387 SOFT_RESET_PA |
1388 SOFT_RESET_SH |
1389 SOFT_RESET_VGT |
Jerome Glissea49a50d2011-08-24 20:00:17 +00001390 SOFT_RESET_SPI |
Alex Deucher0c88a022011-03-02 20:07:31 -05001391 SOFT_RESET_SX));
1392 RREG32(GRBM_SOFT_RESET);
1393 mdelay(15);
1394 WREG32(GRBM_SOFT_RESET, 0);
1395 RREG32(GRBM_SOFT_RESET);
1396
Christian König15d33322011-09-15 19:02:22 +02001397 WREG32(CP_SEM_WAIT_TIMER, 0x0);
Alex Deucher11ef3f1f2012-01-20 14:47:43 -05001398 WREG32(CP_SEM_INCOMPLETE_TIMER_CNTL, 0x0);
Alex Deucher0c88a022011-03-02 20:07:31 -05001399
1400 /* Set the write pointer delay */
1401 WREG32(CP_RB_WPTR_DELAY, 0);
1402
1403 WREG32(CP_DEBUG, (1 << 27));
1404
Adam Buchbinder48fc7f72012-09-19 21:48:00 -04001405 /* set the wb address whether it's enabled or not */
Alex Deucher0c88a022011-03-02 20:07:31 -05001406 WREG32(SCRATCH_ADDR, ((rdev->wb.gpu_addr + RADEON_WB_SCRATCH_OFFSET) >> 8) & 0xFFFFFFFF);
Christian Königb90ca982012-07-04 21:36:53 +02001407 WREG32(SCRATCH_UMSK, 0xff);
Alex Deucher0c88a022011-03-02 20:07:31 -05001408
Christian Königb90ca982012-07-04 21:36:53 +02001409 for (i = 0; i < 3; ++i) {
1410 uint32_t rb_cntl;
1411 uint64_t addr;
1412
1413 /* Set ring buffer size */
1414 ring = &rdev->ring[ridx[i]];
1415 rb_cntl = drm_order(ring->ring_size / 8);
1416 rb_cntl |= drm_order(RADEON_GPU_PAGE_SIZE/8) << 8;
1417#ifdef __BIG_ENDIAN
1418 rb_cntl |= BUF_SWAP_32BIT;
1419#endif
1420 WREG32(cp_rb_cntl[i], rb_cntl);
1421
Adam Buchbinder48fc7f72012-09-19 21:48:00 -04001422 /* set the wb address whether it's enabled or not */
Christian Königb90ca982012-07-04 21:36:53 +02001423 addr = rdev->wb.gpu_addr + RADEON_WB_CP_RPTR_OFFSET;
1424 WREG32(cp_rb_rptr_addr[i], addr & 0xFFFFFFFC);
1425 WREG32(cp_rb_rptr_addr_hi[i], upper_32_bits(addr) & 0xFF);
Alex Deucher0c88a022011-03-02 20:07:31 -05001426 }
1427
Christian Königb90ca982012-07-04 21:36:53 +02001428 /* set the rb base addr, this causes an internal reset of ALL rings */
1429 for (i = 0; i < 3; ++i) {
1430 ring = &rdev->ring[ridx[i]];
1431 WREG32(cp_rb_base[i], ring->gpu_addr >> 8);
1432 }
Alex Deucher0c88a022011-03-02 20:07:31 -05001433
Christian Königb90ca982012-07-04 21:36:53 +02001434 for (i = 0; i < 3; ++i) {
1435 /* Initialize the ring buffer's read and write pointers */
1436 ring = &rdev->ring[ridx[i]];
1437 WREG32_P(cp_rb_cntl[i], RB_RPTR_WR_ENA, ~RB_RPTR_WR_ENA);
Alex Deucher0c88a022011-03-02 20:07:31 -05001438
Christian Königb90ca982012-07-04 21:36:53 +02001439 ring->rptr = ring->wptr = 0;
1440 WREG32(ring->rptr_reg, ring->rptr);
1441 WREG32(ring->wptr_reg, ring->wptr);
Alex Deucher0c88a022011-03-02 20:07:31 -05001442
Christian Königb90ca982012-07-04 21:36:53 +02001443 mdelay(1);
1444 WREG32_P(cp_rb_cntl[i], 0, ~RB_RPTR_WR_ENA);
1445 }
Alex Deucher0c88a022011-03-02 20:07:31 -05001446
1447 /* start the rings */
1448 cayman_cp_start(rdev);
Christian Könige32eb502011-10-23 12:56:27 +02001449 rdev->ring[RADEON_RING_TYPE_GFX_INDEX].ready = true;
1450 rdev->ring[CAYMAN_RING_TYPE_CP1_INDEX].ready = false;
1451 rdev->ring[CAYMAN_RING_TYPE_CP2_INDEX].ready = false;
Alex Deucher0c88a022011-03-02 20:07:31 -05001452 /* this only test cp0 */
Alex Deucherf7128122012-02-23 17:53:45 -05001453 r = radeon_ring_test(rdev, RADEON_RING_TYPE_GFX_INDEX, &rdev->ring[RADEON_RING_TYPE_GFX_INDEX]);
Alex Deucher0c88a022011-03-02 20:07:31 -05001454 if (r) {
Christian Könige32eb502011-10-23 12:56:27 +02001455 rdev->ring[RADEON_RING_TYPE_GFX_INDEX].ready = false;
1456 rdev->ring[CAYMAN_RING_TYPE_CP1_INDEX].ready = false;
1457 rdev->ring[CAYMAN_RING_TYPE_CP2_INDEX].ready = false;
Alex Deucher0c88a022011-03-02 20:07:31 -05001458 return r;
1459 }
1460
1461 return 0;
1462}
1463
Alex Deucherf60cbd12012-12-04 15:27:33 -05001464/*
1465 * DMA
1466 * Starting with R600, the GPU has an asynchronous
1467 * DMA engine. The programming model is very similar
1468 * to the 3D engine (ring buffer, IBs, etc.), but the
1469 * DMA controller has it's own packet format that is
1470 * different form the PM4 format used by the 3D engine.
1471 * It supports copying data, writing embedded data,
1472 * solid fills, and a number of other things. It also
1473 * has support for tiling/detiling of buffers.
1474 * Cayman and newer support two asynchronous DMA engines.
1475 */
1476/**
1477 * cayman_dma_ring_ib_execute - Schedule an IB on the DMA engine
1478 *
1479 * @rdev: radeon_device pointer
1480 * @ib: IB object to schedule
1481 *
1482 * Schedule an IB in the DMA ring (cayman-SI).
1483 */
1484void cayman_dma_ring_ib_execute(struct radeon_device *rdev,
1485 struct radeon_ib *ib)
1486{
1487 struct radeon_ring *ring = &rdev->ring[ib->ring];
1488
1489 if (rdev->wb.enabled) {
1490 u32 next_rptr = ring->wptr + 4;
1491 while ((next_rptr & 7) != 5)
1492 next_rptr++;
1493 next_rptr += 3;
1494 radeon_ring_write(ring, DMA_PACKET(DMA_PACKET_WRITE, 0, 0, 1));
1495 radeon_ring_write(ring, ring->next_rptr_gpu_addr & 0xfffffffc);
1496 radeon_ring_write(ring, upper_32_bits(ring->next_rptr_gpu_addr) & 0xff);
1497 radeon_ring_write(ring, next_rptr);
1498 }
1499
1500 /* The indirect buffer packet must end on an 8 DW boundary in the DMA ring.
1501 * Pad as necessary with NOPs.
1502 */
1503 while ((ring->wptr & 7) != 5)
1504 radeon_ring_write(ring, DMA_PACKET(DMA_PACKET_NOP, 0, 0, 0));
1505 radeon_ring_write(ring, DMA_IB_PACKET(DMA_PACKET_INDIRECT_BUFFER, ib->vm ? ib->vm->id : 0, 0));
1506 radeon_ring_write(ring, (ib->gpu_addr & 0xFFFFFFE0));
1507 radeon_ring_write(ring, (ib->length_dw << 12) | (upper_32_bits(ib->gpu_addr) & 0xFF));
1508
1509}
1510
1511/**
1512 * cayman_dma_stop - stop the async dma engines
1513 *
1514 * @rdev: radeon_device pointer
1515 *
1516 * Stop the async dma engines (cayman-SI).
1517 */
1518void cayman_dma_stop(struct radeon_device *rdev)
1519{
1520 u32 rb_cntl;
1521
1522 radeon_ttm_set_active_vram_size(rdev, rdev->mc.visible_vram_size);
1523
1524 /* dma0 */
1525 rb_cntl = RREG32(DMA_RB_CNTL + DMA0_REGISTER_OFFSET);
1526 rb_cntl &= ~DMA_RB_ENABLE;
1527 WREG32(DMA_RB_CNTL + DMA0_REGISTER_OFFSET, rb_cntl);
1528
1529 /* dma1 */
1530 rb_cntl = RREG32(DMA_RB_CNTL + DMA1_REGISTER_OFFSET);
1531 rb_cntl &= ~DMA_RB_ENABLE;
1532 WREG32(DMA_RB_CNTL + DMA1_REGISTER_OFFSET, rb_cntl);
1533
1534 rdev->ring[R600_RING_TYPE_DMA_INDEX].ready = false;
1535 rdev->ring[CAYMAN_RING_TYPE_DMA1_INDEX].ready = false;
1536}
1537
1538/**
1539 * cayman_dma_resume - setup and start the async dma engines
1540 *
1541 * @rdev: radeon_device pointer
1542 *
1543 * Set up the DMA ring buffers and enable them. (cayman-SI).
1544 * Returns 0 for success, error for failure.
1545 */
1546int cayman_dma_resume(struct radeon_device *rdev)
1547{
1548 struct radeon_ring *ring;
Michel Dänzerb3dfcb22013-01-24 19:02:01 +01001549 u32 rb_cntl, dma_cntl, ib_cntl;
Alex Deucherf60cbd12012-12-04 15:27:33 -05001550 u32 rb_bufsz;
1551 u32 reg_offset, wb_offset;
1552 int i, r;
1553
1554 /* Reset dma */
1555 WREG32(SRBM_SOFT_RESET, SOFT_RESET_DMA | SOFT_RESET_DMA1);
1556 RREG32(SRBM_SOFT_RESET);
1557 udelay(50);
1558 WREG32(SRBM_SOFT_RESET, 0);
1559
1560 for (i = 0; i < 2; i++) {
1561 if (i == 0) {
1562 ring = &rdev->ring[R600_RING_TYPE_DMA_INDEX];
1563 reg_offset = DMA0_REGISTER_OFFSET;
1564 wb_offset = R600_WB_DMA_RPTR_OFFSET;
1565 } else {
1566 ring = &rdev->ring[CAYMAN_RING_TYPE_DMA1_INDEX];
1567 reg_offset = DMA1_REGISTER_OFFSET;
1568 wb_offset = CAYMAN_WB_DMA1_RPTR_OFFSET;
1569 }
1570
1571 WREG32(DMA_SEM_INCOMPLETE_TIMER_CNTL + reg_offset, 0);
1572 WREG32(DMA_SEM_WAIT_FAIL_TIMER_CNTL + reg_offset, 0);
1573
1574 /* Set ring buffer size in dwords */
1575 rb_bufsz = drm_order(ring->ring_size / 4);
1576 rb_cntl = rb_bufsz << 1;
1577#ifdef __BIG_ENDIAN
1578 rb_cntl |= DMA_RB_SWAP_ENABLE | DMA_RPTR_WRITEBACK_SWAP_ENABLE;
1579#endif
1580 WREG32(DMA_RB_CNTL + reg_offset, rb_cntl);
1581
1582 /* Initialize the ring buffer's read and write pointers */
1583 WREG32(DMA_RB_RPTR + reg_offset, 0);
1584 WREG32(DMA_RB_WPTR + reg_offset, 0);
1585
1586 /* set the wb address whether it's enabled or not */
1587 WREG32(DMA_RB_RPTR_ADDR_HI + reg_offset,
1588 upper_32_bits(rdev->wb.gpu_addr + wb_offset) & 0xFF);
1589 WREG32(DMA_RB_RPTR_ADDR_LO + reg_offset,
1590 ((rdev->wb.gpu_addr + wb_offset) & 0xFFFFFFFC));
1591
1592 if (rdev->wb.enabled)
1593 rb_cntl |= DMA_RPTR_WRITEBACK_ENABLE;
1594
1595 WREG32(DMA_RB_BASE + reg_offset, ring->gpu_addr >> 8);
1596
1597 /* enable DMA IBs */
Michel Dänzerb3dfcb22013-01-24 19:02:01 +01001598 ib_cntl = DMA_IB_ENABLE | CMD_VMID_FORCE;
1599#ifdef __BIG_ENDIAN
1600 ib_cntl |= DMA_IB_SWAP_ENABLE;
1601#endif
1602 WREG32(DMA_IB_CNTL + reg_offset, ib_cntl);
Alex Deucherf60cbd12012-12-04 15:27:33 -05001603
1604 dma_cntl = RREG32(DMA_CNTL + reg_offset);
1605 dma_cntl &= ~CTXEMPTY_INT_ENABLE;
1606 WREG32(DMA_CNTL + reg_offset, dma_cntl);
1607
1608 ring->wptr = 0;
1609 WREG32(DMA_RB_WPTR + reg_offset, ring->wptr << 2);
1610
1611 ring->rptr = RREG32(DMA_RB_RPTR + reg_offset) >> 2;
1612
1613 WREG32(DMA_RB_CNTL + reg_offset, rb_cntl | DMA_RB_ENABLE);
1614
1615 ring->ready = true;
1616
1617 r = radeon_ring_test(rdev, ring->idx, ring);
1618 if (r) {
1619 ring->ready = false;
1620 return r;
1621 }
1622 }
1623
1624 radeon_ttm_set_active_vram_size(rdev, rdev->mc.real_vram_size);
1625
1626 return 0;
1627}
1628
1629/**
1630 * cayman_dma_fini - tear down the async dma engines
1631 *
1632 * @rdev: radeon_device pointer
1633 *
1634 * Stop the async dma engines and free the rings (cayman-SI).
1635 */
1636void cayman_dma_fini(struct radeon_device *rdev)
1637{
1638 cayman_dma_stop(rdev);
1639 radeon_ring_fini(rdev, &rdev->ring[R600_RING_TYPE_DMA_INDEX]);
1640 radeon_ring_fini(rdev, &rdev->ring[CAYMAN_RING_TYPE_DMA1_INDEX]);
1641}
1642
Alex Deucher168757e2013-01-18 19:17:22 -05001643static u32 cayman_gpu_check_soft_reset(struct radeon_device *rdev)
1644{
1645 u32 reset_mask = 0;
1646 u32 tmp;
1647
1648 /* GRBM_STATUS */
1649 tmp = RREG32(GRBM_STATUS);
1650 if (tmp & (PA_BUSY | SC_BUSY |
1651 SH_BUSY | SX_BUSY |
1652 TA_BUSY | VGT_BUSY |
1653 DB_BUSY | CB_BUSY |
1654 GDS_BUSY | SPI_BUSY |
1655 IA_BUSY | IA_BUSY_NO_DMA))
1656 reset_mask |= RADEON_RESET_GFX;
1657
1658 if (tmp & (CF_RQ_PENDING | PF_RQ_PENDING |
1659 CP_BUSY | CP_COHERENCY_BUSY))
1660 reset_mask |= RADEON_RESET_CP;
1661
1662 if (tmp & GRBM_EE_BUSY)
1663 reset_mask |= RADEON_RESET_GRBM | RADEON_RESET_GFX | RADEON_RESET_CP;
1664
1665 /* DMA_STATUS_REG 0 */
1666 tmp = RREG32(DMA_STATUS_REG + DMA0_REGISTER_OFFSET);
1667 if (!(tmp & DMA_IDLE))
1668 reset_mask |= RADEON_RESET_DMA;
1669
1670 /* DMA_STATUS_REG 1 */
1671 tmp = RREG32(DMA_STATUS_REG + DMA1_REGISTER_OFFSET);
1672 if (!(tmp & DMA_IDLE))
1673 reset_mask |= RADEON_RESET_DMA1;
1674
1675 /* SRBM_STATUS2 */
1676 tmp = RREG32(SRBM_STATUS2);
1677 if (tmp & DMA_BUSY)
1678 reset_mask |= RADEON_RESET_DMA;
1679
1680 if (tmp & DMA1_BUSY)
1681 reset_mask |= RADEON_RESET_DMA1;
1682
1683 /* SRBM_STATUS */
1684 tmp = RREG32(SRBM_STATUS);
1685 if (tmp & (RLC_RQ_PENDING | RLC_BUSY))
1686 reset_mask |= RADEON_RESET_RLC;
1687
1688 if (tmp & IH_BUSY)
1689 reset_mask |= RADEON_RESET_IH;
1690
1691 if (tmp & SEM_BUSY)
1692 reset_mask |= RADEON_RESET_SEM;
1693
1694 if (tmp & GRBM_RQ_PENDING)
1695 reset_mask |= RADEON_RESET_GRBM;
1696
1697 if (tmp & VMC_BUSY)
1698 reset_mask |= RADEON_RESET_VMC;
1699
1700 if (tmp & (MCB_BUSY | MCB_NON_DISPLAY_BUSY |
1701 MCC_BUSY | MCD_BUSY))
1702 reset_mask |= RADEON_RESET_MC;
1703
1704 if (evergreen_is_display_hung(rdev))
1705 reset_mask |= RADEON_RESET_DISPLAY;
1706
1707 /* VM_L2_STATUS */
1708 tmp = RREG32(VM_L2_STATUS);
1709 if (tmp & L2_BUSY)
1710 reset_mask |= RADEON_RESET_VMC;
1711
Alex Deucherd808fc82013-02-28 10:03:08 -05001712 /* Skip MC reset as it's mostly likely not hung, just busy */
1713 if (reset_mask & RADEON_RESET_MC) {
1714 DRM_DEBUG("MC busy: 0x%08X, clearing.\n", reset_mask);
1715 reset_mask &= ~RADEON_RESET_MC;
1716 }
1717
Alex Deucher168757e2013-01-18 19:17:22 -05001718 return reset_mask;
1719}
1720
1721static void cayman_gpu_soft_reset(struct radeon_device *rdev, u32 reset_mask)
Alex Deucher271d6fed2013-01-03 12:48:05 -05001722{
1723 struct evergreen_mc_save save;
Alex Deucher187e3592013-01-18 14:51:38 -05001724 u32 grbm_soft_reset = 0, srbm_soft_reset = 0;
1725 u32 tmp;
Alex Deucher19fc42e2013-01-14 11:04:39 -05001726
Alex Deucher271d6fed2013-01-03 12:48:05 -05001727 if (reset_mask == 0)
Alex Deucher168757e2013-01-18 19:17:22 -05001728 return;
Alex Deucher271d6fed2013-01-03 12:48:05 -05001729
1730 dev_info(rdev->dev, "GPU softreset: 0x%08X\n", reset_mask);
1731
Alex Deucher187e3592013-01-18 14:51:38 -05001732 evergreen_print_gpu_status_regs(rdev);
Alex Deucher271d6fed2013-01-03 12:48:05 -05001733 dev_info(rdev->dev, " VM_CONTEXT0_PROTECTION_FAULT_ADDR 0x%08X\n",
1734 RREG32(0x14F8));
1735 dev_info(rdev->dev, " VM_CONTEXT0_PROTECTION_FAULT_STATUS 0x%08X\n",
1736 RREG32(0x14D8));
1737 dev_info(rdev->dev, " VM_CONTEXT1_PROTECTION_FAULT_ADDR 0x%08X\n",
1738 RREG32(0x14FC));
1739 dev_info(rdev->dev, " VM_CONTEXT1_PROTECTION_FAULT_STATUS 0x%08X\n",
1740 RREG32(0x14DC));
1741
Alex Deucher187e3592013-01-18 14:51:38 -05001742 /* Disable CP parsing/prefetching */
1743 WREG32(CP_ME_CNTL, CP_ME_HALT | CP_PFP_HALT);
1744
1745 if (reset_mask & RADEON_RESET_DMA) {
1746 /* dma0 */
1747 tmp = RREG32(DMA_RB_CNTL + DMA0_REGISTER_OFFSET);
1748 tmp &= ~DMA_RB_ENABLE;
1749 WREG32(DMA_RB_CNTL + DMA0_REGISTER_OFFSET, tmp);
Alex Deucher168757e2013-01-18 19:17:22 -05001750 }
Alex Deucher187e3592013-01-18 14:51:38 -05001751
Alex Deucher168757e2013-01-18 19:17:22 -05001752 if (reset_mask & RADEON_RESET_DMA1) {
Alex Deucher187e3592013-01-18 14:51:38 -05001753 /* dma1 */
1754 tmp = RREG32(DMA_RB_CNTL + DMA1_REGISTER_OFFSET);
1755 tmp &= ~DMA_RB_ENABLE;
1756 WREG32(DMA_RB_CNTL + DMA1_REGISTER_OFFSET, tmp);
1757 }
1758
Alex Deucher90fb8772013-01-23 18:59:17 -05001759 udelay(50);
1760
1761 evergreen_mc_stop(rdev, &save);
1762 if (evergreen_mc_wait_for_idle(rdev)) {
1763 dev_warn(rdev->dev, "Wait for MC idle timedout !\n");
1764 }
1765
Alex Deucher187e3592013-01-18 14:51:38 -05001766 if (reset_mask & (RADEON_RESET_GFX | RADEON_RESET_COMPUTE)) {
1767 grbm_soft_reset = SOFT_RESET_CB |
1768 SOFT_RESET_DB |
1769 SOFT_RESET_GDS |
1770 SOFT_RESET_PA |
1771 SOFT_RESET_SC |
1772 SOFT_RESET_SPI |
1773 SOFT_RESET_SH |
1774 SOFT_RESET_SX |
1775 SOFT_RESET_TC |
1776 SOFT_RESET_TA |
1777 SOFT_RESET_VGT |
1778 SOFT_RESET_IA;
1779 }
1780
1781 if (reset_mask & RADEON_RESET_CP) {
1782 grbm_soft_reset |= SOFT_RESET_CP | SOFT_RESET_VGT;
1783
1784 srbm_soft_reset |= SOFT_RESET_GRBM;
1785 }
Alex Deucher271d6fed2013-01-03 12:48:05 -05001786
1787 if (reset_mask & RADEON_RESET_DMA)
Alex Deucher168757e2013-01-18 19:17:22 -05001788 srbm_soft_reset |= SOFT_RESET_DMA;
1789
1790 if (reset_mask & RADEON_RESET_DMA1)
1791 srbm_soft_reset |= SOFT_RESET_DMA1;
1792
1793 if (reset_mask & RADEON_RESET_DISPLAY)
1794 srbm_soft_reset |= SOFT_RESET_DC;
1795
1796 if (reset_mask & RADEON_RESET_RLC)
1797 srbm_soft_reset |= SOFT_RESET_RLC;
1798
1799 if (reset_mask & RADEON_RESET_SEM)
1800 srbm_soft_reset |= SOFT_RESET_SEM;
1801
1802 if (reset_mask & RADEON_RESET_IH)
1803 srbm_soft_reset |= SOFT_RESET_IH;
1804
1805 if (reset_mask & RADEON_RESET_GRBM)
1806 srbm_soft_reset |= SOFT_RESET_GRBM;
1807
1808 if (reset_mask & RADEON_RESET_VMC)
1809 srbm_soft_reset |= SOFT_RESET_VMC;
1810
Alex Deucher24178ec2013-01-24 15:00:17 -05001811 if (!(rdev->flags & RADEON_IS_IGP)) {
1812 if (reset_mask & RADEON_RESET_MC)
1813 srbm_soft_reset |= SOFT_RESET_MC;
1814 }
Alex Deucher187e3592013-01-18 14:51:38 -05001815
1816 if (grbm_soft_reset) {
1817 tmp = RREG32(GRBM_SOFT_RESET);
1818 tmp |= grbm_soft_reset;
1819 dev_info(rdev->dev, "GRBM_SOFT_RESET=0x%08X\n", tmp);
1820 WREG32(GRBM_SOFT_RESET, tmp);
1821 tmp = RREG32(GRBM_SOFT_RESET);
1822
1823 udelay(50);
1824
1825 tmp &= ~grbm_soft_reset;
1826 WREG32(GRBM_SOFT_RESET, tmp);
1827 tmp = RREG32(GRBM_SOFT_RESET);
1828 }
1829
1830 if (srbm_soft_reset) {
1831 tmp = RREG32(SRBM_SOFT_RESET);
1832 tmp |= srbm_soft_reset;
1833 dev_info(rdev->dev, "SRBM_SOFT_RESET=0x%08X\n", tmp);
1834 WREG32(SRBM_SOFT_RESET, tmp);
1835 tmp = RREG32(SRBM_SOFT_RESET);
1836
1837 udelay(50);
1838
1839 tmp &= ~srbm_soft_reset;
1840 WREG32(SRBM_SOFT_RESET, tmp);
1841 tmp = RREG32(SRBM_SOFT_RESET);
1842 }
Alex Deucher271d6fed2013-01-03 12:48:05 -05001843
1844 /* Wait a little for things to settle down */
1845 udelay(50);
1846
Alex Deucherb9952a82011-03-02 20:07:33 -05001847 evergreen_mc_resume(rdev, &save);
Alex Deucher187e3592013-01-18 14:51:38 -05001848 udelay(50);
Alex Deucher410a3412013-01-18 13:05:39 -05001849
Alex Deucher187e3592013-01-18 14:51:38 -05001850 evergreen_print_gpu_status_regs(rdev);
Alex Deucherb9952a82011-03-02 20:07:33 -05001851}
1852
1853int cayman_asic_reset(struct radeon_device *rdev)
1854{
Alex Deucher168757e2013-01-18 19:17:22 -05001855 u32 reset_mask;
1856
1857 reset_mask = cayman_gpu_check_soft_reset(rdev);
1858
1859 if (reset_mask)
1860 r600_set_bios_scratch_engine_hung(rdev, true);
1861
1862 cayman_gpu_soft_reset(rdev, reset_mask);
1863
1864 reset_mask = cayman_gpu_check_soft_reset(rdev);
1865
1866 if (!reset_mask)
1867 r600_set_bios_scratch_engine_hung(rdev, false);
1868
1869 return 0;
Alex Deucherb9952a82011-03-02 20:07:33 -05001870}
1871
Alex Deucherf60cbd12012-12-04 15:27:33 -05001872/**
Alex Deucher123bc182013-01-24 11:37:19 -05001873 * cayman_gfx_is_lockup - Check if the GFX engine is locked up
1874 *
1875 * @rdev: radeon_device pointer
1876 * @ring: radeon_ring structure holding ring information
1877 *
1878 * Check if the GFX engine is locked up.
1879 * Returns true if the engine appears to be locked up, false if not.
1880 */
1881bool cayman_gfx_is_lockup(struct radeon_device *rdev, struct radeon_ring *ring)
1882{
1883 u32 reset_mask = cayman_gpu_check_soft_reset(rdev);
1884
1885 if (!(reset_mask & (RADEON_RESET_GFX |
1886 RADEON_RESET_COMPUTE |
1887 RADEON_RESET_CP))) {
1888 radeon_ring_lockup_update(ring);
1889 return false;
1890 }
1891 /* force CP activities */
1892 radeon_ring_force_activity(rdev, ring);
1893 return radeon_ring_test_lockup(rdev, ring);
1894}
1895
1896/**
Alex Deucherf60cbd12012-12-04 15:27:33 -05001897 * cayman_dma_is_lockup - Check if the DMA engine is locked up
1898 *
1899 * @rdev: radeon_device pointer
1900 * @ring: radeon_ring structure holding ring information
1901 *
Alex Deucher123bc182013-01-24 11:37:19 -05001902 * Check if the async DMA engine is locked up.
Alex Deucherf60cbd12012-12-04 15:27:33 -05001903 * Returns true if the engine appears to be locked up, false if not.
1904 */
1905bool cayman_dma_is_lockup(struct radeon_device *rdev, struct radeon_ring *ring)
1906{
Alex Deucher123bc182013-01-24 11:37:19 -05001907 u32 reset_mask = cayman_gpu_check_soft_reset(rdev);
1908 u32 mask;
Alex Deucherf60cbd12012-12-04 15:27:33 -05001909
1910 if (ring->idx == R600_RING_TYPE_DMA_INDEX)
Alex Deucher123bc182013-01-24 11:37:19 -05001911 mask = RADEON_RESET_DMA;
Alex Deucherf60cbd12012-12-04 15:27:33 -05001912 else
Alex Deucher123bc182013-01-24 11:37:19 -05001913 mask = RADEON_RESET_DMA1;
1914
1915 if (!(reset_mask & mask)) {
Alex Deucherf60cbd12012-12-04 15:27:33 -05001916 radeon_ring_lockup_update(ring);
1917 return false;
1918 }
1919 /* force ring activities */
1920 radeon_ring_force_activity(rdev, ring);
1921 return radeon_ring_test_lockup(rdev, ring);
1922}
1923
Alex Deucher755d8192011-03-02 20:07:34 -05001924static int cayman_startup(struct radeon_device *rdev)
1925{
Christian Könige32eb502011-10-23 12:56:27 +02001926 struct radeon_ring *ring = &rdev->ring[RADEON_RING_TYPE_GFX_INDEX];
Alex Deucher755d8192011-03-02 20:07:34 -05001927 int r;
1928
Ilija Hadzicb07759b2011-09-20 10:22:58 -04001929 /* enable pcie gen2 link */
1930 evergreen_pcie_gen2_enable(rdev);
1931
Alex Deucherc420c742012-03-20 17:18:39 -04001932 if (rdev->flags & RADEON_IS_IGP) {
1933 if (!rdev->me_fw || !rdev->pfp_fw || !rdev->rlc_fw) {
1934 r = ni_init_microcode(rdev);
1935 if (r) {
1936 DRM_ERROR("Failed to load firmware!\n");
1937 return r;
1938 }
1939 }
1940 } else {
1941 if (!rdev->me_fw || !rdev->pfp_fw || !rdev->rlc_fw || !rdev->mc_fw) {
1942 r = ni_init_microcode(rdev);
1943 if (r) {
1944 DRM_ERROR("Failed to load firmware!\n");
1945 return r;
1946 }
1947 }
1948
1949 r = ni_mc_load_microcode(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05001950 if (r) {
Alex Deucherc420c742012-03-20 17:18:39 -04001951 DRM_ERROR("Failed to load MC firmware!\n");
Alex Deucher755d8192011-03-02 20:07:34 -05001952 return r;
1953 }
1954 }
Alex Deucher755d8192011-03-02 20:07:34 -05001955
Alex Deucher16cdf042011-10-28 10:30:02 -04001956 r = r600_vram_scratch_init(rdev);
1957 if (r)
1958 return r;
1959
Alex Deucher755d8192011-03-02 20:07:34 -05001960 evergreen_mc_program(rdev);
1961 r = cayman_pcie_gart_enable(rdev);
1962 if (r)
1963 return r;
1964 cayman_gpu_init(rdev);
1965
Alex Deuchercb92d452011-05-25 16:39:00 -04001966 r = evergreen_blit_init(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05001967 if (r) {
Ilija Hadzicfb3d9e92011-10-12 23:29:41 -04001968 r600_blit_fini(rdev);
Alex Deucher27cd7762012-02-23 17:53:42 -05001969 rdev->asic->copy.copy = NULL;
Alex Deucher755d8192011-03-02 20:07:34 -05001970 dev_warn(rdev->dev, "failed blitter (%d) falling back to memcpy\n", r);
1971 }
Alex Deucher755d8192011-03-02 20:07:34 -05001972
Alex Deucherc420c742012-03-20 17:18:39 -04001973 /* allocate rlc buffers */
1974 if (rdev->flags & RADEON_IS_IGP) {
1975 r = si_rlc_init(rdev);
1976 if (r) {
1977 DRM_ERROR("Failed to init rlc BOs!\n");
1978 return r;
1979 }
1980 }
1981
Alex Deucher755d8192011-03-02 20:07:34 -05001982 /* allocate wb buffer */
1983 r = radeon_wb_init(rdev);
1984 if (r)
1985 return r;
1986
Jerome Glisse30eb77f2011-11-20 20:45:34 +00001987 r = radeon_fence_driver_start_ring(rdev, RADEON_RING_TYPE_GFX_INDEX);
1988 if (r) {
1989 dev_err(rdev->dev, "failed initializing CP fences (%d).\n", r);
1990 return r;
1991 }
1992
Christian Königf2ba57b2013-04-08 12:41:29 +02001993 r = rv770_uvd_resume(rdev);
1994 if (!r) {
1995 r = radeon_fence_driver_start_ring(rdev,
1996 R600_RING_TYPE_UVD_INDEX);
1997 if (r)
1998 dev_err(rdev->dev, "UVD fences init error (%d).\n", r);
1999 }
2000 if (r)
2001 rdev->ring[R600_RING_TYPE_UVD_INDEX].ring_size = 0;
2002
Jerome Glisse30eb77f2011-11-20 20:45:34 +00002003 r = radeon_fence_driver_start_ring(rdev, CAYMAN_RING_TYPE_CP1_INDEX);
2004 if (r) {
2005 dev_err(rdev->dev, "failed initializing CP fences (%d).\n", r);
2006 return r;
2007 }
2008
2009 r = radeon_fence_driver_start_ring(rdev, CAYMAN_RING_TYPE_CP2_INDEX);
2010 if (r) {
2011 dev_err(rdev->dev, "failed initializing CP fences (%d).\n", r);
2012 return r;
2013 }
2014
Alex Deucherf60cbd12012-12-04 15:27:33 -05002015 r = radeon_fence_driver_start_ring(rdev, R600_RING_TYPE_DMA_INDEX);
2016 if (r) {
2017 dev_err(rdev->dev, "failed initializing DMA fences (%d).\n", r);
2018 return r;
2019 }
2020
2021 r = radeon_fence_driver_start_ring(rdev, CAYMAN_RING_TYPE_DMA1_INDEX);
2022 if (r) {
2023 dev_err(rdev->dev, "failed initializing DMA fences (%d).\n", r);
2024 return r;
2025 }
2026
Alex Deucher755d8192011-03-02 20:07:34 -05002027 /* Enable IRQ */
2028 r = r600_irq_init(rdev);
2029 if (r) {
2030 DRM_ERROR("radeon: IH init failed (%d).\n", r);
2031 radeon_irq_kms_fini(rdev);
2032 return r;
2033 }
2034 evergreen_irq_set(rdev);
2035
Christian Könige32eb502011-10-23 12:56:27 +02002036 r = radeon_ring_init(rdev, ring, ring->ring_size, RADEON_WB_CP_RPTR_OFFSET,
Alex Deucher78c55602011-11-17 14:25:56 -05002037 CP_RB0_RPTR, CP_RB0_WPTR,
2038 0, 0xfffff, RADEON_CP_PACKET2);
Alex Deucher755d8192011-03-02 20:07:34 -05002039 if (r)
2040 return r;
Alex Deucherf60cbd12012-12-04 15:27:33 -05002041
2042 ring = &rdev->ring[R600_RING_TYPE_DMA_INDEX];
2043 r = radeon_ring_init(rdev, ring, ring->ring_size, R600_WB_DMA_RPTR_OFFSET,
2044 DMA_RB_RPTR + DMA0_REGISTER_OFFSET,
2045 DMA_RB_WPTR + DMA0_REGISTER_OFFSET,
2046 2, 0x3fffc, DMA_PACKET(DMA_PACKET_NOP, 0, 0, 0));
2047 if (r)
2048 return r;
2049
2050 ring = &rdev->ring[CAYMAN_RING_TYPE_DMA1_INDEX];
2051 r = radeon_ring_init(rdev, ring, ring->ring_size, CAYMAN_WB_DMA1_RPTR_OFFSET,
2052 DMA_RB_RPTR + DMA1_REGISTER_OFFSET,
2053 DMA_RB_WPTR + DMA1_REGISTER_OFFSET,
2054 2, 0x3fffc, DMA_PACKET(DMA_PACKET_NOP, 0, 0, 0));
2055 if (r)
2056 return r;
2057
Alex Deucher755d8192011-03-02 20:07:34 -05002058 r = cayman_cp_load_microcode(rdev);
2059 if (r)
2060 return r;
2061 r = cayman_cp_resume(rdev);
2062 if (r)
2063 return r;
2064
Alex Deucherf60cbd12012-12-04 15:27:33 -05002065 r = cayman_dma_resume(rdev);
2066 if (r)
2067 return r;
2068
Christian Königf2ba57b2013-04-08 12:41:29 +02002069 ring = &rdev->ring[R600_RING_TYPE_UVD_INDEX];
2070 if (ring->ring_size) {
2071 r = radeon_ring_init(rdev, ring, ring->ring_size,
2072 R600_WB_UVD_RPTR_OFFSET,
2073 UVD_RBC_RB_RPTR, UVD_RBC_RB_WPTR,
2074 0, 0xfffff, RADEON_CP_PACKET2);
2075 if (!r)
2076 r = r600_uvd_init(rdev);
2077 if (r)
2078 DRM_ERROR("radeon: failed initializing UVD (%d).\n", r);
2079 }
2080
Christian König2898c342012-07-05 11:55:34 +02002081 r = radeon_ib_pool_init(rdev);
2082 if (r) {
2083 dev_err(rdev->dev, "IB initialization failed (%d).\n", r);
Jerome Glisseb15ba512011-11-15 11:48:34 -05002084 return r;
Christian König2898c342012-07-05 11:55:34 +02002085 }
Jerome Glisseb15ba512011-11-15 11:48:34 -05002086
Christian Königc6105f22012-07-05 14:32:00 +02002087 r = radeon_vm_manager_init(rdev);
2088 if (r) {
2089 dev_err(rdev->dev, "vm manager initialization failed (%d).\n", r);
Jerome Glisse721604a2012-01-05 22:11:05 -05002090 return r;
Christian Königc6105f22012-07-05 14:32:00 +02002091 }
Jerome Glisse721604a2012-01-05 22:11:05 -05002092
Rafał Miłecki6b53a052012-06-11 12:34:01 +02002093 r = r600_audio_init(rdev);
2094 if (r)
2095 return r;
2096
Alex Deucher755d8192011-03-02 20:07:34 -05002097 return 0;
2098}
2099
2100int cayman_resume(struct radeon_device *rdev)
2101{
2102 int r;
2103
2104 /* Do not reset GPU before posting, on rv770 hw unlike on r500 hw,
2105 * posting will perform necessary task to bring back GPU into good
2106 * shape.
2107 */
2108 /* post card */
2109 atom_asic_init(rdev->mode_info.atom_context);
2110
Alex Deuchera2c96a22013-02-28 17:58:36 -05002111 /* init golden registers */
2112 ni_init_golden_registers(rdev);
2113
Jerome Glisseb15ba512011-11-15 11:48:34 -05002114 rdev->accel_working = true;
Alex Deucher755d8192011-03-02 20:07:34 -05002115 r = cayman_startup(rdev);
2116 if (r) {
2117 DRM_ERROR("cayman startup failed on resume\n");
Jerome Glisse6b7746e2012-02-20 17:57:20 -05002118 rdev->accel_working = false;
Alex Deucher755d8192011-03-02 20:07:34 -05002119 return r;
2120 }
Alex Deucher755d8192011-03-02 20:07:34 -05002121 return r;
Alex Deucher755d8192011-03-02 20:07:34 -05002122}
2123
2124int cayman_suspend(struct radeon_device *rdev)
2125{
Rafał Miłecki6b53a052012-06-11 12:34:01 +02002126 r600_audio_fini(rdev);
Alex Deucherfa3daf92013-03-11 15:32:26 -04002127 radeon_vm_manager_fini(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05002128 cayman_cp_enable(rdev, false);
Alex Deucherf60cbd12012-12-04 15:27:33 -05002129 cayman_dma_stop(rdev);
Christian Königf2ba57b2013-04-08 12:41:29 +02002130 r600_uvd_rbc_stop(rdev);
2131 radeon_uvd_suspend(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05002132 evergreen_irq_suspend(rdev);
2133 radeon_wb_disable(rdev);
2134 cayman_pcie_gart_disable(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05002135 return 0;
2136}
2137
2138/* Plan is to move initialization in that function and use
2139 * helper function so that radeon_device_init pretty much
2140 * do nothing more than calling asic specific function. This
2141 * should also allow to remove a bunch of callback function
2142 * like vram_info.
2143 */
2144int cayman_init(struct radeon_device *rdev)
2145{
Christian Könige32eb502011-10-23 12:56:27 +02002146 struct radeon_ring *ring = &rdev->ring[RADEON_RING_TYPE_GFX_INDEX];
Alex Deucher755d8192011-03-02 20:07:34 -05002147 int r;
2148
Alex Deucher755d8192011-03-02 20:07:34 -05002149 /* Read BIOS */
2150 if (!radeon_get_bios(rdev)) {
2151 if (ASIC_IS_AVIVO(rdev))
2152 return -EINVAL;
2153 }
2154 /* Must be an ATOMBIOS */
2155 if (!rdev->is_atom_bios) {
2156 dev_err(rdev->dev, "Expecting atombios for cayman GPU\n");
2157 return -EINVAL;
2158 }
2159 r = radeon_atombios_init(rdev);
2160 if (r)
2161 return r;
2162
2163 /* Post card if necessary */
2164 if (!radeon_card_posted(rdev)) {
2165 if (!rdev->bios) {
2166 dev_err(rdev->dev, "Card not posted and no BIOS - ignoring\n");
2167 return -EINVAL;
2168 }
2169 DRM_INFO("GPU not posted. posting now...\n");
2170 atom_asic_init(rdev->mode_info.atom_context);
2171 }
Alex Deuchera2c96a22013-02-28 17:58:36 -05002172 /* init golden registers */
2173 ni_init_golden_registers(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05002174 /* Initialize scratch registers */
2175 r600_scratch_init(rdev);
2176 /* Initialize surface registers */
2177 radeon_surface_init(rdev);
2178 /* Initialize clocks */
2179 radeon_get_clock_info(rdev->ddev);
2180 /* Fence driver */
Jerome Glisse30eb77f2011-11-20 20:45:34 +00002181 r = radeon_fence_driver_init(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05002182 if (r)
2183 return r;
2184 /* initialize memory controller */
2185 r = evergreen_mc_init(rdev);
2186 if (r)
2187 return r;
2188 /* Memory manager */
2189 r = radeon_bo_init(rdev);
2190 if (r)
2191 return r;
2192
2193 r = radeon_irq_kms_init(rdev);
2194 if (r)
2195 return r;
2196
Christian Könige32eb502011-10-23 12:56:27 +02002197 ring->ring_obj = NULL;
2198 r600_ring_init(rdev, ring, 1024 * 1024);
Alex Deucher755d8192011-03-02 20:07:34 -05002199
Alex Deucherf60cbd12012-12-04 15:27:33 -05002200 ring = &rdev->ring[R600_RING_TYPE_DMA_INDEX];
2201 ring->ring_obj = NULL;
2202 r600_ring_init(rdev, ring, 64 * 1024);
2203
2204 ring = &rdev->ring[CAYMAN_RING_TYPE_DMA1_INDEX];
2205 ring->ring_obj = NULL;
2206 r600_ring_init(rdev, ring, 64 * 1024);
2207
Christian Königf2ba57b2013-04-08 12:41:29 +02002208 r = radeon_uvd_init(rdev);
2209 if (!r) {
2210 ring = &rdev->ring[R600_RING_TYPE_UVD_INDEX];
2211 ring->ring_obj = NULL;
2212 r600_ring_init(rdev, ring, 4096);
2213 }
2214
Alex Deucher755d8192011-03-02 20:07:34 -05002215 rdev->ih.ring_obj = NULL;
2216 r600_ih_ring_init(rdev, 64 * 1024);
2217
2218 r = r600_pcie_gart_init(rdev);
2219 if (r)
2220 return r;
2221
2222 rdev->accel_working = true;
2223 r = cayman_startup(rdev);
2224 if (r) {
2225 dev_err(rdev->dev, "disabling GPU acceleration\n");
2226 cayman_cp_fini(rdev);
Alex Deucherf60cbd12012-12-04 15:27:33 -05002227 cayman_dma_fini(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05002228 r600_irq_fini(rdev);
Alex Deucherc420c742012-03-20 17:18:39 -04002229 if (rdev->flags & RADEON_IS_IGP)
2230 si_rlc_fini(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05002231 radeon_wb_fini(rdev);
Christian König2898c342012-07-05 11:55:34 +02002232 radeon_ib_pool_fini(rdev);
Jerome Glisse721604a2012-01-05 22:11:05 -05002233 radeon_vm_manager_fini(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05002234 radeon_irq_kms_fini(rdev);
2235 cayman_pcie_gart_fini(rdev);
2236 rdev->accel_working = false;
2237 }
Alex Deucher755d8192011-03-02 20:07:34 -05002238
2239 /* Don't start up if the MC ucode is missing.
2240 * The default clocks and voltages before the MC ucode
2241 * is loaded are not suffient for advanced operations.
Alex Deucherc420c742012-03-20 17:18:39 -04002242 *
2243 * We can skip this check for TN, because there is no MC
2244 * ucode.
Alex Deucher755d8192011-03-02 20:07:34 -05002245 */
Alex Deucherc420c742012-03-20 17:18:39 -04002246 if (!rdev->mc_fw && !(rdev->flags & RADEON_IS_IGP)) {
Alex Deucher755d8192011-03-02 20:07:34 -05002247 DRM_ERROR("radeon: MC ucode required for NI+.\n");
2248 return -EINVAL;
2249 }
2250
2251 return 0;
2252}
2253
2254void cayman_fini(struct radeon_device *rdev)
2255{
Ilija Hadzicfb3d9e92011-10-12 23:29:41 -04002256 r600_blit_fini(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05002257 cayman_cp_fini(rdev);
Alex Deucherf60cbd12012-12-04 15:27:33 -05002258 cayman_dma_fini(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05002259 r600_irq_fini(rdev);
Alex Deucherc420c742012-03-20 17:18:39 -04002260 if (rdev->flags & RADEON_IS_IGP)
2261 si_rlc_fini(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05002262 radeon_wb_fini(rdev);
Jerome Glisse721604a2012-01-05 22:11:05 -05002263 radeon_vm_manager_fini(rdev);
Christian König2898c342012-07-05 11:55:34 +02002264 radeon_ib_pool_fini(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05002265 radeon_irq_kms_fini(rdev);
Christian Königf2ba57b2013-04-08 12:41:29 +02002266 radeon_uvd_fini(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05002267 cayman_pcie_gart_fini(rdev);
Alex Deucher16cdf042011-10-28 10:30:02 -04002268 r600_vram_scratch_fini(rdev);
Alex Deucher755d8192011-03-02 20:07:34 -05002269 radeon_gem_fini(rdev);
2270 radeon_fence_driver_fini(rdev);
2271 radeon_bo_fini(rdev);
2272 radeon_atombios_fini(rdev);
2273 kfree(rdev->bios);
2274 rdev->bios = NULL;
2275}
2276
Jerome Glisse721604a2012-01-05 22:11:05 -05002277/*
2278 * vm
2279 */
2280int cayman_vm_init(struct radeon_device *rdev)
2281{
2282 /* number of VMs */
2283 rdev->vm_manager.nvm = 8;
2284 /* base offset of vram pages */
Alex Deuchere71270f2012-03-20 17:18:38 -04002285 if (rdev->flags & RADEON_IS_IGP) {
2286 u64 tmp = RREG32(FUS_MC_VM_FB_OFFSET);
2287 tmp <<= 22;
2288 rdev->vm_manager.vram_base_offset = tmp;
2289 } else
2290 rdev->vm_manager.vram_base_offset = 0;
Jerome Glisse721604a2012-01-05 22:11:05 -05002291 return 0;
2292}
2293
2294void cayman_vm_fini(struct radeon_device *rdev)
2295{
2296}
2297
Christian Königdce34bf2012-09-17 19:36:18 +02002298#define R600_ENTRY_VALID (1 << 0)
Jerome Glisse721604a2012-01-05 22:11:05 -05002299#define R600_PTE_SYSTEM (1 << 1)
2300#define R600_PTE_SNOOPED (1 << 2)
2301#define R600_PTE_READABLE (1 << 5)
2302#define R600_PTE_WRITEABLE (1 << 6)
2303
Christian König089a7862012-08-11 11:54:05 +02002304uint32_t cayman_vm_page_flags(struct radeon_device *rdev, uint32_t flags)
Jerome Glisse721604a2012-01-05 22:11:05 -05002305{
2306 uint32_t r600_flags = 0;
Christian Königdce34bf2012-09-17 19:36:18 +02002307 r600_flags |= (flags & RADEON_VM_PAGE_VALID) ? R600_ENTRY_VALID : 0;
Jerome Glisse721604a2012-01-05 22:11:05 -05002308 r600_flags |= (flags & RADEON_VM_PAGE_READABLE) ? R600_PTE_READABLE : 0;
2309 r600_flags |= (flags & RADEON_VM_PAGE_WRITEABLE) ? R600_PTE_WRITEABLE : 0;
2310 if (flags & RADEON_VM_PAGE_SYSTEM) {
2311 r600_flags |= R600_PTE_SYSTEM;
2312 r600_flags |= (flags & RADEON_VM_PAGE_SNOOPED) ? R600_PTE_SNOOPED : 0;
2313 }
2314 return r600_flags;
2315}
2316
Alex Deucher7a083292012-08-31 13:51:21 -04002317/**
2318 * cayman_vm_set_page - update the page tables using the CP
2319 *
2320 * @rdev: radeon_device pointer
Alex Deucher43f12142013-02-01 17:32:42 +01002321 * @ib: indirect buffer to fill with commands
Christian Königdce34bf2012-09-17 19:36:18 +02002322 * @pe: addr of the page entry
2323 * @addr: dst addr to write into pe
2324 * @count: number of page entries to update
2325 * @incr: increase next addr by incr bytes
2326 * @flags: access flags
Alex Deucher7a083292012-08-31 13:51:21 -04002327 *
Alex Deucher43f12142013-02-01 17:32:42 +01002328 * Update the page tables using the CP (cayman/TN).
Alex Deucher7a083292012-08-31 13:51:21 -04002329 */
Alex Deucher43f12142013-02-01 17:32:42 +01002330void cayman_vm_set_page(struct radeon_device *rdev,
2331 struct radeon_ib *ib,
2332 uint64_t pe,
Christian Königdce34bf2012-09-17 19:36:18 +02002333 uint64_t addr, unsigned count,
2334 uint32_t incr, uint32_t flags)
Jerome Glisse721604a2012-01-05 22:11:05 -05002335{
Christian Königdce34bf2012-09-17 19:36:18 +02002336 uint32_t r600_flags = cayman_vm_page_flags(rdev, flags);
Alex Deucher3b6b59b2012-10-22 12:19:01 -04002337 uint64_t value;
2338 unsigned ndw;
Jerome Glisse721604a2012-01-05 22:11:05 -05002339
Alex Deucher3b6b59b2012-10-22 12:19:01 -04002340 if (rdev->asic->vm.pt_ring_index == RADEON_RING_TYPE_GFX_INDEX) {
2341 while (count) {
2342 ndw = 1 + count * 2;
2343 if (ndw > 0x3FFF)
2344 ndw = 0x3FFF;
Christian König089a7862012-08-11 11:54:05 +02002345
Alex Deucher43f12142013-02-01 17:32:42 +01002346 ib->ptr[ib->length_dw++] = PACKET3(PACKET3_ME_WRITE, ndw);
2347 ib->ptr[ib->length_dw++] = pe;
2348 ib->ptr[ib->length_dw++] = upper_32_bits(pe) & 0xff;
Alex Deucher3b6b59b2012-10-22 12:19:01 -04002349 for (; ndw > 1; ndw -= 2, --count, pe += 8) {
2350 if (flags & RADEON_VM_PAGE_SYSTEM) {
2351 value = radeon_vm_map_gart(rdev, addr);
2352 value &= 0xFFFFFFFFFFFFF000ULL;
2353 } else if (flags & RADEON_VM_PAGE_VALID) {
2354 value = addr;
2355 } else {
2356 value = 0;
2357 }
Christian Königf9fdffa2012-10-22 17:42:36 +02002358 addr += incr;
Alex Deucher3b6b59b2012-10-22 12:19:01 -04002359 value |= r600_flags;
Alex Deucher43f12142013-02-01 17:32:42 +01002360 ib->ptr[ib->length_dw++] = value;
2361 ib->ptr[ib->length_dw++] = upper_32_bits(value);
Christian Königf9fdffa2012-10-22 17:42:36 +02002362 }
Alex Deucher3b6b59b2012-10-22 12:19:01 -04002363 }
2364 } else {
Alex Deucher2ab91ad2013-04-16 10:42:15 -04002365 if ((flags & RADEON_VM_PAGE_SYSTEM) ||
2366 (count == 1)) {
2367 while (count) {
2368 ndw = count * 2;
2369 if (ndw > 0xFFFFE)
2370 ndw = 0xFFFFE;
Christian Königf9fdffa2012-10-22 17:42:36 +02002371
Alex Deucher2ab91ad2013-04-16 10:42:15 -04002372 /* for non-physically contiguous pages (system) */
2373 ib->ptr[ib->length_dw++] = DMA_PACKET(DMA_PACKET_WRITE, 0, 0, ndw);
2374 ib->ptr[ib->length_dw++] = pe;
2375 ib->ptr[ib->length_dw++] = upper_32_bits(pe) & 0xff;
2376 for (; ndw > 0; ndw -= 2, --count, pe += 8) {
2377 if (flags & RADEON_VM_PAGE_SYSTEM) {
2378 value = radeon_vm_map_gart(rdev, addr);
2379 value &= 0xFFFFFFFFFFFFF000ULL;
2380 } else if (flags & RADEON_VM_PAGE_VALID) {
2381 value = addr;
2382 } else {
2383 value = 0;
2384 }
2385 addr += incr;
2386 value |= r600_flags;
2387 ib->ptr[ib->length_dw++] = value;
2388 ib->ptr[ib->length_dw++] = upper_32_bits(value);
Alex Deucher3b6b59b2012-10-22 12:19:01 -04002389 }
Alex Deucher2ab91ad2013-04-16 10:42:15 -04002390 }
2391 while (ib->length_dw & 0x7)
2392 ib->ptr[ib->length_dw++] = DMA_PACKET(DMA_PACKET_NOP, 0, 0, 0);
2393 } else {
2394 while (count) {
2395 ndw = count * 2;
2396 if (ndw > 0xFFFFE)
2397 ndw = 0xFFFFE;
2398
2399 if (flags & RADEON_VM_PAGE_VALID)
2400 value = addr;
2401 else
2402 value = 0;
2403 /* for physically contiguous pages (vram) */
2404 ib->ptr[ib->length_dw++] = DMA_PTE_PDE_PACKET(ndw);
2405 ib->ptr[ib->length_dw++] = pe; /* dst addr */
2406 ib->ptr[ib->length_dw++] = upper_32_bits(pe) & 0xff;
2407 ib->ptr[ib->length_dw++] = r600_flags; /* mask */
2408 ib->ptr[ib->length_dw++] = 0;
2409 ib->ptr[ib->length_dw++] = value; /* value */
Alex Deucher43f12142013-02-01 17:32:42 +01002410 ib->ptr[ib->length_dw++] = upper_32_bits(value);
Alex Deucher2ab91ad2013-04-16 10:42:15 -04002411 ib->ptr[ib->length_dw++] = incr; /* increment size */
2412 ib->ptr[ib->length_dw++] = 0;
2413 pe += ndw * 4;
2414 addr += (ndw / 2) * incr;
2415 count -= ndw / 2;
Alex Deucher3b6b59b2012-10-22 12:19:01 -04002416 }
Christian König2a6f1ab2012-08-11 15:00:30 +02002417 }
Alex Deucher43f12142013-02-01 17:32:42 +01002418 while (ib->length_dw & 0x7)
2419 ib->ptr[ib->length_dw++] = DMA_PACKET(DMA_PACKET_NOP, 0, 0, 0);
Christian König2a6f1ab2012-08-11 15:00:30 +02002420 }
Jerome Glisse721604a2012-01-05 22:11:05 -05002421}
Christian König9b40e5d2012-08-08 12:22:43 +02002422
Alex Deucher7a083292012-08-31 13:51:21 -04002423/**
2424 * cayman_vm_flush - vm flush using the CP
2425 *
2426 * @rdev: radeon_device pointer
2427 *
2428 * Update the page table base and flush the VM TLB
2429 * using the CP (cayman-si).
2430 */
Alex Deucher498522b2012-10-02 14:43:38 -04002431void cayman_vm_flush(struct radeon_device *rdev, int ridx, struct radeon_vm *vm)
Christian König9b40e5d2012-08-08 12:22:43 +02002432{
Alex Deucher498522b2012-10-02 14:43:38 -04002433 struct radeon_ring *ring = &rdev->ring[ridx];
Christian König9b40e5d2012-08-08 12:22:43 +02002434
Christian Königee60e292012-08-09 16:21:08 +02002435 if (vm == NULL)
Christian König9b40e5d2012-08-08 12:22:43 +02002436 return;
2437
Christian Königee60e292012-08-09 16:21:08 +02002438 radeon_ring_write(ring, PACKET0(VM_CONTEXT0_PAGE_TABLE_BASE_ADDR + (vm->id << 2), 0));
Dmitry Cherkasovfa87e622012-09-17 19:36:19 +02002439 radeon_ring_write(ring, vm->pd_gpu_addr >> 12);
Christian Königee60e292012-08-09 16:21:08 +02002440
Christian König9b40e5d2012-08-08 12:22:43 +02002441 /* flush hdp cache */
2442 radeon_ring_write(ring, PACKET0(HDP_MEM_COHERENCY_FLUSH_CNTL, 0));
2443 radeon_ring_write(ring, 0x1);
2444
2445 /* bits 0-7 are the VM contexts0-7 */
2446 radeon_ring_write(ring, PACKET0(VM_INVALIDATE_REQUEST, 0));
Alex Deucher498522b2012-10-02 14:43:38 -04002447 radeon_ring_write(ring, 1 << vm->id);
Christian König58f8cf52012-10-22 17:42:35 +02002448
2449 /* sync PFP to ME, otherwise we might get invalid PFP reads */
2450 radeon_ring_write(ring, PACKET3(PACKET3_PFP_SYNC_ME, 0));
2451 radeon_ring_write(ring, 0x0);
Alex Deucher0af62b02011-01-06 21:19:31 -05002452}
Alex Deucherf60cbd12012-12-04 15:27:33 -05002453
2454void cayman_dma_vm_flush(struct radeon_device *rdev, int ridx, struct radeon_vm *vm)
2455{
2456 struct radeon_ring *ring = &rdev->ring[ridx];
2457
2458 if (vm == NULL)
2459 return;
2460
2461 radeon_ring_write(ring, DMA_PACKET(DMA_PACKET_SRBM_WRITE, 0, 0, 0));
2462 radeon_ring_write(ring, (0xf << 16) | ((VM_CONTEXT0_PAGE_TABLE_BASE_ADDR + (vm->id << 2)) >> 2));
2463 radeon_ring_write(ring, vm->pd_gpu_addr >> 12);
2464
2465 /* flush hdp cache */
2466 radeon_ring_write(ring, DMA_PACKET(DMA_PACKET_SRBM_WRITE, 0, 0, 0));
2467 radeon_ring_write(ring, (0xf << 16) | (HDP_MEM_COHERENCY_FLUSH_CNTL >> 2));
2468 radeon_ring_write(ring, 1);
2469
2470 /* bits 0-7 are the VM contexts0-7 */
2471 radeon_ring_write(ring, DMA_PACKET(DMA_PACKET_SRBM_WRITE, 0, 0, 0));
2472 radeon_ring_write(ring, (0xf << 16) | (VM_INVALIDATE_REQUEST >> 2));
2473 radeon_ring_write(ring, 1 << vm->id);
2474}
2475