/*
 * Copyright 2008 Advanced Micro Devices, Inc.
 * Copyright 2008 Red Hat Inc.
 * Copyright 2009 Jerome Glisse.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: Dave Airlie
 */
#include <linux/slab.h>
#include <linux/seq_file.h>
#include <linux/firmware.h>
#include <linux/platform_device.h>
#include <linux/module.h>
#include "drmP.h"
#include "radeon_drm.h"
#include "radeon.h"
#include "radeon_asic.h"
#include "radeon_mode.h"
#include "r600d.h"
#include "atom.h"
#include "avivod.h"
#define PFP_UCODE_SIZE 576
#define PM4_UCODE_SIZE 1792
#define RLC_UCODE_SIZE 768
#define R700_PFP_UCODE_SIZE 848
#define R700_PM4_UCODE_SIZE 1360
#define R700_RLC_UCODE_SIZE 1024
#define EVERGREEN_PFP_UCODE_SIZE 1120
#define EVERGREEN_PM4_UCODE_SIZE 1376
#define EVERGREEN_RLC_UCODE_SIZE 768
#define CAYMAN_RLC_UCODE_SIZE 1024
54 MODULE_FIRMWARE("radeon/R600_pfp.bin");
55 MODULE_FIRMWARE("radeon/R600_me.bin");
56 MODULE_FIRMWARE("radeon/RV610_pfp.bin");
57 MODULE_FIRMWARE("radeon/RV610_me.bin");
58 MODULE_FIRMWARE("radeon/RV630_pfp.bin");
59 MODULE_FIRMWARE("radeon/RV630_me.bin");
60 MODULE_FIRMWARE("radeon/RV620_pfp.bin");
61 MODULE_FIRMWARE("radeon/RV620_me.bin");
62 MODULE_FIRMWARE("radeon/RV635_pfp.bin");
63 MODULE_FIRMWARE("radeon/RV635_me.bin");
64 MODULE_FIRMWARE("radeon/RV670_pfp.bin");
65 MODULE_FIRMWARE("radeon/RV670_me.bin");
66 MODULE_FIRMWARE("radeon/RS780_pfp.bin");
67 MODULE_FIRMWARE("radeon/RS780_me.bin");
68 MODULE_FIRMWARE("radeon/RV770_pfp.bin");
69 MODULE_FIRMWARE("radeon/RV770_me.bin");
70 MODULE_FIRMWARE("radeon/RV730_pfp.bin");
71 MODULE_FIRMWARE("radeon/RV730_me.bin");
72 MODULE_FIRMWARE("radeon/RV710_pfp.bin");
73 MODULE_FIRMWARE("radeon/RV710_me.bin");
74 MODULE_FIRMWARE("radeon/R600_rlc.bin");
75 MODULE_FIRMWARE("radeon/R700_rlc.bin");
76 MODULE_FIRMWARE("radeon/CEDAR_pfp.bin");
77 MODULE_FIRMWARE("radeon/CEDAR_me.bin");
78 MODULE_FIRMWARE("radeon/CEDAR_rlc.bin");
79 MODULE_FIRMWARE("radeon/REDWOOD_pfp.bin");
80 MODULE_FIRMWARE("radeon/REDWOOD_me.bin");
81 MODULE_FIRMWARE("radeon/REDWOOD_rlc.bin");
82 MODULE_FIRMWARE("radeon/JUNIPER_pfp.bin");
83 MODULE_FIRMWARE("radeon/JUNIPER_me.bin");
84 MODULE_FIRMWARE("radeon/JUNIPER_rlc.bin");
85 MODULE_FIRMWARE("radeon/CYPRESS_pfp.bin");
86 MODULE_FIRMWARE("radeon/CYPRESS_me.bin");
87 MODULE_FIRMWARE("radeon/CYPRESS_rlc.bin");
88 MODULE_FIRMWARE("radeon/PALM_pfp.bin");
89 MODULE_FIRMWARE("radeon/PALM_me.bin");
90 MODULE_FIRMWARE("radeon/SUMO_rlc.bin");
91 MODULE_FIRMWARE("radeon/SUMO_pfp.bin");
92 MODULE_FIRMWARE("radeon/SUMO_me.bin");
93 MODULE_FIRMWARE("radeon/SUMO2_pfp.bin");
94 MODULE_FIRMWARE("radeon/SUMO2_me.bin");
int r600_debugfs_mc_info_init(struct radeon_device *rdev);

/* r600,rv610,rv630,rv620,rv635,rv670 */
int r600_mc_wait_for_idle(struct radeon_device *rdev);
void r600_gpu_init(struct radeon_device *rdev);
void r600_fini(struct radeon_device *rdev);
void r600_irq_disable(struct radeon_device *rdev);
static void r600_pcie_gen2_enable(struct radeon_device *rdev);
/* get temperature in millidegrees */
int rv6xx_get_temp(struct radeon_device *rdev)
{
	u32 temp = (RREG32(CG_THERMAL_STATUS) & ASIC_T_MASK) >>
		ASIC_T_SHIFT;
	int actual_temp = temp & 0xff;

	if (temp & 0x100)
		actual_temp -= 256;

	return actual_temp * 1000;
}
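
/*
 * Pick the power state and clock mode that the planned dynpm action
 * (minimum, downclock, upclock, default) should switch to.  IGPs and the
 * original R600 step between whole power states; all other asics keep a
 * power state and step through its clock modes instead.
 */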
void r600_pm_get_dynpm_state(struct radeon_device *rdev)
{
	int i;

	rdev->pm.dynpm_can_upclock = true;
	rdev->pm.dynpm_can_downclock = true;

	/* power state array is low to high, default is first */
	if ((rdev->flags & RADEON_IS_IGP) || (rdev->family == CHIP_R600)) {
		int min_power_state_index = 0;

		if (rdev->pm.num_power_states > 2)
			min_power_state_index = 1;

		switch (rdev->pm.dynpm_planned_action) {
		case DYNPM_ACTION_MINIMUM:
			rdev->pm.requested_power_state_index = min_power_state_index;
			rdev->pm.requested_clock_mode_index = 0;
			rdev->pm.dynpm_can_downclock = false;
			break;
		case DYNPM_ACTION_DOWNCLOCK:
			if (rdev->pm.current_power_state_index == min_power_state_index) {
				rdev->pm.requested_power_state_index = rdev->pm.current_power_state_index;
				rdev->pm.dynpm_can_downclock = false;
			} else {
				if (rdev->pm.active_crtc_count > 1) {
					for (i = 0; i < rdev->pm.num_power_states; i++) {
						if (rdev->pm.power_state[i].flags & RADEON_PM_STATE_SINGLE_DISPLAY_ONLY)
							continue;
						else if (i >= rdev->pm.current_power_state_index) {
							rdev->pm.requested_power_state_index =
								rdev->pm.current_power_state_index;
							break;
						} else {
							rdev->pm.requested_power_state_index = i;
							break;
						}
					}
				} else {
					if (rdev->pm.current_power_state_index == 0)
						rdev->pm.requested_power_state_index =
							rdev->pm.num_power_states - 1;
					else
						rdev->pm.requested_power_state_index =
							rdev->pm.current_power_state_index - 1;
				}
			}
			rdev->pm.requested_clock_mode_index = 0;
			/* don't use the power state if crtcs are active and no display flag is set */
			if ((rdev->pm.active_crtc_count > 0) &&
			    (rdev->pm.power_state[rdev->pm.requested_power_state_index].
			     clock_info[rdev->pm.requested_clock_mode_index].flags &
			     RADEON_PM_MODE_NO_DISPLAY)) {
				rdev->pm.requested_power_state_index++;
			}
			break;
		case DYNPM_ACTION_UPCLOCK:
			if (rdev->pm.current_power_state_index == (rdev->pm.num_power_states - 1)) {
				rdev->pm.requested_power_state_index = rdev->pm.current_power_state_index;
				rdev->pm.dynpm_can_upclock = false;
			} else {
				if (rdev->pm.active_crtc_count > 1) {
					for (i = (rdev->pm.num_power_states - 1); i >= 0; i--) {
						if (rdev->pm.power_state[i].flags & RADEON_PM_STATE_SINGLE_DISPLAY_ONLY)
							continue;
						else if (i <= rdev->pm.current_power_state_index) {
							rdev->pm.requested_power_state_index =
								rdev->pm.current_power_state_index;
							break;
						} else {
							rdev->pm.requested_power_state_index = i;
							break;
						}
					}
				} else
					rdev->pm.requested_power_state_index =
						rdev->pm.current_power_state_index + 1;
			}
			rdev->pm.requested_clock_mode_index = 0;
			break;
		case DYNPM_ACTION_DEFAULT:
			rdev->pm.requested_power_state_index = rdev->pm.default_power_state_index;
			rdev->pm.requested_clock_mode_index = 0;
			rdev->pm.dynpm_can_upclock = false;
			break;
		case DYNPM_ACTION_NONE:
		default:
			DRM_ERROR("Requested mode for not defined action\n");
			return;
		}
	} else {
		/* XXX select a power state based on AC/DC, single/dualhead, etc. */
		/* for now just select the first power state and switch between clock modes */
		/* power state array is low to high, default is first (0) */
		if (rdev->pm.active_crtc_count > 1) {
			rdev->pm.requested_power_state_index = -1;
			/* start at 1 as we don't want the default mode */
			for (i = 1; i < rdev->pm.num_power_states; i++) {
				if (rdev->pm.power_state[i].flags & RADEON_PM_STATE_SINGLE_DISPLAY_ONLY)
					continue;
				else if ((rdev->pm.power_state[i].type == POWER_STATE_TYPE_PERFORMANCE) ||
					 (rdev->pm.power_state[i].type == POWER_STATE_TYPE_BATTERY)) {
					rdev->pm.requested_power_state_index = i;
					break;
				}
			}
			/* if nothing selected, grab the default state. */
			if (rdev->pm.requested_power_state_index == -1)
				rdev->pm.requested_power_state_index = 0;
		} else
			rdev->pm.requested_power_state_index = 1;

		switch (rdev->pm.dynpm_planned_action) {
		case DYNPM_ACTION_MINIMUM:
			rdev->pm.requested_clock_mode_index = 0;
			rdev->pm.dynpm_can_downclock = false;
			break;
		case DYNPM_ACTION_DOWNCLOCK:
			if (rdev->pm.requested_power_state_index == rdev->pm.current_power_state_index) {
				if (rdev->pm.current_clock_mode_index == 0) {
					rdev->pm.requested_clock_mode_index = 0;
					rdev->pm.dynpm_can_downclock = false;
				} else
					rdev->pm.requested_clock_mode_index =
						rdev->pm.current_clock_mode_index - 1;
			} else {
				rdev->pm.requested_clock_mode_index = 0;
				rdev->pm.dynpm_can_downclock = false;
			}
			/* don't use the power state if crtcs are active and no display flag is set */
			if ((rdev->pm.active_crtc_count > 0) &&
			    (rdev->pm.power_state[rdev->pm.requested_power_state_index].
			     clock_info[rdev->pm.requested_clock_mode_index].flags &
			     RADEON_PM_MODE_NO_DISPLAY)) {
				rdev->pm.requested_clock_mode_index++;
			}
			break;
		case DYNPM_ACTION_UPCLOCK:
			if (rdev->pm.requested_power_state_index == rdev->pm.current_power_state_index) {
				if (rdev->pm.current_clock_mode_index ==
				    (rdev->pm.power_state[rdev->pm.requested_power_state_index].num_clock_modes - 1)) {
					rdev->pm.requested_clock_mode_index = rdev->pm.current_clock_mode_index;
					rdev->pm.dynpm_can_upclock = false;
				} else
					rdev->pm.requested_clock_mode_index =
						rdev->pm.current_clock_mode_index + 1;
			} else {
				rdev->pm.requested_clock_mode_index =
					rdev->pm.power_state[rdev->pm.requested_power_state_index].num_clock_modes - 1;
				rdev->pm.dynpm_can_upclock = false;
			}
			break;
		case DYNPM_ACTION_DEFAULT:
			rdev->pm.requested_power_state_index = rdev->pm.default_power_state_index;
			rdev->pm.requested_clock_mode_index = 0;
			rdev->pm.dynpm_can_upclock = false;
			break;
		case DYNPM_ACTION_NONE:
		default:
			DRM_ERROR("Requested mode for not defined action\n");
			return;
		}
	}

	DRM_DEBUG_DRIVER("Requested: e: %d m: %d p: %d\n",
			 rdev->pm.power_state[rdev->pm.requested_power_state_index].
			 clock_info[rdev->pm.requested_clock_mode_index].sclk,
			 rdev->pm.power_state[rdev->pm.requested_power_state_index].
			 clock_info[rdev->pm.requested_clock_mode_index].mclk,
			 rdev->pm.power_state[rdev->pm.requested_power_state_index].
			 pcie_lanes);
}
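
/*
 * Return the index of the @instance'th power state of type @ps_type,
 * falling back to the default power state when no match exists.
 */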
static int r600_pm_get_type_index(struct radeon_device *rdev,
				  enum radeon_pm_state_type ps_type,
				  int instance)
{
	int i;
	int found_instance = -1;

	for (i = 0; i < rdev->pm.num_power_states; i++) {
		if (rdev->pm.power_state[i].type == ps_type) {
			found_instance++;
			if (found_instance == instance)
				return i;
		}
	}
	/* return default if no match */
	return rdev->pm.default_power_state_index;
}
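
/*
 * Fill in the profile table for RS780/RS880 class IGPs.  The mapping
 * depends on how many power states the bios tables expose (2, 3 or more).
 */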
void rs780_pm_init_profile(struct radeon_device *rdev)
{
	if (rdev->pm.num_power_states == 2) {
		/* default */
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_cm_idx = 0;
		/* low sh */
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_ps_idx = 0;
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_ps_idx = 0;
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_cm_idx = 0;
		/* mid sh */
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_ps_idx = 0;
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_ps_idx = 0;
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_cm_idx = 0;
		/* high sh */
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_ps_idx = 0;
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_ps_idx = 1;
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_cm_idx = 0;
		/* low mh */
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_ps_idx = 0;
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_ps_idx = 0;
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_cm_idx = 0;
		/* mid mh */
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_ps_idx = 0;
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_ps_idx = 0;
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_cm_idx = 0;
		/* high mh */
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_ps_idx = 0;
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_ps_idx = 1;
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_cm_idx = 0;
	} else if (rdev->pm.num_power_states == 3) {
		/* default */
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_cm_idx = 0;
		/* low sh */
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_ps_idx = 1;
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_ps_idx = 1;
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_cm_idx = 0;
		/* mid sh */
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_ps_idx = 1;
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_ps_idx = 1;
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_cm_idx = 0;
		/* high sh */
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_ps_idx = 1;
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_ps_idx = 2;
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_cm_idx = 0;
		/* low mh */
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_ps_idx = 1;
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_ps_idx = 1;
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_cm_idx = 0;
		/* mid mh */
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_ps_idx = 1;
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_ps_idx = 1;
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_cm_idx = 0;
		/* high mh */
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_ps_idx = 1;
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_ps_idx = 2;
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_cm_idx = 0;
	} else {
		/* default */
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_cm_idx = 0;
		/* low sh */
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_ps_idx = 2;
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_ps_idx = 2;
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_cm_idx = 0;
		/* mid sh */
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_ps_idx = 2;
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_ps_idx = 2;
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_cm_idx = 0;
		/* high sh */
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_ps_idx = 2;
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_ps_idx = 3;
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_cm_idx = 0;
		/* low mh */
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_ps_idx = 2;
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_ps_idx = 0;
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_cm_idx = 0;
		/* mid mh */
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_ps_idx = 2;
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_ps_idx = 0;
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_cm_idx = 0;
		/* high mh */
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_ps_idx = 2;
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_ps_idx = 3;
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_cm_idx = 0;
	}
}
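
/*
 * Fill in the profile table for r6xx discrete parts.  CHIP_R600 only
 * ever uses the default state; other asics pick battery states on
 * mobility parts and performance states otherwise, plus a clock mode
 * per profile.
 */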
void r600_pm_init_profile(struct radeon_device *rdev)
{
	if (rdev->family == CHIP_R600) {
		/* XXX */
		/* default */
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_cm_idx = 0;
		/* low sh */
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_cm_idx = 0;
		/* mid sh */
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_cm_idx = 0;
		/* high sh */
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_cm_idx = 0;
		/* low mh */
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_cm_idx = 0;
		/* mid mh */
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_cm_idx = 0;
		/* high mh */
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_ps_idx = rdev->pm.default_power_state_index;
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_cm_idx = 0;
		rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_cm_idx = 0;
	} else {
		if (rdev->pm.num_power_states < 4) {
			/* default */
			rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_ps_idx = rdev->pm.default_power_state_index;
			rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_ps_idx = rdev->pm.default_power_state_index;
			rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_cm_idx = 0;
			rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_cm_idx = 2;
			/* low sh */
			rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_ps_idx = 1;
			rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_ps_idx = 1;
			rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_cm_idx = 0;
			rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_cm_idx = 0;
			/* mid sh */
			rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_ps_idx = 1;
			rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_ps_idx = 1;
			rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_cm_idx = 0;
			rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_cm_idx = 1;
			/* high sh */
			rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_ps_idx = 1;
			rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_ps_idx = 1;
			rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_cm_idx = 0;
			rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_cm_idx = 2;
			/* low mh */
			rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_ps_idx = 2;
			rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_ps_idx = 2;
			rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_cm_idx = 0;
			rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_cm_idx = 0;
			/* mid mh */
			rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_ps_idx = 2;
			rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_ps_idx = 2;
			rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_cm_idx = 0;
			rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_cm_idx = 1;
			/* high mh */
			rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_ps_idx = 2;
			rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_ps_idx = 2;
			rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_cm_idx = 0;
			rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_cm_idx = 2;
		} else {
			/* default */
			rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_ps_idx = rdev->pm.default_power_state_index;
			rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_ps_idx = rdev->pm.default_power_state_index;
			rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_off_cm_idx = 0;
			rdev->pm.profiles[PM_PROFILE_DEFAULT_IDX].dpms_on_cm_idx = 2;
			/* low sh */
			if (rdev->flags & RADEON_IS_MOBILITY) {
				rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_BATTERY, 0);
				rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_BATTERY, 0);
				rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_cm_idx = 0;
				rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_cm_idx = 0;
			} else {
				rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 0);
				rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 0);
				rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_off_cm_idx = 0;
				rdev->pm.profiles[PM_PROFILE_LOW_SH_IDX].dpms_on_cm_idx = 0;
			}
			/* mid sh */
			if (rdev->flags & RADEON_IS_MOBILITY) {
				rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_BATTERY, 0);
				rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_BATTERY, 0);
				rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_cm_idx = 0;
				rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_cm_idx = 1;
			} else {
				rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 0);
				rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 0);
				rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_off_cm_idx = 0;
				rdev->pm.profiles[PM_PROFILE_MID_SH_IDX].dpms_on_cm_idx = 1;
			}
			/* high sh */
			rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_ps_idx =
				r600_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 0);
			rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_ps_idx =
				r600_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 0);
			rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_off_cm_idx = 0;
			rdev->pm.profiles[PM_PROFILE_HIGH_SH_IDX].dpms_on_cm_idx = 2;
			/* low mh */
			if (rdev->flags & RADEON_IS_MOBILITY) {
				rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_BATTERY, 1);
				rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_BATTERY, 1);
				rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_cm_idx = 0;
				rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_cm_idx = 0;
			} else {
				rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 1);
				rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 1);
				rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_off_cm_idx = 0;
				rdev->pm.profiles[PM_PROFILE_LOW_MH_IDX].dpms_on_cm_idx = 0;
			}
			/* mid mh */
			if (rdev->flags & RADEON_IS_MOBILITY) {
				rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_BATTERY, 1);
				rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_BATTERY, 1);
				rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_cm_idx = 0;
				rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_cm_idx = 1;
			} else {
				rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 1);
				rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_ps_idx =
					r600_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 1);
				rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_off_cm_idx = 0;
				rdev->pm.profiles[PM_PROFILE_MID_MH_IDX].dpms_on_cm_idx = 1;
			}
			/* high mh */
			rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_ps_idx =
				r600_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 1);
			rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_ps_idx =
				r600_pm_get_type_index(rdev, POWER_STATE_TYPE_PERFORMANCE, 1);
			rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_off_cm_idx = 0;
			rdev->pm.profiles[PM_PROFILE_HIGH_MH_IDX].dpms_on_cm_idx = 2;
		}
	}
}
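
/*
 * Apply the non-clock side effects of a pending power state change; on
 * these asics that is programming the requested VDDC voltage through
 * the atombios tables.
 */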
void r600_pm_misc(struct radeon_device *rdev)
{
	int req_ps_idx = rdev->pm.requested_power_state_index;
	int req_cm_idx = rdev->pm.requested_clock_mode_index;
	struct radeon_power_state *ps = &rdev->pm.power_state[req_ps_idx];
	struct radeon_voltage *voltage = &ps->clock_info[req_cm_idx].voltage;

	if ((voltage->type == VOLTAGE_SW) && voltage->voltage) {
		/* 0xff01 is a flag rather than an actual voltage */
		if (voltage->voltage == 0xff01)
			return;
		if (voltage->voltage != rdev->pm.current_vddc) {
			radeon_atom_set_voltage(rdev, voltage->voltage, SET_VOLTAGE_TYPE_ASIC_VDDC);
			rdev->pm.current_vddc = voltage->voltage;
			DRM_DEBUG_DRIVER("Setting: v: %d\n", voltage->voltage);
		}
	}
}
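
/* report whether the graphics block has gone idle */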
bool r600_gui_idle(struct radeon_device *rdev)
{
	if (RREG32(GRBM_STATUS) & GUI_ACTIVE)
		return false;
	else
		return true;
}
/* hpd for digital panel detect/disconnect */
bool r600_hpd_sense(struct radeon_device *rdev, enum radeon_hpd_id hpd)
{
	bool connected = false;

	if (ASIC_IS_DCE3(rdev)) {
		switch (hpd) {
		case RADEON_HPD_1:
			if (RREG32(DC_HPD1_INT_STATUS) & DC_HPDx_SENSE)
				connected = true;
			break;
		case RADEON_HPD_2:
			if (RREG32(DC_HPD2_INT_STATUS) & DC_HPDx_SENSE)
				connected = true;
			break;
		case RADEON_HPD_3:
			if (RREG32(DC_HPD3_INT_STATUS) & DC_HPDx_SENSE)
				connected = true;
			break;
		case RADEON_HPD_4:
			if (RREG32(DC_HPD4_INT_STATUS) & DC_HPDx_SENSE)
				connected = true;
			break;
			/* DCE 3.2 */
		case RADEON_HPD_5:
			if (RREG32(DC_HPD5_INT_STATUS) & DC_HPDx_SENSE)
				connected = true;
			break;
		case RADEON_HPD_6:
			if (RREG32(DC_HPD6_INT_STATUS) & DC_HPDx_SENSE)
				connected = true;
			break;
		default:
			break;
		}
	} else {
		switch (hpd) {
		case RADEON_HPD_1:
			if (RREG32(DC_HOT_PLUG_DETECT1_INT_STATUS) & DC_HOT_PLUG_DETECTx_SENSE)
				connected = true;
			break;
		case RADEON_HPD_2:
			if (RREG32(DC_HOT_PLUG_DETECT2_INT_STATUS) & DC_HOT_PLUG_DETECTx_SENSE)
				connected = true;
			break;
		case RADEON_HPD_3:
			if (RREG32(DC_HOT_PLUG_DETECT3_INT_STATUS) & DC_HOT_PLUG_DETECTx_SENSE)
				connected = true;
			break;
		default:
			break;
		}
	}
	return connected;
}
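
/*
 * Program the HPD interrupt polarity so that the next interrupt fires
 * on the opposite transition of the current connection state.
 */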
void r600_hpd_set_polarity(struct radeon_device *rdev,
			   enum radeon_hpd_id hpd)
{
	u32 tmp;
	bool connected = r600_hpd_sense(rdev, hpd);

	if (ASIC_IS_DCE3(rdev)) {
		switch (hpd) {
		case RADEON_HPD_1:
			tmp = RREG32(DC_HPD1_INT_CONTROL);
			if (connected)
				tmp &= ~DC_HPDx_INT_POLARITY;
			else
				tmp |= DC_HPDx_INT_POLARITY;
			WREG32(DC_HPD1_INT_CONTROL, tmp);
			break;
		case RADEON_HPD_2:
			tmp = RREG32(DC_HPD2_INT_CONTROL);
			if (connected)
				tmp &= ~DC_HPDx_INT_POLARITY;
			else
				tmp |= DC_HPDx_INT_POLARITY;
			WREG32(DC_HPD2_INT_CONTROL, tmp);
			break;
		case RADEON_HPD_3:
			tmp = RREG32(DC_HPD3_INT_CONTROL);
			if (connected)
				tmp &= ~DC_HPDx_INT_POLARITY;
			else
				tmp |= DC_HPDx_INT_POLARITY;
			WREG32(DC_HPD3_INT_CONTROL, tmp);
			break;
		case RADEON_HPD_4:
			tmp = RREG32(DC_HPD4_INT_CONTROL);
			if (connected)
				tmp &= ~DC_HPDx_INT_POLARITY;
			else
				tmp |= DC_HPDx_INT_POLARITY;
			WREG32(DC_HPD4_INT_CONTROL, tmp);
			break;
		case RADEON_HPD_5:
			tmp = RREG32(DC_HPD5_INT_CONTROL);
			if (connected)
				tmp &= ~DC_HPDx_INT_POLARITY;
			else
				tmp |= DC_HPDx_INT_POLARITY;
			WREG32(DC_HPD5_INT_CONTROL, tmp);
			break;
			/* DCE 3.2 */
		case RADEON_HPD_6:
			tmp = RREG32(DC_HPD6_INT_CONTROL);
			if (connected)
				tmp &= ~DC_HPDx_INT_POLARITY;
			else
				tmp |= DC_HPDx_INT_POLARITY;
			WREG32(DC_HPD6_INT_CONTROL, tmp);
			break;
		default:
			break;
		}
	} else {
		switch (hpd) {
		case RADEON_HPD_1:
			tmp = RREG32(DC_HOT_PLUG_DETECT1_INT_CONTROL);
			if (connected)
				tmp &= ~DC_HOT_PLUG_DETECTx_INT_POLARITY;
			else
				tmp |= DC_HOT_PLUG_DETECTx_INT_POLARITY;
			WREG32(DC_HOT_PLUG_DETECT1_INT_CONTROL, tmp);
			break;
		case RADEON_HPD_2:
			tmp = RREG32(DC_HOT_PLUG_DETECT2_INT_CONTROL);
			if (connected)
				tmp &= ~DC_HOT_PLUG_DETECTx_INT_POLARITY;
			else
				tmp |= DC_HOT_PLUG_DETECTx_INT_POLARITY;
			WREG32(DC_HOT_PLUG_DETECT2_INT_CONTROL, tmp);
			break;
		case RADEON_HPD_3:
			tmp = RREG32(DC_HOT_PLUG_DETECT3_INT_CONTROL);
			if (connected)
				tmp &= ~DC_HOT_PLUG_DETECTx_INT_POLARITY;
			else
				tmp |= DC_HOT_PLUG_DETECTx_INT_POLARITY;
			WREG32(DC_HOT_PLUG_DETECT3_INT_CONTROL, tmp);
			break;
		default:
			break;
		}
	}
}
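
/*
 * Enable the HPD pins used by this board's connectors and flag the
 * matching interrupt sources; DCE3 parts use the DC_HPDn blocks, older
 * parts the DC_HOT_PLUG_DETECTn blocks.
 */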
void r600_hpd_init(struct radeon_device *rdev)
{
	struct drm_device *dev = rdev->ddev;
	struct drm_connector *connector;

	if (ASIC_IS_DCE3(rdev)) {
		u32 tmp = DC_HPDx_CONNECTION_TIMER(0x9c4) | DC_HPDx_RX_INT_TIMER(0xfa);
		if (ASIC_IS_DCE32(rdev))
			tmp |= DC_HPDx_EN;

		list_for_each_entry(connector, &dev->mode_config.connector_list, head) {
			struct radeon_connector *radeon_connector = to_radeon_connector(connector);
			switch (radeon_connector->hpd.hpd) {
			case RADEON_HPD_1:
				WREG32(DC_HPD1_CONTROL, tmp);
				rdev->irq.hpd[0] = true;
				break;
			case RADEON_HPD_2:
				WREG32(DC_HPD2_CONTROL, tmp);
				rdev->irq.hpd[1] = true;
				break;
			case RADEON_HPD_3:
				WREG32(DC_HPD3_CONTROL, tmp);
				rdev->irq.hpd[2] = true;
				break;
			case RADEON_HPD_4:
				WREG32(DC_HPD4_CONTROL, tmp);
				rdev->irq.hpd[3] = true;
				break;
				/* DCE 3.2 */
			case RADEON_HPD_5:
				WREG32(DC_HPD5_CONTROL, tmp);
				rdev->irq.hpd[4] = true;
				break;
			case RADEON_HPD_6:
				WREG32(DC_HPD6_CONTROL, tmp);
				rdev->irq.hpd[5] = true;
				break;
			default:
				break;
			}
		}
	} else {
		list_for_each_entry(connector, &dev->mode_config.connector_list, head) {
			struct radeon_connector *radeon_connector = to_radeon_connector(connector);
			switch (radeon_connector->hpd.hpd) {
			case RADEON_HPD_1:
				WREG32(DC_HOT_PLUG_DETECT1_CONTROL, DC_HOT_PLUG_DETECTx_EN);
				rdev->irq.hpd[0] = true;
				break;
			case RADEON_HPD_2:
				WREG32(DC_HOT_PLUG_DETECT2_CONTROL, DC_HOT_PLUG_DETECTx_EN);
				rdev->irq.hpd[1] = true;
				break;
			case RADEON_HPD_3:
				WREG32(DC_HOT_PLUG_DETECT3_CONTROL, DC_HOT_PLUG_DETECTx_EN);
				rdev->irq.hpd[2] = true;
				break;
			default:
				break;
			}
		}
	}
	if (rdev->irq.installed)
		r600_irq_set(rdev);
}
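
/* disable the HPD pins and interrupt sources enabled in r600_hpd_init() */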
void r600_hpd_fini(struct radeon_device *rdev)
{
	struct drm_device *dev = rdev->ddev;
	struct drm_connector *connector;

	if (ASIC_IS_DCE3(rdev)) {
		list_for_each_entry(connector, &dev->mode_config.connector_list, head) {
			struct radeon_connector *radeon_connector = to_radeon_connector(connector);
			switch (radeon_connector->hpd.hpd) {
			case RADEON_HPD_1:
				WREG32(DC_HPD1_CONTROL, 0);
				rdev->irq.hpd[0] = false;
				break;
			case RADEON_HPD_2:
				WREG32(DC_HPD2_CONTROL, 0);
				rdev->irq.hpd[1] = false;
				break;
			case RADEON_HPD_3:
				WREG32(DC_HPD3_CONTROL, 0);
				rdev->irq.hpd[2] = false;
				break;
			case RADEON_HPD_4:
				WREG32(DC_HPD4_CONTROL, 0);
				rdev->irq.hpd[3] = false;
				break;
				/* DCE 3.2 */
			case RADEON_HPD_5:
				WREG32(DC_HPD5_CONTROL, 0);
				rdev->irq.hpd[4] = false;
				break;
			case RADEON_HPD_6:
				WREG32(DC_HPD6_CONTROL, 0);
				rdev->irq.hpd[5] = false;
				break;
			default:
				break;
			}
		}
	} else {
		list_for_each_entry(connector, &dev->mode_config.connector_list, head) {
			struct radeon_connector *radeon_connector = to_radeon_connector(connector);
			switch (radeon_connector->hpd.hpd) {
			case RADEON_HPD_1:
				WREG32(DC_HOT_PLUG_DETECT1_CONTROL, 0);
				rdev->irq.hpd[0] = false;
				break;
			case RADEON_HPD_2:
				WREG32(DC_HOT_PLUG_DETECT2_CONTROL, 0);
				rdev->irq.hpd[1] = false;
				break;
			case RADEON_HPD_3:
				WREG32(DC_HOT_PLUG_DETECT3_CONTROL, 0);
				rdev->irq.hpd[2] = false;
				break;
			default:
				break;
			}
		}
	}
}
void r600_pcie_gart_tlb_flush(struct radeon_device *rdev)
{
	unsigned i;
	u32 tmp;

	/* flush hdp cache so updates hit vram */
	if ((rdev->family >= CHIP_RV770) && (rdev->family <= CHIP_RV740) &&
	    !(rdev->flags & RADEON_IS_AGP)) {
		void __iomem *ptr = (void *)rdev->gart.table.vram.ptr;
		u32 tmp;

		/* r7xx hw bug.  write to HDP_DEBUG1 followed by fb read
		 * rather than write to HDP_REG_COHERENCY_FLUSH_CNTL.
		 * This seems to cause problems on some AGP cards. Just use the old
		 * method for them.
		 */
		WREG32(HDP_DEBUG1, 0);
		tmp = readl((void __iomem *)ptr);
	} else
		WREG32(R_005480_HDP_MEM_COHERENCY_FLUSH_CNTL, 0x1);

	WREG32(VM_CONTEXT0_INVALIDATION_LOW_ADDR, rdev->mc.gtt_start >> 12);
	WREG32(VM_CONTEXT0_INVALIDATION_HIGH_ADDR, (rdev->mc.gtt_end - 1) >> 12);
	WREG32(VM_CONTEXT0_REQUEST_RESPONSE, REQUEST_TYPE(1));
	for (i = 0; i < rdev->usec_timeout; i++) {
		/* read MC_STATUS */
		tmp = RREG32(VM_CONTEXT0_REQUEST_RESPONSE);
		tmp = (tmp & RESPONSE_TYPE_MASK) >> RESPONSE_TYPE_SHIFT;
		if (tmp == 2) {
			printk(KERN_WARNING "[drm] r600 flush TLB failed\n");
			return;
		}
		if (tmp) {
			return;
		}
		udelay(1);
	}
}
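
/* one-time GART setup: common gart structures plus the VRAM page table BO */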
int r600_pcie_gart_init(struct radeon_device *rdev)
{
	int r;

	if (rdev->gart.table.vram.robj) {
		WARN(1, "R600 PCIE GART already initialized\n");
		return 0;
	}
	/* Initialize common gart structure */
	r = radeon_gart_init(rdev);
	if (r)
		return r;
	rdev->gart.table_size = rdev->gart.num_gpu_pages * 8;
	return radeon_gart_table_vram_alloc(rdev);
}
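
/*
 * Pin the page table, program the L2 cache and L1 TLB registers, and
 * enable the system VM context covering the GTT aperture.
 */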
int r600_pcie_gart_enable(struct radeon_device *rdev)
{
	u32 tmp;
	int r, i;

	if (rdev->gart.table.vram.robj == NULL) {
		dev_err(rdev->dev, "No VRAM object for PCIE GART.\n");
		return -EINVAL;
	}
	r = radeon_gart_table_vram_pin(rdev);
	if (r)
		return r;
	radeon_gart_restore(rdev);

	/* Setup L2 cache */
	WREG32(VM_L2_CNTL, ENABLE_L2_CACHE | ENABLE_L2_FRAGMENT_PROCESSING |
				ENABLE_L2_PTE_CACHE_LRU_UPDATE_BY_WRITE |
				EFFECTIVE_L2_QUEUE_SIZE(7));
	WREG32(VM_L2_CNTL2, 0);
	WREG32(VM_L2_CNTL3, BANK_SELECT_0(0) | BANK_SELECT_1(1));
	/* Setup TLB control */
	tmp = ENABLE_L1_TLB | ENABLE_L1_FRAGMENT_PROCESSING |
		SYSTEM_ACCESS_MODE_NOT_IN_SYS |
		EFFECTIVE_L1_TLB_SIZE(5) | EFFECTIVE_L1_QUEUE_SIZE(5) |
		ENABLE_WAIT_L2_QUERY;
	WREG32(MC_VM_L1_TLB_MCB_RD_SYS_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_WR_SYS_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_RD_HDP_CNTL, tmp | ENABLE_L1_STRICT_ORDERING);
	WREG32(MC_VM_L1_TLB_MCB_WR_HDP_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCD_RD_A_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCD_WR_A_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCD_RD_B_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCD_WR_B_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_RD_GFX_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_WR_GFX_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_RD_PDMA_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_WR_PDMA_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_RD_SEM_CNTL, tmp | ENABLE_SEMAPHORE_MODE);
	WREG32(MC_VM_L1_TLB_MCB_WR_SEM_CNTL, tmp | ENABLE_SEMAPHORE_MODE);
	WREG32(VM_CONTEXT0_PAGE_TABLE_START_ADDR, rdev->mc.gtt_start >> 12);
	WREG32(VM_CONTEXT0_PAGE_TABLE_END_ADDR, rdev->mc.gtt_end >> 12);
	WREG32(VM_CONTEXT0_PAGE_TABLE_BASE_ADDR, rdev->gart.table_addr >> 12);
	WREG32(VM_CONTEXT0_CNTL, ENABLE_CONTEXT | PAGE_TABLE_DEPTH(0) |
				RANGE_PROTECTION_FAULT_ENABLE_DEFAULT);
	WREG32(VM_CONTEXT0_PROTECTION_FAULT_DEFAULT_ADDR,
			(u32)(rdev->dummy_page.addr >> 12));
	for (i = 1; i < 7; i++)
		WREG32(VM_CONTEXT0_CNTL + (i * 4), 0);

	r600_pcie_gart_tlb_flush(rdev);
	DRM_INFO("PCIE GART of %uM enabled (table at 0x%016llX).\n",
		 (unsigned)(rdev->mc.gtt_size >> 20),
		 (unsigned long long)rdev->gart.table_addr);
	rdev->gart.ready = true;
	return 0;
}
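
/* disable the VM contexts and the L2/L1 TLBs and unpin the page table BO */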
void r600_pcie_gart_disable(struct radeon_device *rdev)
{
	u32 tmp;
	int i, r;

	/* Disable all tables */
	for (i = 0; i < 7; i++)
		WREG32(VM_CONTEXT0_CNTL + (i * 4), 0);

	/* Disable L2 cache */
	WREG32(VM_L2_CNTL, ENABLE_L2_FRAGMENT_PROCESSING |
			   EFFECTIVE_L2_QUEUE_SIZE(7));
	WREG32(VM_L2_CNTL3, BANK_SELECT_0(0) | BANK_SELECT_1(1));
	/* Setup L1 TLB control */
	tmp = EFFECTIVE_L1_TLB_SIZE(5) | EFFECTIVE_L1_QUEUE_SIZE(5) |
		ENABLE_WAIT_L2_QUERY;
	WREG32(MC_VM_L1_TLB_MCD_RD_A_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCD_WR_A_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCD_RD_B_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCD_WR_B_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_RD_GFX_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_WR_GFX_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_RD_PDMA_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_WR_PDMA_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_RD_SEM_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_WR_SEM_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_RD_SYS_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_WR_SYS_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_RD_HDP_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_WR_HDP_CNTL, tmp);
	if (rdev->gart.table.vram.robj) {
		r = radeon_bo_reserve(rdev->gart.table.vram.robj, false);
		if (likely(r == 0)) {
			radeon_bo_kunmap(rdev->gart.table.vram.robj);
			radeon_bo_unpin(rdev->gart.table.vram.robj);
			radeon_bo_unreserve(rdev->gart.table.vram.robj);
		}
	}
}
void r600_pcie_gart_fini(struct radeon_device *rdev)
{
	radeon_gart_fini(rdev);
	r600_pcie_gart_disable(rdev);
	radeon_gart_table_vram_free(rdev);
}
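
/*
 * AGP counterpart of r600_pcie_gart_enable(): the same L2/TLB setup, but
 * with every VM context left disabled, as the AGP path does not go
 * through the internal GART page tables.
 */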
void r600_agp_enable(struct radeon_device *rdev)
{
	u32 tmp;
	int i;

	/* Setup L2 cache */
	WREG32(VM_L2_CNTL, ENABLE_L2_CACHE | ENABLE_L2_FRAGMENT_PROCESSING |
				ENABLE_L2_PTE_CACHE_LRU_UPDATE_BY_WRITE |
				EFFECTIVE_L2_QUEUE_SIZE(7));
	WREG32(VM_L2_CNTL2, 0);
	WREG32(VM_L2_CNTL3, BANK_SELECT_0(0) | BANK_SELECT_1(1));
	/* Setup TLB control */
	tmp = ENABLE_L1_TLB | ENABLE_L1_FRAGMENT_PROCESSING |
		SYSTEM_ACCESS_MODE_NOT_IN_SYS |
		EFFECTIVE_L1_TLB_SIZE(5) | EFFECTIVE_L1_QUEUE_SIZE(5) |
		ENABLE_WAIT_L2_QUERY;
	WREG32(MC_VM_L1_TLB_MCB_RD_SYS_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_WR_SYS_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_RD_HDP_CNTL, tmp | ENABLE_L1_STRICT_ORDERING);
	WREG32(MC_VM_L1_TLB_MCB_WR_HDP_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCD_RD_A_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCD_WR_A_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCD_RD_B_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCD_WR_B_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_RD_GFX_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_WR_GFX_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_RD_PDMA_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_WR_PDMA_CNTL, tmp);
	WREG32(MC_VM_L1_TLB_MCB_RD_SEM_CNTL, tmp | ENABLE_SEMAPHORE_MODE);
	WREG32(MC_VM_L1_TLB_MCB_WR_SEM_CNTL, tmp | ENABLE_SEMAPHORE_MODE);
	for (i = 0; i < 7; i++)
		WREG32(VM_CONTEXT0_CNTL + (i * 4), 0);
}
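
/* poll SRBM_STATUS until the memory controller reports idle */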
int r600_mc_wait_for_idle(struct radeon_device *rdev)
{
	unsigned i;
	u32 tmp;

	for (i = 0; i < rdev->usec_timeout; i++) {
		/* read MC_STATUS */
		tmp = RREG32(R_000E50_SRBM_STATUS) & 0x3F00;
		if (!tmp)
			return 0;
		udelay(1);
	}
	return -1;
}
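
/*
 * Program the memory controller apertures (VRAM, AGP and system) from
 * the layout computed in r600_vram_gtt_location(), with the MC stopped
 * and the VGA renderer locked out.
 */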
static void r600_mc_program(struct radeon_device *rdev)
{
	struct rv515_mc_save save;
	u32 tmp;
	int i, j;

	/* Initialize HDP */
	for (i = 0, j = 0; i < 32; i++, j += 0x18) {
		WREG32((0x2c14 + j), 0x00000000);
		WREG32((0x2c18 + j), 0x00000000);
		WREG32((0x2c1c + j), 0x00000000);
		WREG32((0x2c20 + j), 0x00000000);
		WREG32((0x2c24 + j), 0x00000000);
	}
	WREG32(HDP_REG_COHERENCY_FLUSH_CNTL, 0);

	rv515_mc_stop(rdev, &save);
	if (r600_mc_wait_for_idle(rdev)) {
		dev_warn(rdev->dev, "Wait for MC idle timed out!\n");
	}
	/* Lockout access through VGA aperture (doesn't exist before R600) */
	WREG32(VGA_HDP_CONTROL, VGA_MEMORY_DISABLE);
	/* Update configuration */
	if (rdev->flags & RADEON_IS_AGP) {
		if (rdev->mc.vram_start < rdev->mc.gtt_start) {
			/* VRAM before AGP */
			WREG32(MC_VM_SYSTEM_APERTURE_LOW_ADDR,
				rdev->mc.vram_start >> 12);
			WREG32(MC_VM_SYSTEM_APERTURE_HIGH_ADDR,
				rdev->mc.gtt_end >> 12);
		} else {
			/* VRAM after AGP */
			WREG32(MC_VM_SYSTEM_APERTURE_LOW_ADDR,
				rdev->mc.gtt_start >> 12);
			WREG32(MC_VM_SYSTEM_APERTURE_HIGH_ADDR,
				rdev->mc.vram_end >> 12);
		}
	} else {
		WREG32(MC_VM_SYSTEM_APERTURE_LOW_ADDR, rdev->mc.vram_start >> 12);
		WREG32(MC_VM_SYSTEM_APERTURE_HIGH_ADDR, rdev->mc.vram_end >> 12);
	}
	WREG32(MC_VM_SYSTEM_APERTURE_DEFAULT_ADDR, 0);
	tmp = ((rdev->mc.vram_end >> 24) & 0xFFFF) << 16;
	tmp |= ((rdev->mc.vram_start >> 24) & 0xFFFF);
	WREG32(MC_VM_FB_LOCATION, tmp);
	WREG32(HDP_NONSURFACE_BASE, (rdev->mc.vram_start >> 8));
	WREG32(HDP_NONSURFACE_INFO, (2 << 7));
	WREG32(HDP_NONSURFACE_SIZE, 0x3FFFFFFF);
	if (rdev->flags & RADEON_IS_AGP) {
		WREG32(MC_VM_AGP_TOP, rdev->mc.gtt_end >> 22);
		WREG32(MC_VM_AGP_BOT, rdev->mc.gtt_start >> 22);
		WREG32(MC_VM_AGP_BASE, rdev->mc.agp_base >> 22);
	} else {
		WREG32(MC_VM_AGP_BASE, 0);
		WREG32(MC_VM_AGP_TOP, 0x0FFFFFFF);
		WREG32(MC_VM_AGP_BOT, 0x0FFFFFFF);
	}
	if (r600_mc_wait_for_idle(rdev)) {
		dev_warn(rdev->dev, "Wait for MC idle timed out!\n");
	}
	rv515_mc_resume(rdev, &save);
	/* we need to own VRAM, so turn off the VGA renderer here
	 * to stop it overwriting our objects */
	rv515_vga_render_disable(rdev);
}
/**
 * r600_vram_gtt_location - try to find VRAM & GTT location
 * @rdev: radeon device structure holding all necessary information
 * @mc: memory controller structure holding memory information
 *
 * Try to place VRAM at the same address the GPU sees in the CPU (PCI)
 * address space, as some GPUs have issues when VRAM is reprogrammed to a
 * different address.
 *
 * If there is not enough space to fit the invisible VRAM after the
 * aperture, limit the VRAM size to the aperture.
 *
 * If we are using AGP, place VRAM adjacent to the AGP aperture; the GPU
 * needs them to form one contiguous range so that it can catch accesses
 * outside of them (weird GPU policy, see ??).
 *
 * This function never fails; in the worst case it limits VRAM or GTT.
 *
 * Note: GTT start, end and size should be initialized before calling this
 * function on an AGP platform.
 */
static void r600_vram_gtt_location(struct radeon_device *rdev, struct radeon_mc *mc)
{
	u64 size_bf, size_af;

	if (mc->mc_vram_size > 0xE0000000) {
		/* leave room for at least 512M GTT */
		dev_warn(rdev->dev, "limiting VRAM\n");
		mc->real_vram_size = 0xE0000000;
		mc->mc_vram_size = 0xE0000000;
	}
	if (rdev->flags & RADEON_IS_AGP) {
		size_bf = mc->gtt_start;
		size_af = 0xFFFFFFFF - mc->gtt_end + 1;
		if (size_bf > size_af) {
			if (mc->mc_vram_size > size_bf) {
				dev_warn(rdev->dev, "limiting VRAM\n");
				mc->real_vram_size = size_bf;
				mc->mc_vram_size = size_bf;
			}
			mc->vram_start = mc->gtt_start - mc->mc_vram_size;
		} else {
			if (mc->mc_vram_size > size_af) {
				dev_warn(rdev->dev, "limiting VRAM\n");
				mc->real_vram_size = size_af;
				mc->mc_vram_size = size_af;
			}
			mc->vram_start = mc->gtt_end;
		}
		mc->vram_end = mc->vram_start + mc->mc_vram_size - 1;
		dev_info(rdev->dev, "VRAM: %lluM 0x%08llX - 0x%08llX (%lluM used)\n",
				mc->mc_vram_size >> 20, mc->vram_start,
				mc->vram_end, mc->real_vram_size >> 20);
	} else {
		u64 base = 0;
		if (rdev->flags & RADEON_IS_IGP) {
			base = RREG32(MC_VM_FB_LOCATION) & 0xFFFF;
			base <<= 24;
		}
		radeon_vram_location(rdev, &rdev->mc, base);
		rdev->mc.gtt_base_align = 0;
		radeon_gtt_location(rdev, mc);
	}
}
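
/*
 * Read back the VRAM configuration (channel count and width, sizes) and
 * work out the GPU address space layout.
 */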
int r600_mc_init(struct radeon_device *rdev)
{
	u32 tmp;
	int chansize, numchan;

	/* Get VRAM information */
	rdev->mc.vram_is_ddr = true;
	tmp = RREG32(RAMCFG);
	if (tmp & CHANSIZE_OVERRIDE) {
		chansize = 16;
	} else if (tmp & CHANSIZE_MASK) {
		chansize = 64;
	} else {
		chansize = 32;
	}
	tmp = RREG32(CHMAP);
	switch ((tmp & NOOFCHAN_MASK) >> NOOFCHAN_SHIFT) {
	case 0:
	default:
		numchan = 1;
		break;
	case 1:
		numchan = 2;
		break;
	case 2:
		numchan = 4;
		break;
	case 3:
		numchan = 8;
		break;
	}
	rdev->mc.vram_width = numchan * chansize;
	/* Could aper size report 0 ? */
	rdev->mc.aper_base = pci_resource_start(rdev->pdev, 0);
	rdev->mc.aper_size = pci_resource_len(rdev->pdev, 0);
	/* Setup GPU memory space */
	rdev->mc.mc_vram_size = RREG32(CONFIG_MEMSIZE);
	rdev->mc.real_vram_size = RREG32(CONFIG_MEMSIZE);
	rdev->mc.visible_vram_size = rdev->mc.aper_size;
	r600_vram_gtt_location(rdev, &rdev->mc);

	if (rdev->flags & RADEON_IS_IGP) {
		rs690_pm_info(rdev);
		rdev->mc.igp_sideport_enabled = radeon_atombios_sideport_present(rdev);
	}
	radeon_update_bandwidth_info(rdev);
	return 0;
}
/* We don't check whether the GPU really needs a reset; we simply do the
 * reset. It's up to the caller to determine if the GPU needs one. We
 * might add a helper function to check that.
 */
int r600_gpu_soft_reset(struct radeon_device *rdev)
{
	struct rv515_mc_save save;
	u32 grbm_busy_mask = S_008010_VC_BUSY(1) | S_008010_VGT_BUSY_NO_DMA(1) |
				S_008010_VGT_BUSY(1) | S_008010_TA03_BUSY(1) |
				S_008010_TC_BUSY(1) | S_008010_SX_BUSY(1) |
				S_008010_SH_BUSY(1) | S_008010_SPI03_BUSY(1) |
				S_008010_SMX_BUSY(1) | S_008010_SC_BUSY(1) |
				S_008010_PA_BUSY(1) | S_008010_DB03_BUSY(1) |
				S_008010_CR_BUSY(1) | S_008010_CB03_BUSY(1) |
				S_008010_GUI_ACTIVE(1);
	u32 grbm2_busy_mask = S_008014_SPI0_BUSY(1) | S_008014_SPI1_BUSY(1) |
			S_008014_SPI2_BUSY(1) | S_008014_SPI3_BUSY(1) |
			S_008014_TA0_BUSY(1) | S_008014_TA1_BUSY(1) |
			S_008014_TA2_BUSY(1) | S_008014_TA3_BUSY(1) |
			S_008014_DB0_BUSY(1) | S_008014_DB1_BUSY(1) |
			S_008014_DB2_BUSY(1) | S_008014_DB3_BUSY(1) |
			S_008014_CB0_BUSY(1) | S_008014_CB1_BUSY(1) |
			S_008014_CB2_BUSY(1) | S_008014_CB3_BUSY(1);
	u32 tmp;

	if (!(RREG32(GRBM_STATUS) & GUI_ACTIVE))
		return 0;

	dev_info(rdev->dev, "GPU softreset\n");
	dev_info(rdev->dev, "  R_008010_GRBM_STATUS=0x%08X\n",
		RREG32(R_008010_GRBM_STATUS));
	dev_info(rdev->dev, "  R_008014_GRBM_STATUS2=0x%08X\n",
		RREG32(R_008014_GRBM_STATUS2));
	dev_info(rdev->dev, "  R_000E50_SRBM_STATUS=0x%08X\n",
		RREG32(R_000E50_SRBM_STATUS));
	rv515_mc_stop(rdev, &save);
	if (r600_mc_wait_for_idle(rdev)) {
		dev_warn(rdev->dev, "Wait for MC idle timed out!\n");
	}
	/* Disable CP parsing/prefetching */
	WREG32(R_0086D8_CP_ME_CNTL, S_0086D8_CP_ME_HALT(1));
	/* Check if any of the rendering block is busy and reset it */
	if ((RREG32(R_008010_GRBM_STATUS) & grbm_busy_mask) ||
	    (RREG32(R_008014_GRBM_STATUS2) & grbm2_busy_mask)) {
		tmp = S_008020_SOFT_RESET_CR(1) |
			S_008020_SOFT_RESET_DB(1) |
			S_008020_SOFT_RESET_CB(1) |
			S_008020_SOFT_RESET_PA(1) |
			S_008020_SOFT_RESET_SC(1) |
			S_008020_SOFT_RESET_SMX(1) |
			S_008020_SOFT_RESET_SPI(1) |
			S_008020_SOFT_RESET_SX(1) |
			S_008020_SOFT_RESET_SH(1) |
			S_008020_SOFT_RESET_TC(1) |
			S_008020_SOFT_RESET_TA(1) |
			S_008020_SOFT_RESET_VC(1) |
			S_008020_SOFT_RESET_VGT(1);
		dev_info(rdev->dev, "  R_008020_GRBM_SOFT_RESET=0x%08X\n", tmp);
		WREG32(R_008020_GRBM_SOFT_RESET, tmp);
		RREG32(R_008020_GRBM_SOFT_RESET);
		mdelay(15);
		WREG32(R_008020_GRBM_SOFT_RESET, 0);
	}
	/* Reset CP (we always reset CP) */
	tmp = S_008020_SOFT_RESET_CP(1);
	dev_info(rdev->dev, "R_008020_GRBM_SOFT_RESET=0x%08X\n", tmp);
	WREG32(R_008020_GRBM_SOFT_RESET, tmp);
	RREG32(R_008020_GRBM_SOFT_RESET);
	mdelay(15);
	WREG32(R_008020_GRBM_SOFT_RESET, 0);
	/* Wait a little for things to settle down */
	mdelay(1);
	dev_info(rdev->dev, "  R_008010_GRBM_STATUS=0x%08X\n",
		RREG32(R_008010_GRBM_STATUS));
	dev_info(rdev->dev, "  R_008014_GRBM_STATUS2=0x%08X\n",
		RREG32(R_008014_GRBM_STATUS2));
	dev_info(rdev->dev, "  R_000E50_SRBM_STATUS=0x%08X\n",
		RREG32(R_000E50_SRBM_STATUS));
	rv515_mc_resume(rdev, &save);
	return 0;
}
bool r600_gpu_is_lockup(struct radeon_device *rdev)
{
	u32 srbm_status;
	u32 grbm_status;
	u32 grbm_status2;
	struct r100_gpu_lockup *lockup;
	int r;

	if (rdev->family >= CHIP_RV770)
		lockup = &rdev->config.rv770.lockup;
	else
		lockup = &rdev->config.r600.lockup;

	srbm_status = RREG32(R_000E50_SRBM_STATUS);
	grbm_status = RREG32(R_008010_GRBM_STATUS);
	grbm_status2 = RREG32(R_008014_GRBM_STATUS2);
	if (!G_008010_GUI_ACTIVE(grbm_status)) {
		r100_gpu_lockup_update(lockup, &rdev->cp);
		return false;
	}
	/* force CP activities */
	r = radeon_ring_lock(rdev, 2);
	if (!r) {
		/* PACKET2 NOP */
		radeon_ring_write(rdev, 0x80000000);
		radeon_ring_write(rdev, 0x80000000);
		radeon_ring_unlock_commit(rdev);
	}
	rdev->cp.rptr = RREG32(R600_CP_RB_RPTR);
	return r100_gpu_cp_is_lockup(rdev, lockup, &rdev->cp);
}
int r600_asic_reset(struct radeon_device *rdev)
{
	return r600_gpu_soft_reset(rdev);
}
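
/*
 * Build the pipe-to-backend map written into GB_TILING_CONFIG: walk the
 * tile pipes in swizzled order and assign each one the next enabled
 * render backend, two bits per pipe.
 */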
static u32 r600_get_tile_pipe_to_backend_map(u32 num_tile_pipes,
					     u32 num_backends,
					     u32 backend_disable_mask)
{
	u32 backend_map = 0;
	u32 enabled_backends_mask;
	u32 enabled_backends_count;
	u32 cur_pipe;
	u32 swizzle_pipe[R6XX_MAX_PIPES];
	u32 cur_backend;
	u32 i;

	if (num_tile_pipes > R6XX_MAX_PIPES)
		num_tile_pipes = R6XX_MAX_PIPES;
	if (num_tile_pipes < 1)
		num_tile_pipes = 1;
	if (num_backends > R6XX_MAX_BACKENDS)
		num_backends = R6XX_MAX_BACKENDS;
	if (num_backends < 1)
		num_backends = 1;

	enabled_backends_mask = 0;
	enabled_backends_count = 0;
	for (i = 0; i < R6XX_MAX_BACKENDS; ++i) {
		if (((backend_disable_mask >> i) & 1) == 0) {
			enabled_backends_mask |= (1 << i);
			++enabled_backends_count;
		}
		if (enabled_backends_count == num_backends)
			break;
	}

	if (enabled_backends_count == 0) {
		enabled_backends_mask = 1;
		enabled_backends_count = 1;
	}

	if (enabled_backends_count != num_backends)
		num_backends = enabled_backends_count;

	memset((uint8_t *)&swizzle_pipe[0], 0, sizeof(u32) * R6XX_MAX_PIPES);
	switch (num_tile_pipes) {
	case 1:
		swizzle_pipe[0] = 0;
		break;
	case 2:
		swizzle_pipe[0] = 0;
		swizzle_pipe[1] = 1;
		break;
	case 3:
		swizzle_pipe[0] = 0;
		swizzle_pipe[1] = 1;
		swizzle_pipe[2] = 2;
		break;
	case 4:
		swizzle_pipe[0] = 0;
		swizzle_pipe[1] = 1;
		swizzle_pipe[2] = 2;
		swizzle_pipe[3] = 3;
		break;
	case 5:
		swizzle_pipe[0] = 0;
		swizzle_pipe[1] = 1;
		swizzle_pipe[2] = 2;
		swizzle_pipe[3] = 3;
		swizzle_pipe[4] = 4;
		break;
	case 6:
		swizzle_pipe[0] = 0;
		swizzle_pipe[1] = 2;
		swizzle_pipe[2] = 4;
		swizzle_pipe[3] = 5;
		swizzle_pipe[4] = 1;
		swizzle_pipe[5] = 3;
		break;
	case 7:
		swizzle_pipe[0] = 0;
		swizzle_pipe[1] = 2;
		swizzle_pipe[2] = 4;
		swizzle_pipe[3] = 6;
		swizzle_pipe[4] = 1;
		swizzle_pipe[5] = 3;
		swizzle_pipe[6] = 5;
		break;
	case 8:
		swizzle_pipe[0] = 0;
		swizzle_pipe[1] = 2;
		swizzle_pipe[2] = 4;
		swizzle_pipe[3] = 6;
		swizzle_pipe[4] = 1;
		swizzle_pipe[5] = 3;
		swizzle_pipe[6] = 5;
		swizzle_pipe[7] = 7;
		break;
	}

	cur_backend = 0;
	for (cur_pipe = 0; cur_pipe < num_tile_pipes; ++cur_pipe) {
		while (((1 << cur_backend) & enabled_backends_mask) == 0)
			cur_backend = (cur_backend + 1) % R6XX_MAX_BACKENDS;

		backend_map |= (u32)(((cur_backend & 3) << (swizzle_pipe[cur_pipe] * 2)));

		cur_backend = (cur_backend + 1) % R6XX_MAX_BACKENDS;
	}

	return backend_map;
}
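
/* count the bits set in a pipe/backend mask */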
int r600_count_pipe_bits(uint32_t val)
{
	int i, ret = 0;

	for (i = 0; i < 32; i++) {
		ret += val & 1;
		val >>= 1;
	}
	return ret;
}
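
/*
 * One-time 3D engine setup: per-family limits, tiling configuration,
 * the backend map, and the default SQ/VGT/PA state that the 2D/3D
 * drivers later adjust.
 */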
void r600_gpu_init(struct radeon_device *rdev)
{
	u32 tiling_config;
	u32 ramcfg;
	u32 backend_map;
	u32 cc_rb_backend_disable;
	u32 cc_gc_shader_pipe_config;
	u32 tmp;
	int i, j;
	u32 sq_config;
	u32 sq_gpr_resource_mgmt_1 = 0;
	u32 sq_gpr_resource_mgmt_2 = 0;
	u32 sq_thread_resource_mgmt = 0;
	u32 sq_stack_resource_mgmt_1 = 0;
	u32 sq_stack_resource_mgmt_2 = 0;

	/* FIXME: implement */
	switch (rdev->family) {
	case CHIP_R600:
		rdev->config.r600.max_pipes = 4;
		rdev->config.r600.max_tile_pipes = 8;
		rdev->config.r600.max_simds = 4;
		rdev->config.r600.max_backends = 4;
		rdev->config.r600.max_gprs = 256;
		rdev->config.r600.max_threads = 192;
		rdev->config.r600.max_stack_entries = 256;
		rdev->config.r600.max_hw_contexts = 8;
		rdev->config.r600.max_gs_threads = 16;
		rdev->config.r600.sx_max_export_size = 128;
		rdev->config.r600.sx_max_export_pos_size = 16;
		rdev->config.r600.sx_max_export_smx_size = 128;
		rdev->config.r600.sq_num_cf_insts = 2;
		break;
	case CHIP_RV630:
	case CHIP_RV635:
		rdev->config.r600.max_pipes = 2;
		rdev->config.r600.max_tile_pipes = 2;
		rdev->config.r600.max_simds = 3;
		rdev->config.r600.max_backends = 1;
		rdev->config.r600.max_gprs = 128;
		rdev->config.r600.max_threads = 192;
		rdev->config.r600.max_stack_entries = 128;
		rdev->config.r600.max_hw_contexts = 8;
		rdev->config.r600.max_gs_threads = 4;
		rdev->config.r600.sx_max_export_size = 128;
		rdev->config.r600.sx_max_export_pos_size = 16;
		rdev->config.r600.sx_max_export_smx_size = 128;
		rdev->config.r600.sq_num_cf_insts = 2;
		break;
	case CHIP_RV610:
	case CHIP_RV620:
	case CHIP_RS780:
	case CHIP_RS880:
		rdev->config.r600.max_pipes = 1;
		rdev->config.r600.max_tile_pipes = 1;
		rdev->config.r600.max_simds = 2;
		rdev->config.r600.max_backends = 1;
		rdev->config.r600.max_gprs = 128;
		rdev->config.r600.max_threads = 192;
		rdev->config.r600.max_stack_entries = 128;
		rdev->config.r600.max_hw_contexts = 4;
		rdev->config.r600.max_gs_threads = 4;
		rdev->config.r600.sx_max_export_size = 128;
		rdev->config.r600.sx_max_export_pos_size = 16;
		rdev->config.r600.sx_max_export_smx_size = 128;
		rdev->config.r600.sq_num_cf_insts = 1;
		break;
	case CHIP_RV670:
		rdev->config.r600.max_pipes = 4;
		rdev->config.r600.max_tile_pipes = 4;
		rdev->config.r600.max_simds = 4;
		rdev->config.r600.max_backends = 4;
		rdev->config.r600.max_gprs = 192;
		rdev->config.r600.max_threads = 192;
		rdev->config.r600.max_stack_entries = 256;
		rdev->config.r600.max_hw_contexts = 8;
		rdev->config.r600.max_gs_threads = 16;
		rdev->config.r600.sx_max_export_size = 128;
		rdev->config.r600.sx_max_export_pos_size = 16;
		rdev->config.r600.sx_max_export_smx_size = 128;
		rdev->config.r600.sq_num_cf_insts = 2;
		break;
	default:
		break;
	}
	/* Initialize HDP */
	for (i = 0, j = 0; i < 32; i++, j += 0x18) {
		WREG32((0x2c14 + j), 0x00000000);
		WREG32((0x2c18 + j), 0x00000000);
		WREG32((0x2c1c + j), 0x00000000);
		WREG32((0x2c20 + j), 0x00000000);
		WREG32((0x2c24 + j), 0x00000000);
	}

	WREG32(GRBM_CNTL, GRBM_READ_TIMEOUT(0xff));
	/* Setup tiling */
	tiling_config = 0;
	ramcfg = RREG32(RAMCFG);
	switch (rdev->config.r600.max_tile_pipes) {
	case 1:
		tiling_config |= PIPE_TILING(0);
		break;
	case 2:
		tiling_config |= PIPE_TILING(1);
		break;
	case 4:
		tiling_config |= PIPE_TILING(2);
		break;
	case 8:
		tiling_config |= PIPE_TILING(3);
		break;
	default:
		break;
	}
	rdev->config.r600.tiling_npipes = rdev->config.r600.max_tile_pipes;
	rdev->config.r600.tiling_nbanks = 4 << ((ramcfg & NOOFBANK_MASK) >> NOOFBANK_SHIFT);
	tiling_config |= BANK_TILING((ramcfg & NOOFBANK_MASK) >> NOOFBANK_SHIFT);
	tiling_config |= GROUP_SIZE((ramcfg & BURSTLENGTH_MASK) >> BURSTLENGTH_SHIFT);
	if ((ramcfg & BURSTLENGTH_MASK) >> BURSTLENGTH_SHIFT)
		rdev->config.r600.tiling_group_size = 512;
	else
		rdev->config.r600.tiling_group_size = 256;
	tmp = (ramcfg & NOOFROWS_MASK) >> NOOFROWS_SHIFT;
	if (tmp > 3) {
		tiling_config |= ROW_TILING(3);
		tiling_config |= SAMPLE_SPLIT(3);
	} else {
		tiling_config |= ROW_TILING(tmp);
		tiling_config |= SAMPLE_SPLIT(tmp);
	}
	tiling_config |= BANK_SWAPS(1);
	cc_rb_backend_disable = RREG32(CC_RB_BACKEND_DISABLE) & 0x00ff0000;
	cc_rb_backend_disable |=
		BACKEND_DISABLE((R6XX_MAX_BACKENDS_MASK << rdev->config.r600.max_backends) & R6XX_MAX_BACKENDS_MASK);

	cc_gc_shader_pipe_config = RREG32(CC_GC_SHADER_PIPE_CONFIG) & 0xffffff00;
	cc_gc_shader_pipe_config |=
		INACTIVE_QD_PIPES((R6XX_MAX_PIPES_MASK << rdev->config.r600.max_pipes) & R6XX_MAX_PIPES_MASK);
	cc_gc_shader_pipe_config |=
		INACTIVE_SIMDS((R6XX_MAX_SIMDS_MASK << rdev->config.r600.max_simds) & R6XX_MAX_SIMDS_MASK);

	backend_map = r600_get_tile_pipe_to_backend_map(rdev->config.r600.max_tile_pipes,
							(R6XX_MAX_BACKENDS -
							 r600_count_pipe_bits((cc_rb_backend_disable &
									       R6XX_MAX_BACKENDS_MASK) >> 16)),
							(cc_rb_backend_disable >> 16));
	rdev->config.r600.tile_config = tiling_config;
	rdev->config.r600.backend_map = backend_map;
	tiling_config |= BACKEND_MAP(backend_map);
	WREG32(GB_TILING_CONFIG, tiling_config);
	WREG32(DCP_TILING_CONFIG, tiling_config & 0xffff);
	WREG32(HDP_TILING_CONFIG, tiling_config & 0xffff);

	/* Setup pipes */
	WREG32(CC_RB_BACKEND_DISABLE, cc_rb_backend_disable);
	WREG32(CC_GC_SHADER_PIPE_CONFIG, cc_gc_shader_pipe_config);
	WREG32(GC_USER_SHADER_PIPE_CONFIG, cc_gc_shader_pipe_config);

	tmp = R6XX_MAX_PIPES - r600_count_pipe_bits((cc_gc_shader_pipe_config & INACTIVE_QD_PIPES_MASK) >> 8);
	WREG32(VGT_OUT_DEALLOC_CNTL, (tmp * 4) & DEALLOC_DIST_MASK);
	WREG32(VGT_VERTEX_REUSE_BLOCK_CNTL, ((tmp * 4) - 2) & VTX_REUSE_DEPTH_MASK);
	/* Setup some CP states */
	WREG32(CP_QUEUE_THRESHOLDS, (ROQ_IB1_START(0x16) | ROQ_IB2_START(0x2b)));
	WREG32(CP_MEQ_THRESHOLDS, (MEQ_END(0x40) | ROQ_END(0x40)));

	WREG32(TA_CNTL_AUX, (DISABLE_CUBE_ANISO | SYNC_GRADIENT |
			     SYNC_WALKER | SYNC_ALIGNER));
	/* Setup various GPU states */
	if (rdev->family == CHIP_RV670)
		WREG32(ARB_GDEC_RD_CNTL, 0x00000021);

	tmp = RREG32(SX_DEBUG_1);
	tmp |= SMX_EVENT_RELEASE;
	if ((rdev->family > CHIP_R600))
		tmp |= ENABLE_NEW_SMX_ADDRESS;
	WREG32(SX_DEBUG_1, tmp);

	if (((rdev->family) == CHIP_R600) ||
	    ((rdev->family) == CHIP_RV630) ||
	    ((rdev->family) == CHIP_RV610) ||
	    ((rdev->family) == CHIP_RV620) ||
	    ((rdev->family) == CHIP_RS780) ||
	    ((rdev->family) == CHIP_RS880)) {
		WREG32(DB_DEBUG, PREZ_MUST_WAIT_FOR_POSTZ_DONE);
	} else {
		WREG32(DB_DEBUG, 0);
	}
	WREG32(DB_WATERMARKS, (DEPTH_FREE(4) | DEPTH_CACHELINE_FREE(16) |
			       DEPTH_FLUSH(16) | DEPTH_PENDING_FREE(4)));

	WREG32(PA_SC_MULTI_CHIP_CNTL, 0);
	WREG32(VGT_NUM_INSTANCES, 0);

	WREG32(SPI_CONFIG_CNTL, GPR_WRITE_PRIORITY(0));
	WREG32(SPI_CONFIG_CNTL_1, VTX_DONE_DELAY(0));

	tmp = RREG32(SQ_MS_FIFO_SIZES);
	if (((rdev->family) == CHIP_RV610) ||
	    ((rdev->family) == CHIP_RV620) ||
	    ((rdev->family) == CHIP_RS780) ||
	    ((rdev->family) == CHIP_RS880)) {
		tmp = (CACHE_FIFO_SIZE(0xa) |
		       FETCH_FIFO_HIWATER(0xa) |
		       DONE_FIFO_HIWATER(0xe0) |
		       ALU_UPDATE_FIFO_HIWATER(0x8));
	} else if (((rdev->family) == CHIP_R600) ||
		   ((rdev->family) == CHIP_RV630)) {
		tmp &= ~DONE_FIFO_HIWATER(0xff);
		tmp |= DONE_FIFO_HIWATER(0x4);
	}
	WREG32(SQ_MS_FIFO_SIZES, tmp);
1735 /* SQ_CONFIG, SQ_GPR_RESOURCE_MGMT, SQ_THREAD_RESOURCE_MGMT, SQ_STACK_RESOURCE_MGMT
1736 * should be adjusted as needed by the 2D/3D drivers. This just sets default values
1738 sq_config = RREG32(SQ_CONFIG);
1739 sq_config &= ~(PS_PRIO(3) |
1743 sq_config |= (DX9_CONSTS |
1750 if ((rdev->family) == CHIP_R600) {
1751 sq_gpr_resource_mgmt_1 = (NUM_PS_GPRS(124) |
1753 NUM_CLAUSE_TEMP_GPRS(4));
1754 sq_gpr_resource_mgmt_2 = (NUM_GS_GPRS(0) |
1756 sq_thread_resource_mgmt = (NUM_PS_THREADS(136) |
1757 NUM_VS_THREADS(48) |
1760 sq_stack_resource_mgmt_1 = (NUM_PS_STACK_ENTRIES(128) |
1761 NUM_VS_STACK_ENTRIES(128));
1762 sq_stack_resource_mgmt_2 = (NUM_GS_STACK_ENTRIES(0) |
1763 NUM_ES_STACK_ENTRIES(0));
1764 } else if (((rdev->family) == CHIP_RV610) ||
1765 ((rdev->family) == CHIP_RV620) ||
1766 ((rdev->family) == CHIP_RS780) ||
1767 ((rdev->family) == CHIP_RS880)) {
1768 /* no vertex cache */
1769 sq_config &= ~VC_ENABLE;
1771 sq_gpr_resource_mgmt_1 = (NUM_PS_GPRS(44) |
1772 NUM_VS_GPRS(44) |
1773 NUM_CLAUSE_TEMP_GPRS(2));
1774 sq_gpr_resource_mgmt_2 = (NUM_GS_GPRS(17) |
1775 NUM_ES_GPRS(17));
1776 sq_thread_resource_mgmt = (NUM_PS_THREADS(79) |
1777 NUM_VS_THREADS(78) |
1778 NUM_GS_THREADS(4) |
1779 NUM_ES_THREADS(31));
1780 sq_stack_resource_mgmt_1 = (NUM_PS_STACK_ENTRIES(40) |
1781 NUM_VS_STACK_ENTRIES(40));
1782 sq_stack_resource_mgmt_2 = (NUM_GS_STACK_ENTRIES(32) |
1783 NUM_ES_STACK_ENTRIES(16));
1784 } else if (((rdev->family) == CHIP_RV630) ||
1785 ((rdev->family) == CHIP_RV635)) {
1786 sq_gpr_resource_mgmt_1 = (NUM_PS_GPRS(44) |
1787 NUM_VS_GPRS(44) |
1788 NUM_CLAUSE_TEMP_GPRS(2));
1789 sq_gpr_resource_mgmt_2 = (NUM_GS_GPRS(18) |
1790 NUM_ES_GPRS(18));
1791 sq_thread_resource_mgmt = (NUM_PS_THREADS(79) |
1792 NUM_VS_THREADS(78) |
1793 NUM_GS_THREADS(4) |
1794 NUM_ES_THREADS(31));
1795 sq_stack_resource_mgmt_1 = (NUM_PS_STACK_ENTRIES(40) |
1796 NUM_VS_STACK_ENTRIES(40));
1797 sq_stack_resource_mgmt_2 = (NUM_GS_STACK_ENTRIES(32) |
1798 NUM_ES_STACK_ENTRIES(16));
1799 } else if ((rdev->family) == CHIP_RV670) {
1800 sq_gpr_resource_mgmt_1 = (NUM_PS_GPRS(44) |
1801 NUM_VS_GPRS(44) |
1802 NUM_CLAUSE_TEMP_GPRS(2));
1803 sq_gpr_resource_mgmt_2 = (NUM_GS_GPRS(17) |
1804 NUM_ES_GPRS(17));
1805 sq_thread_resource_mgmt = (NUM_PS_THREADS(79) |
1806 NUM_VS_THREADS(78) |
1807 NUM_GS_THREADS(4) |
1808 NUM_ES_THREADS(31));
1809 sq_stack_resource_mgmt_1 = (NUM_PS_STACK_ENTRIES(64) |
1810 NUM_VS_STACK_ENTRIES(64));
1811 sq_stack_resource_mgmt_2 = (NUM_GS_STACK_ENTRIES(64) |
1812 NUM_ES_STACK_ENTRIES(64));
1813 }
1815 WREG32(SQ_CONFIG, sq_config);
1816 WREG32(SQ_GPR_RESOURCE_MGMT_1, sq_gpr_resource_mgmt_1);
1817 WREG32(SQ_GPR_RESOURCE_MGMT_2, sq_gpr_resource_mgmt_2);
1818 WREG32(SQ_THREAD_RESOURCE_MGMT, sq_thread_resource_mgmt);
1819 WREG32(SQ_STACK_RESOURCE_MGMT_1, sq_stack_resource_mgmt_1);
1820 WREG32(SQ_STACK_RESOURCE_MGMT_2, sq_stack_resource_mgmt_2);
1822 if (((rdev->family) == CHIP_RV610) ||
1823 ((rdev->family) == CHIP_RV620) ||
1824 ((rdev->family) == CHIP_RS780) ||
1825 ((rdev->family) == CHIP_RS880)) {
1826 WREG32(VGT_CACHE_INVALIDATION, CACHE_INVALIDATION(TC_ONLY));
1827 } else {
1828 WREG32(VGT_CACHE_INVALIDATION, CACHE_INVALIDATION(VC_AND_TC));
1829 }
1831 /* More default values. 2D/3D driver should adjust as needed */
1832 WREG32(PA_SC_AA_SAMPLE_LOCS_2S, (S0_X(0xc) | S0_Y(0x4) |
1833 S1_X(0x4) | S1_Y(0xc)));
1834 WREG32(PA_SC_AA_SAMPLE_LOCS_4S, (S0_X(0xe) | S0_Y(0xe) |
1835 S1_X(0x2) | S1_Y(0x2) |
1836 S2_X(0xa) | S2_Y(0x6) |
1837 S3_X(0x6) | S3_Y(0xa)));
1838 WREG32(PA_SC_AA_SAMPLE_LOCS_8S_WD0, (S0_X(0xe) | S0_Y(0xb) |
1839 S1_X(0x4) | S1_Y(0xc) |
1840 S2_X(0x1) | S2_Y(0x6) |
1841 S3_X(0xa) | S3_Y(0xe)));
1842 WREG32(PA_SC_AA_SAMPLE_LOCS_8S_WD1, (S4_X(0x6) | S4_Y(0x1) |
1843 S5_X(0x0) | S5_Y(0x0) |
1844 S6_X(0xb) | S6_Y(0x4) |
1845 S7_X(0x7) | S7_Y(0x8)));
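/* The S*_X/S*_Y fields above are 4-bit sample positions, i.e. the MSAA
 * samples appear to be placed on a 16x16 sub-pixel grid; the 2x, 4x and
 * 8x tables just spread the samples across that grid. As with the other
 * defaults here, the 2D/3D driver is expected to adjust them. */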
1847 WREG32(VGT_STRMOUT_EN, 0);
1848 tmp = rdev->config.r600.max_pipes * 16;
1849 switch (rdev->family) {
1850 case CHIP_RV610:
1851 case CHIP_RV620:
1852 case CHIP_RS780:
1853 case CHIP_RS880:
1854 tmp += 32;
1855 break;
1856 case CHIP_RV670:
1857 tmp += 128;
1858 break;
1859 default:
1860 break;
1861 }
1862 if (tmp > 256) {
1863 tmp = 256;
1864 }
1865 WREG32(VGT_ES_PER_GS, 128);
1866 WREG32(VGT_GS_PER_ES, tmp);
1867 WREG32(VGT_GS_PER_VS, 2);
1868 WREG32(VGT_GS_VERTEX_REUSE, 16);
1870 /* more default values. 2D/3D driver should adjust as needed */
1871 WREG32(PA_SC_LINE_STIPPLE_STATE, 0);
1872 WREG32(VGT_STRMOUT_EN, 0);
1873 WREG32(SX_MISC, 0);
1874 WREG32(PA_SC_MODE_CNTL, 0);
1875 WREG32(PA_SC_AA_CONFIG, 0);
1876 WREG32(PA_SC_LINE_STIPPLE, 0);
1877 WREG32(SPI_INPUT_Z, 0);
1878 WREG32(SPI_PS_IN_CONTROL_0, NUM_INTERP(2));
1879 WREG32(CB_COLOR7_FRAG, 0);
1881 /* Clear render buffer base addresses */
1882 WREG32(CB_COLOR0_BASE, 0);
1883 WREG32(CB_COLOR1_BASE, 0);
1884 WREG32(CB_COLOR2_BASE, 0);
1885 WREG32(CB_COLOR3_BASE, 0);
1886 WREG32(CB_COLOR4_BASE, 0);
1887 WREG32(CB_COLOR5_BASE, 0);
1888 WREG32(CB_COLOR6_BASE, 0);
1889 WREG32(CB_COLOR7_BASE, 0);
1890 WREG32(CB_COLOR7_FRAG, 0);
1892 switch (rdev->family) {
1893 case CHIP_RV610:
1894 case CHIP_RV620:
1895 case CHIP_RS780:
1896 case CHIP_RS880:
1897 tmp = TC_L2_SIZE(8);
1898 break;
1899 case CHIP_RV630:
1900 case CHIP_RV635:
1901 tmp = TC_L2_SIZE(4);
1902 break;
1903 case CHIP_R600:
1904 tmp = TC_L2_SIZE(0) | L2_DISABLE_LATE_HIT;
1905 break;
1906 default:
1907 tmp = TC_L2_SIZE(0);
1908 break;
1909 }
1910 WREG32(TC_CNTL, tmp);
1912 tmp = RREG32(HDP_HOST_PATH_CNTL);
1913 WREG32(HDP_HOST_PATH_CNTL, tmp);
1915 tmp = RREG32(ARB_POP);
1916 tmp |= ENABLE_TC128;
1917 WREG32(ARB_POP, tmp);
1919 WREG32(PA_SC_MULTI_CHIP_CNTL, 0);
1920 WREG32(PA_CL_ENHANCE, (CLIP_VTX_REORDER_ENA |
1921 NUM_CLIP_SEQ(3)));
1922 WREG32(PA_SC_ENHANCE, FORCE_EOV_MAX_CLK_CNT(4095));
1923 }
1926 /*
1927  * Indirect registers accessor
1928  */
1929 u32 r600_pciep_rreg(struct radeon_device *rdev, u32 reg)
1930 {
1931 u32 r;
1933 WREG32(PCIE_PORT_INDEX, ((reg) & 0xff));
1934 (void)RREG32(PCIE_PORT_INDEX);
1935 r = RREG32(PCIE_PORT_DATA);
1936 return r;
1937 }
1939 void r600_pciep_wreg(struct radeon_device *rdev, u32 reg, u32 v)
1940 {
1941 WREG32(PCIE_PORT_INDEX, ((reg) & 0xff));
1942 (void)RREG32(PCIE_PORT_INDEX);
1943 WREG32(PCIE_PORT_DATA, (v));
1944 (void)RREG32(PCIE_PORT_DATA);
1945 }
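/* Both accessors above follow the usual index/data pattern for an
 * indirect register space: write the register index to PCIE_PORT_INDEX,
 * read it back so the posted write is known to have landed, then access
 * PCIE_PORT_DATA. The trailing read in the write path presumably flushes
 * the data write in the same way. */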
1947 /*
1948  * CP & Ring
1949  */
1950 void r600_cp_stop(struct radeon_device *rdev)
1951 {
1952 radeon_ttm_set_active_vram_size(rdev, rdev->mc.visible_vram_size);
1953 WREG32(R_0086D8_CP_ME_CNTL, S_0086D8_CP_ME_HALT(1));
1954 WREG32(SCRATCH_UMSK, 0);
1955 }
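/* r600_init_microcode() below fetches the three firmware images this
 * family needs: the PFP (prefetch parser) and ME (micro engine) images
 * for the CP, plus the RLC image used by the interrupt controller setup
 * later in this file. chip_name selects the CP images while
 * rlc_chip_name lets several asics share one RLC binary (all r6xx parts
 * use R600_rlc.bin, for instance). */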
1957 int r600_init_microcode(struct radeon_device *rdev)
1958 {
1959 struct platform_device *pdev;
1960 const char *chip_name;
1961 const char *rlc_chip_name;
1962 size_t pfp_req_size, me_req_size, rlc_req_size;
1963 char fw_name[30];
1964 int err;
1966 DRM_DEBUG("\n");
1968 pdev = platform_device_register_simple("radeon_cp", 0, NULL, 0);
1969 err = IS_ERR(pdev);
1970 if (err) {
1971 printk(KERN_ERR "radeon_cp: Failed to register firmware\n");
1972 return -EINVAL;
1973 }
1975 switch (rdev->family) {
1976 case CHIP_R600:
1977 chip_name = "R600";
1978 rlc_chip_name = "R600";
1979 break;
1981 chip_name = "RV610";
1982 rlc_chip_name = "R600";
1985 chip_name = "RV630";
1986 rlc_chip_name = "R600";
1989 chip_name = "RV620";
1990 rlc_chip_name = "R600";
1993 chip_name = "RV635";
1994 rlc_chip_name = "R600";
1997 chip_name = "RV670";
1998 rlc_chip_name = "R600";
2002 chip_name = "RS780";
2003 rlc_chip_name = "R600";
2006 chip_name = "RV770";
2007 rlc_chip_name = "R700";
2011 chip_name = "RV730";
2012 rlc_chip_name = "R700";
2015 chip_name = "RV710";
2016 rlc_chip_name = "R700";
2019 chip_name = "CEDAR";
2020 rlc_chip_name = "CEDAR";
2023 chip_name = "REDWOOD";
2024 rlc_chip_name = "REDWOOD";
2027 chip_name = "JUNIPER";
2028 rlc_chip_name = "JUNIPER";
2032 chip_name = "CYPRESS";
2033 rlc_chip_name = "CYPRESS";
2037 rlc_chip_name = "SUMO";
2041 rlc_chip_name = "SUMO";
2044 chip_name = "SUMO2";
2045 rlc_chip_name = "SUMO";
2050 if (rdev->family >= CHIP_CEDAR) {
2051 pfp_req_size = EVERGREEN_PFP_UCODE_SIZE * 4;
2052 me_req_size = EVERGREEN_PM4_UCODE_SIZE * 4;
2053 rlc_req_size = EVERGREEN_RLC_UCODE_SIZE * 4;
2054 } else if (rdev->family >= CHIP_RV770) {
2055 pfp_req_size = R700_PFP_UCODE_SIZE * 4;
2056 me_req_size = R700_PM4_UCODE_SIZE * 4;
2057 rlc_req_size = R700_RLC_UCODE_SIZE * 4;
2058 } else {
2059 pfp_req_size = PFP_UCODE_SIZE * 4;
2060 me_req_size = PM4_UCODE_SIZE * 12;
2061 rlc_req_size = RLC_UCODE_SIZE * 4;
2062 }
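/* The expected sizes are in bytes. PFP and RLC images hold one dword per
 * ucode word, hence the "* 4"; the r6xx ME image holds three dwords per
 * PM4 ucode word, which is why me_req_size is PM4_UCODE_SIZE * 12 and the
 * loader below iterates PM4_UCODE_SIZE * 3 times. */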
2064 DRM_INFO("Loading %s Microcode\n", chip_name);
2066 snprintf(fw_name, sizeof(fw_name), "radeon/%s_pfp.bin", chip_name);
2067 err = request_firmware(&rdev->pfp_fw, fw_name, &pdev->dev);
2068 if (err)
2069 goto out;
2070 if (rdev->pfp_fw->size != pfp_req_size) {
2071 printk(KERN_ERR
2072 "r600_cp: Bogus length %zu in firmware \"%s\"\n",
2073 rdev->pfp_fw->size, fw_name);
2074 err = -EINVAL;
2075 goto out;
2076 }
2078 snprintf(fw_name, sizeof(fw_name), "radeon/%s_me.bin", chip_name);
2079 err = request_firmware(&rdev->me_fw, fw_name, &pdev->dev);
2080 if (err)
2081 goto out;
2082 if (rdev->me_fw->size != me_req_size) {
2083 printk(KERN_ERR
2084 "r600_cp: Bogus length %zu in firmware \"%s\"\n",
2085 rdev->me_fw->size, fw_name);
2086 err = -EINVAL;
2087 goto out;
2088 }
2089 snprintf(fw_name, sizeof(fw_name), "radeon/%s_rlc.bin", rlc_chip_name);
2090 err = request_firmware(&rdev->rlc_fw, fw_name, &pdev->dev);
2091 if (err)
2092 goto out;
2093 if (rdev->rlc_fw->size != rlc_req_size) {
2094 printk(KERN_ERR
2095 "r600_rlc: Bogus length %zu in firmware \"%s\"\n",
2096 rdev->rlc_fw->size, fw_name);
2097 err = -EINVAL;
2098 goto out;
2099 }
2100 out:
2101 platform_device_unregister(pdev);
2103 if (err) {
2104 if (err != -EINVAL)
2105 printk(KERN_ERR
2106 "r600_cp: Failed to load firmware \"%s\"\n",
2107 fw_name);
2108 release_firmware(rdev->pfp_fw);
2109 rdev->pfp_fw = NULL;
2110 release_firmware(rdev->me_fw);
2111 rdev->me_fw = NULL;
2112 release_firmware(rdev->rlc_fw);
2113 rdev->rlc_fw = NULL;
2114 }
2115 return err;
2116 }
2118 static int r600_cp_load_microcode(struct radeon_device *rdev)
2119 {
2120 const __be32 *fw_data;
2121 int i;
2123 if (!rdev->me_fw || !rdev->pfp_fw)
2124 return -EINVAL;
2126 r600_cp_stop(rdev);
2128 WREG32(CP_RB_CNTL,
2129 #ifdef __BIG_ENDIAN
2130 BUF_SWAP_32BIT |
2131 #endif
2132 RB_NO_UPDATE | RB_BLKSZ(15) | RB_BUFSZ(3));
2134 /* Reset cp */
2135 WREG32(GRBM_SOFT_RESET, SOFT_RESET_CP);
2136 RREG32(GRBM_SOFT_RESET);
2137 mdelay(15);
2138 WREG32(GRBM_SOFT_RESET, 0);
2140 WREG32(CP_ME_RAM_WADDR, 0);
2142 fw_data = (const __be32 *)rdev->me_fw->data;
2143 WREG32(CP_ME_RAM_WADDR, 0);
2144 for (i = 0; i < PM4_UCODE_SIZE * 3; i++)
2145 WREG32(CP_ME_RAM_DATA,
2146 be32_to_cpup(fw_data++));
2148 fw_data = (const __be32 *)rdev->pfp_fw->data;
2149 WREG32(CP_PFP_UCODE_ADDR, 0);
2150 for (i = 0; i < PFP_UCODE_SIZE; i++)
2151 WREG32(CP_PFP_UCODE_DATA,
2152 be32_to_cpup(fw_data++));
2154 WREG32(CP_PFP_UCODE_ADDR, 0);
2155 WREG32(CP_ME_RAM_WADDR, 0);
2156 WREG32(CP_ME_RAM_RADDR, 0);
2157 return 0;
2158 }
2160 int r600_cp_start(struct radeon_device *rdev)
2161 {
2162 int r;
2163 uint32_t cp_me;
2165 r = radeon_ring_lock(rdev, 7);
2166 if (r) {
2167 DRM_ERROR("radeon: cp failed to lock ring (%d).\n", r);
2168 return r;
2169 }
2170 radeon_ring_write(rdev, PACKET3(PACKET3_ME_INITIALIZE, 5));
2171 radeon_ring_write(rdev, 0x1);
2172 if (rdev->family >= CHIP_RV770) {
2173 radeon_ring_write(rdev, 0x0);
2174 radeon_ring_write(rdev, rdev->config.rv770.max_hw_contexts - 1);
2175 } else {
2176 radeon_ring_write(rdev, 0x3);
2177 radeon_ring_write(rdev, rdev->config.r600.max_hw_contexts - 1);
2178 }
2179 radeon_ring_write(rdev, PACKET3_ME_INITIALIZE_DEVICE_ID(1));
2180 radeon_ring_write(rdev, 0);
2181 radeon_ring_write(rdev, 0);
2182 radeon_ring_unlock_commit(rdev);
2184 cp_me = 0xff;
2185 WREG32(R_0086D8_CP_ME_CNTL, cp_me);
2186 return 0;
2187 }
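/* r600_cp_resume() below re-arms the ring from scratch: soft-reset the
 * CP, program the ring size (byte-swapped on big-endian builds), point
 * the rptr/scratch writeback at the wb buffer, restore the ring base and
 * pointers, then kick r600_cp_start() and verify with a ring test. */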
2189 int r600_cp_resume(struct radeon_device *rdev)
2190 {
2191 u32 tmp;
2192 u32 rb_bufsz;
2193 int r;
2195 /* Reset cp */
2196 WREG32(GRBM_SOFT_RESET, SOFT_RESET_CP);
2197 RREG32(GRBM_SOFT_RESET);
2198 mdelay(15);
2199 WREG32(GRBM_SOFT_RESET, 0);
2201 /* Set ring buffer size */
2202 rb_bufsz = drm_order(rdev->cp.ring_size / 8);
2203 tmp = (drm_order(RADEON_GPU_PAGE_SIZE/8) << 8) | rb_bufsz;
2204 #ifdef __BIG_ENDIAN
2205 tmp |= BUF_SWAP_32BIT;
2206 #endif
2207 WREG32(CP_RB_CNTL, tmp);
2208 WREG32(CP_SEM_WAIT_TIMER, 0x4);
2210 /* Set the write pointer delay */
2211 WREG32(CP_RB_WPTR_DELAY, 0);
2213 /* Initialize the ring buffer's read and write pointers */
2214 WREG32(CP_RB_CNTL, tmp | RB_RPTR_WR_ENA);
2215 WREG32(CP_RB_RPTR_WR, 0);
2216 rdev->cp.wptr = 0;
2217 WREG32(CP_RB_WPTR, rdev->cp.wptr);
2219 /* set the wb address whether it's enabled or not */
2220 WREG32(CP_RB_RPTR_ADDR,
2221 ((rdev->wb.gpu_addr + RADEON_WB_CP_RPTR_OFFSET) & 0xFFFFFFFC));
2222 WREG32(CP_RB_RPTR_ADDR_HI, upper_32_bits(rdev->wb.gpu_addr + RADEON_WB_CP_RPTR_OFFSET) & 0xFF);
2223 WREG32(SCRATCH_ADDR, ((rdev->wb.gpu_addr + RADEON_WB_SCRATCH_OFFSET) >> 8) & 0xFFFFFFFF);
2225 if (rdev->wb.enabled)
2226 WREG32(SCRATCH_UMSK, 0xff);
2227 else {
2228 tmp |= RB_NO_UPDATE;
2229 WREG32(SCRATCH_UMSK, 0);
2230 }
2232 mdelay(1);
2233 WREG32(CP_RB_CNTL, tmp);
2235 WREG32(CP_RB_BASE, rdev->cp.gpu_addr >> 8);
2236 WREG32(CP_DEBUG, (1 << 27) | (1 << 28));
2238 rdev->cp.rptr = RREG32(CP_RB_RPTR);
2240 r600_cp_start(rdev);
2241 rdev->cp.ready = true;
2242 r = radeon_ring_test(rdev);
2243 if (r) {
2244 rdev->cp.ready = false;
2245 return r;
2246 }
2247 return 0;
2248 }
2250 void r600_cp_commit(struct radeon_device *rdev)
2251 {
2252 WREG32(CP_RB_WPTR, rdev->cp.wptr);
2253 (void)RREG32(CP_RB_WPTR);
2254 }
2256 void r600_ring_init(struct radeon_device *rdev, unsigned ring_size)
2257 {
2258 u32 rb_bufsz;
2260 /* Align ring size */
2261 rb_bufsz = drm_order(ring_size / 8);
2262 ring_size = (1 << (rb_bufsz + 1)) * 4;
2263 rdev->cp.ring_size = ring_size;
2264 rdev->cp.align_mask = 16 - 1;
2265 }
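/* Worked example for the default 1 MiB ring requested from r600_init()
 * below: drm_order(1048576 / 8) = 17, so ring_size becomes
 * (1 << 18) * 4 = 1048576 bytes (unchanged), and align_mask = 15 keeps
 * submissions aligned to 16 dwords. */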
2267 void r600_cp_fini(struct radeon_device *rdev)
2268 {
2269 r600_cp_stop(rdev);
2270 radeon_ring_fini(rdev);
2271 }
2274 /*
2275  * GPU scratch register helper functions.
2276  */
2277 void r600_scratch_init(struct radeon_device *rdev)
2278 {
2279 int i;
2281 rdev->scratch.num_reg = 7;
2282 rdev->scratch.reg_base = SCRATCH_REG0;
2283 for (i = 0; i < rdev->scratch.num_reg; i++) {
2284 rdev->scratch.free[i] = true;
2285 rdev->scratch.reg[i] = rdev->scratch.reg_base + (i * 4);
2286 }
2287 }
2289 int r600_ring_test(struct radeon_device *rdev)
2290 {
2291 uint32_t scratch;
2292 uint32_t tmp = 0;
2293 unsigned i;
2294 int r;
2296 r = radeon_scratch_get(rdev, &scratch);
2297 if (r) {
2298 DRM_ERROR("radeon: cp failed to get scratch reg (%d).\n", r);
2299 return r;
2300 }
2301 WREG32(scratch, 0xCAFEDEAD);
2302 r = radeon_ring_lock(rdev, 3);
2303 if (r) {
2304 DRM_ERROR("radeon: cp failed to lock ring (%d).\n", r);
2305 radeon_scratch_free(rdev, scratch);
2306 return r;
2307 }
2308 radeon_ring_write(rdev, PACKET3(PACKET3_SET_CONFIG_REG, 1));
2309 radeon_ring_write(rdev, ((scratch - PACKET3_SET_CONFIG_REG_OFFSET) >> 2));
2310 radeon_ring_write(rdev, 0xDEADBEEF);
2311 radeon_ring_unlock_commit(rdev);
2312 for (i = 0; i < rdev->usec_timeout; i++) {
2313 tmp = RREG32(scratch);
2314 if (tmp == 0xDEADBEEF)
2315 break;
2316 DRM_UDELAY(1);
2317 }
2318 if (i < rdev->usec_timeout) {
2319 DRM_INFO("ring test succeeded in %d usecs\n", i);
2320 } else {
2321 DRM_ERROR("radeon: ring test failed (scratch(0x%04X)=0x%08X)\n",
2322 scratch, tmp);
2323 r = -EINVAL;
2324 }
2325 radeon_scratch_free(rdev, scratch);
2326 return r;
2327 }
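/* The same scratch-register handshake is reused by r600_ib_test() further
 * down: seed the register with 0xCAFEDEAD, have the CP write 0xDEADBEEF
 * to it via a SET_CONFIG_REG packet, then poll until the value flips or
 * rdev->usec_timeout expires. */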
2329 void r600_fence_ring_emit(struct radeon_device *rdev,
2330 struct radeon_fence *fence)
2331 {
2332 if (rdev->wb.use_event) {
2333 u64 addr = rdev->wb.gpu_addr + R600_WB_EVENT_OFFSET +
2334 (u64)(rdev->fence_drv.scratch_reg - rdev->scratch.reg_base);
2335 /* EVENT_WRITE_EOP - flush caches, send int */
2336 radeon_ring_write(rdev, PACKET3(PACKET3_EVENT_WRITE_EOP, 4));
2337 radeon_ring_write(rdev, EVENT_TYPE(CACHE_FLUSH_AND_INV_EVENT_TS) | EVENT_INDEX(5));
2338 radeon_ring_write(rdev, addr & 0xffffffff);
2339 radeon_ring_write(rdev, (upper_32_bits(addr) & 0xff) | DATA_SEL(1) | INT_SEL(2));
2340 radeon_ring_write(rdev, fence->seq);
2341 radeon_ring_write(rdev, 0);
2342 } else {
2343 radeon_ring_write(rdev, PACKET3(PACKET3_EVENT_WRITE, 0));
2344 radeon_ring_write(rdev, EVENT_TYPE(CACHE_FLUSH_AND_INV_EVENT) | EVENT_INDEX(0));
2345 /* wait for 3D idle clean */
2346 radeon_ring_write(rdev, PACKET3(PACKET3_SET_CONFIG_REG, 1));
2347 radeon_ring_write(rdev, (WAIT_UNTIL - PACKET3_SET_CONFIG_REG_OFFSET) >> 2);
2348 radeon_ring_write(rdev, WAIT_3D_IDLE_bit | WAIT_3D_IDLECLEAN_bit);
2349 /* Emit fence sequence & fire IRQ */
2350 radeon_ring_write(rdev, PACKET3(PACKET3_SET_CONFIG_REG, 1));
2351 radeon_ring_write(rdev, ((rdev->fence_drv.scratch_reg - PACKET3_SET_CONFIG_REG_OFFSET) >> 2));
2352 radeon_ring_write(rdev, fence->seq);
2353 /* CP_INTERRUPT packet 3 no longer exists, use packet 0 */
2354 radeon_ring_write(rdev, PACKET0(CP_INT_STATUS, 0));
2355 radeon_ring_write(rdev, RB_INT_STAT);
2356 }
2357 }
2359 int r600_copy_blit(struct radeon_device *rdev,
2360 uint64_t src_offset,
2361 uint64_t dst_offset,
2362 unsigned num_gpu_pages,
2363 struct radeon_fence *fence)
2364 {
2365 int r;
2367 mutex_lock(&rdev->r600_blit.mutex);
2368 rdev->r600_blit.vb_ib = NULL;
2369 r = r600_blit_prepare_copy(rdev, num_gpu_pages);
2370 if (r) {
2371 if (rdev->r600_blit.vb_ib)
2372 radeon_ib_free(rdev, &rdev->r600_blit.vb_ib);
2373 mutex_unlock(&rdev->r600_blit.mutex);
2374 return r;
2375 }
2376 r600_kms_blit_copy(rdev, src_offset, dst_offset, num_gpu_pages);
2377 r600_blit_done_copy(rdev, fence);
2378 mutex_unlock(&rdev->r600_blit.mutex);
2379 return 0;
2380 }
2382 void r600_blit_suspend(struct radeon_device *rdev)
2383 {
2384 int r;
2386 /* unpin shaders bo */
2387 if (rdev->r600_blit.shader_obj) {
2388 r = radeon_bo_reserve(rdev->r600_blit.shader_obj, false);
2389 if (!r) {
2390 radeon_bo_unpin(rdev->r600_blit.shader_obj);
2391 radeon_bo_unreserve(rdev->r600_blit.shader_obj);
2392 }
2393 }
2394 }
2396 int r600_set_surface_reg(struct radeon_device *rdev, int reg,
2397 uint32_t tiling_flags, uint32_t pitch,
2398 uint32_t offset, uint32_t obj_size)
2399 {
2400 /* FIXME: implement */
2401 return 0;
2402 }
2404 void r600_clear_surface_reg(struct radeon_device *rdev, int reg)
2405 {
2406 /* FIXME: implement */
2407 }
2409 int r600_startup(struct radeon_device *rdev)
2410 {
2411 int r;
2413 /* enable pcie gen2 link */
2414 r600_pcie_gen2_enable(rdev);
2416 if (!rdev->me_fw || !rdev->pfp_fw || !rdev->rlc_fw) {
2417 r = r600_init_microcode(rdev);
2418 if (r) {
2419 DRM_ERROR("Failed to load firmware!\n");
2420 return r;
2421 }
2422 }
2424 r600_mc_program(rdev);
2425 if (rdev->flags & RADEON_IS_AGP) {
2426 r600_agp_enable(rdev);
2427 } else {
2428 r = r600_pcie_gart_enable(rdev);
2429 if (r)
2430 return r;
2431 }
2432 r600_gpu_init(rdev);
2433 r = r600_blit_init(rdev);
2434 if (r) {
2435 r600_blit_fini(rdev);
2436 rdev->asic->copy = NULL;
2437 dev_warn(rdev->dev, "failed blitter (%d) falling back to memcpy\n", r);
2438 }
2440 /* allocate wb buffer */
2441 r = radeon_wb_init(rdev);
2442 if (r)
2443 return r;
2445 /* Enable IRQ */
2446 r = r600_irq_init(rdev);
2447 if (r) {
2448 DRM_ERROR("radeon: IH init failed (%d).\n", r);
2449 radeon_irq_kms_fini(rdev);
2450 return r;
2451 }
2452 r600_irq_set(rdev);
2454 r = radeon_ring_init(rdev, rdev->cp.ring_size);
2455 if (r)
2456 return r;
2457 r = r600_cp_load_microcode(rdev);
2458 if (r)
2459 return r;
2460 r = r600_cp_resume(rdev);
2461 if (r)
2462 return r;
2464 return 0;
2465 }
2467 void r600_vga_set_state(struct radeon_device *rdev, bool state)
2468 {
2469 uint32_t temp;
2471 temp = RREG32(CONFIG_CNTL);
2472 if (state == false) {
2473 temp &= ~(1<<0);
2474 temp |= (1<<1);
2475 } else {
2476 temp &= ~(1<<1);
2477 }
2478 WREG32(CONFIG_CNTL, temp);
2479 }
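/* A hedged note on the CONFIG_CNTL bits used above: disabling VGA clears
 * bit 0 and sets bit 1, and re-enabling clears bit 1 again. This matches
 * the usual render/display VGA decode enables on these asics, though the
 * bit names are not spelled out in this file. */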
2481 int r600_resume(struct radeon_device *rdev)
2482 {
2483 int r;
2485 /* Do not reset GPU before posting, on r600 hw unlike on r500 hw,
2486  * posting will perform necessary task to bring back GPU into good
2487  * shape.
2488  */
2489 /* post card */
2490 atom_asic_init(rdev->mode_info.atom_context);
2492 r = r600_startup(rdev);
2493 if (r) {
2494 DRM_ERROR("r600 startup failed on resume\n");
2495 return r;
2496 }
2498 r = r600_ib_test(rdev);
2499 if (r) {
2500 DRM_ERROR("radeon: failed testing IB (%d).\n", r);
2501 return r;
2502 }
2504 r = r600_audio_init(rdev);
2505 if (r) {
2506 DRM_ERROR("radeon: audio resume failed\n");
2507 return r;
2508 }
2510 return r;
2511 }
2513 int r600_suspend(struct radeon_device *rdev)
2514 {
2515 r600_audio_fini(rdev);
2516 /* FIXME: we should wait for ring to be empty */
2517 r600_cp_stop(rdev);
2518 rdev->cp.ready = false;
2519 r600_irq_suspend(rdev);
2520 radeon_wb_disable(rdev);
2521 r600_pcie_gart_disable(rdev);
2522 r600_blit_suspend(rdev);
2524 return 0;
2525 }
2527 /* Plan is to move initialization into this function and use
2528  * helper functions so that radeon_device_init does pretty much
2529  * nothing more than calling asic specific functions. This
2530  * should also allow us to remove a bunch of callback functions
2531  * like vram_info.
2532  */
2533 int r600_init(struct radeon_device *rdev)
2534 {
2535 int r;
2537 if (r600_debugfs_mc_info_init(rdev)) {
2538 DRM_ERROR("Failed to register debugfs file for mc !\n");
2539 }
2540 /* This doesn't do much */
2541 r = radeon_gem_init(rdev);
2542 if (r)
2543 return r;
2544 /* Read BIOS */
2545 if (!radeon_get_bios(rdev)) {
2546 if (ASIC_IS_AVIVO(rdev))
2547 return -EINVAL;
2548 }
2549 /* Must be an ATOMBIOS */
2550 if (!rdev->is_atom_bios) {
2551 dev_err(rdev->dev, "Expecting atombios for R600 GPU\n");
2552 return -EINVAL;
2553 }
2554 r = radeon_atombios_init(rdev);
2555 if (r)
2556 return r;
2557 /* Post card if necessary */
2558 if (!radeon_card_posted(rdev)) {
2559 if (!rdev->bios) {
2560 dev_err(rdev->dev, "Card not posted and no BIOS - ignoring\n");
2561 return -EINVAL;
2562 }
2563 DRM_INFO("GPU not posted. posting now...\n");
2564 atom_asic_init(rdev->mode_info.atom_context);
2565 }
2566 /* Initialize scratch registers */
2567 r600_scratch_init(rdev);
2568 /* Initialize surface registers */
2569 radeon_surface_init(rdev);
2570 /* Initialize clocks */
2571 radeon_get_clock_info(rdev->ddev);
2572 /* Fence driver */
2573 r = radeon_fence_driver_init(rdev);
2574 if (r)
2575 return r;
2576 if (rdev->flags & RADEON_IS_AGP) {
2577 r = radeon_agp_init(rdev);
2578 if (r)
2579 radeon_agp_disable(rdev);
2580 }
2581 r = r600_mc_init(rdev);
2582 if (r)
2583 return r;
2584 /* Memory manager */
2585 r = radeon_bo_init(rdev);
2586 if (r)
2587 return r;
2589 r = radeon_irq_kms_init(rdev);
2590 if (r)
2591 return r;
2593 rdev->cp.ring_obj = NULL;
2594 r600_ring_init(rdev, 1024 * 1024);
2596 rdev->ih.ring_obj = NULL;
2597 r600_ih_ring_init(rdev, 64 * 1024);
2599 r = r600_pcie_gart_init(rdev);
2600 if (r)
2601 return r;
2603 rdev->accel_working = true;
2604 r = r600_startup(rdev);
2605 if (r) {
2606 dev_err(rdev->dev, "disabling GPU acceleration\n");
2607 r600_cp_fini(rdev);
2608 r600_irq_fini(rdev);
2609 radeon_wb_fini(rdev);
2610 radeon_irq_kms_fini(rdev);
2611 r600_pcie_gart_fini(rdev);
2612 rdev->accel_working = false;
2613 }
2614 if (rdev->accel_working) {
2615 r = radeon_ib_pool_init(rdev);
2616 if (r) {
2617 dev_err(rdev->dev, "IB initialization failed (%d).\n", r);
2618 rdev->accel_working = false;
2619 } else {
2620 r = r600_ib_test(rdev);
2621 if (r) {
2622 dev_err(rdev->dev, "IB test failed (%d).\n", r);
2623 rdev->accel_working = false;
2624 }
2625 }
2626 }
2628 r = r600_audio_init(rdev);
2629 if (r)
2630 return r; /* TODO error handling */
2631 return 0;
2632 }
2634 void r600_fini(struct radeon_device *rdev)
2635 {
2636 r600_audio_fini(rdev);
2637 r600_blit_fini(rdev);
2638 r600_cp_fini(rdev);
2639 r600_irq_fini(rdev);
2640 radeon_wb_fini(rdev);
2641 radeon_ib_pool_fini(rdev);
2642 radeon_irq_kms_fini(rdev);
2643 r600_pcie_gart_fini(rdev);
2644 radeon_agp_fini(rdev);
2645 radeon_gem_fini(rdev);
2646 radeon_fence_driver_fini(rdev);
2647 radeon_bo_fini(rdev);
2648 radeon_atombios_fini(rdev);
2649 kfree(rdev->bios);
2650 rdev->bios = NULL;
2651 }
2654 /*
2655  * CS stuff
2656  */
2657 void r600_ring_ib_execute(struct radeon_device *rdev, struct radeon_ib *ib)
2658 {
2659 /* FIXME: implement */
2660 radeon_ring_write(rdev, PACKET3(PACKET3_INDIRECT_BUFFER, 2));
2661 radeon_ring_write(rdev,
2662 #ifdef __BIG_ENDIAN
2663 (2 << 0) |
2664 #endif
2665 (ib->gpu_addr & 0xFFFFFFFC));
2666 radeon_ring_write(rdev, upper_32_bits(ib->gpu_addr) & 0xFF);
2667 radeon_ring_write(rdev, ib->length_dw);
2668 }
2670 int r600_ib_test(struct radeon_device *rdev)
2671 {
2672 struct radeon_ib *ib;
2673 uint32_t scratch;
2674 uint32_t tmp = 0;
2675 unsigned i;
2676 int r;
2678 r = radeon_scratch_get(rdev, &scratch);
2680 DRM_ERROR("radeon: failed to get scratch reg (%d).\n", r);
2683 WREG32(scratch, 0xCAFEDEAD);
2684 r = radeon_ib_get(rdev, &ib);
2686 DRM_ERROR("radeon: failed to get ib (%d).\n", r);
2689 ib->ptr[0] = PACKET3(PACKET3_SET_CONFIG_REG, 1);
2690 ib->ptr[1] = ((scratch - PACKET3_SET_CONFIG_REG_OFFSET) >> 2);
2691 ib->ptr[2] = 0xDEADBEEF;
2692 ib->ptr[3] = PACKET2(0);
2693 ib->ptr[4] = PACKET2(0);
2694 ib->ptr[5] = PACKET2(0);
2695 ib->ptr[6] = PACKET2(0);
2696 ib->ptr[7] = PACKET2(0);
2697 ib->ptr[8] = PACKET2(0);
2698 ib->ptr[9] = PACKET2(0);
2699 ib->ptr[10] = PACKET2(0);
2700 ib->ptr[11] = PACKET2(0);
2701 ib->ptr[12] = PACKET2(0);
2702 ib->ptr[13] = PACKET2(0);
2703 ib->ptr[14] = PACKET2(0);
2704 ib->ptr[15] = PACKET2(0);
2705 ib->length_dw = 16;
2706 r = radeon_ib_schedule(rdev, ib);
2707 if (r) {
2708 radeon_scratch_free(rdev, scratch);
2709 radeon_ib_free(rdev, &ib);
2710 DRM_ERROR("radeon: failed to schedule ib (%d).\n", r);
2711 return r;
2712 }
2713 r = radeon_fence_wait(ib->fence, false);
2714 if (r) {
2715 DRM_ERROR("radeon: fence wait failed (%d).\n", r);
2716 return r;
2717 }
2718 for (i = 0; i < rdev->usec_timeout; i++) {
2719 tmp = RREG32(scratch);
2720 if (tmp == 0xDEADBEEF)
2721 break;
2722 DRM_UDELAY(1);
2723 }
2724 if (i < rdev->usec_timeout) {
2725 DRM_INFO("ib test succeeded in %u usecs\n", i);
2726 } else {
2727 DRM_ERROR("radeon: ib test failed (scratch(0x%04X)=0x%08X)\n",
2728 scratch, tmp);
2729 r = -EINVAL;
2730 }
2731 radeon_scratch_free(rdev, scratch);
2732 radeon_ib_free(rdev, &ib);
2733 return r;
2734 }
2736 /*
2737  * Interrupts
2738  *
2739  * Interrupts use a ring buffer on r6xx/r7xx hardware. It works pretty
2740  * much the same as the CP ring buffer, but in reverse. Rather than the CPU
2741  * writing to the ring and the GPU consuming, the GPU writes to the ring
2742  * and the host consumes. As the host irq handler processes interrupts, it
2743  * increments the rptr. When the rptr catches up with the wptr, all the
2744  * current interrupts have been processed.
2745  */
2747 void r600_ih_ring_init(struct radeon_device *rdev, unsigned ring_size)
2748 {
2749 u32 rb_bufsz;
2751 /* Align ring size */
2752 rb_bufsz = drm_order(ring_size / 4);
2753 ring_size = (1 << rb_bufsz) * 4;
2754 rdev->ih.ring_size = ring_size;
2755 rdev->ih.ptr_mask = rdev->ih.ring_size - 1;
2756 rdev->ih.rptr = 0;
2757 }
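/* For the 64 KiB IH ring requested from r600_init():
 * drm_order(65536 / 4) = 14, so ring_size becomes (1 << 14) * 4 = 65536
 * bytes and ptr_mask is 0xffff, matching the byte-based rptr/wptr
 * arithmetic in r600_irq_process(). */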
2759 static int r600_ih_ring_alloc(struct radeon_device *rdev)
2760 {
2761 int r;
2763 /* Allocate ring buffer */
2764 if (rdev->ih.ring_obj == NULL) {
2765 r = radeon_bo_create(rdev, rdev->ih.ring_size,
2766 PAGE_SIZE, true,
2767 RADEON_GEM_DOMAIN_GTT,
2768 &rdev->ih.ring_obj);
2769 if (r) {
2770 DRM_ERROR("radeon: failed to create ih ring buffer (%d).\n", r);
2771 return r;
2772 }
2773 r = radeon_bo_reserve(rdev->ih.ring_obj, false);
2774 if (unlikely(r != 0))
2775 return r;
2776 r = radeon_bo_pin(rdev->ih.ring_obj,
2777 RADEON_GEM_DOMAIN_GTT,
2778 &rdev->ih.gpu_addr);
2779 if (r) {
2780 radeon_bo_unreserve(rdev->ih.ring_obj);
2781 DRM_ERROR("radeon: failed to pin ih ring buffer (%d).\n", r);
2782 return r;
2783 }
2784 r = radeon_bo_kmap(rdev->ih.ring_obj,
2785 (void **)&rdev->ih.ring);
2786 radeon_bo_unreserve(rdev->ih.ring_obj);
2787 if (r) {
2788 DRM_ERROR("radeon: failed to map ih ring buffer (%d).\n", r);
2789 return r;
2790 }
2791 }
2792 return 0;
2793 }
2795 static void r600_ih_ring_fini(struct radeon_device *rdev)
2796 {
2797 int r;
2798 if (rdev->ih.ring_obj) {
2799 r = radeon_bo_reserve(rdev->ih.ring_obj, false);
2800 if (likely(r == 0)) {
2801 radeon_bo_kunmap(rdev->ih.ring_obj);
2802 radeon_bo_unpin(rdev->ih.ring_obj);
2803 radeon_bo_unreserve(rdev->ih.ring_obj);
2804 }
2805 radeon_bo_unref(&rdev->ih.ring_obj);
2806 rdev->ih.ring = NULL;
2807 rdev->ih.ring_obj = NULL;
2808 }
2809 }
2811 void r600_rlc_stop(struct radeon_device *rdev)
2812 {
2814 if ((rdev->family >= CHIP_RV770) &&
2815 (rdev->family <= CHIP_RV740)) {
2816 /* r7xx asics need to soft reset RLC before halting */
2817 WREG32(SRBM_SOFT_RESET, SOFT_RESET_RLC);
2818 RREG32(SRBM_SOFT_RESET);
2819 udelay(15000);
2820 WREG32(SRBM_SOFT_RESET, 0);
2821 RREG32(SRBM_SOFT_RESET);
2822 }
2824 WREG32(RLC_CNTL, 0);
2825 }
2827 static void r600_rlc_start(struct radeon_device *rdev)
2828 {
2829 WREG32(RLC_CNTL, RLC_ENABLE);
2830 }
2832 static int r600_rlc_init(struct radeon_device *rdev)
2833 {
2834 u32 i;
2835 const __be32 *fw_data;
2837 if (!rdev->rlc_fw)
2838 return -EINVAL;
2840 r600_rlc_stop(rdev);
2842 WREG32(RLC_HB_BASE, 0);
2843 WREG32(RLC_HB_CNTL, 0);
2844 WREG32(RLC_HB_RPTR, 0);
2845 WREG32(RLC_HB_WPTR, 0);
2846 if (rdev->family <= CHIP_CAICOS) {
2847 WREG32(RLC_HB_WPTR_LSB_ADDR, 0);
2848 WREG32(RLC_HB_WPTR_MSB_ADDR, 0);
2849 }
2850 WREG32(RLC_MC_CNTL, 0);
2851 WREG32(RLC_UCODE_CNTL, 0);
2853 fw_data = (const __be32 *)rdev->rlc_fw->data;
2854 if (rdev->family >= CHIP_CAYMAN) {
2855 for (i = 0; i < CAYMAN_RLC_UCODE_SIZE; i++) {
2856 WREG32(RLC_UCODE_ADDR, i);
2857 WREG32(RLC_UCODE_DATA, be32_to_cpup(fw_data++));
2858 }
2859 } else if (rdev->family >= CHIP_CEDAR) {
2860 for (i = 0; i < EVERGREEN_RLC_UCODE_SIZE; i++) {
2861 WREG32(RLC_UCODE_ADDR, i);
2862 WREG32(RLC_UCODE_DATA, be32_to_cpup(fw_data++));
2863 }
2864 } else if (rdev->family >= CHIP_RV770) {
2865 for (i = 0; i < R700_RLC_UCODE_SIZE; i++) {
2866 WREG32(RLC_UCODE_ADDR, i);
2867 WREG32(RLC_UCODE_DATA, be32_to_cpup(fw_data++));
2868 }
2869 } else {
2870 for (i = 0; i < RLC_UCODE_SIZE; i++) {
2871 WREG32(RLC_UCODE_ADDR, i);
2872 WREG32(RLC_UCODE_DATA, be32_to_cpup(fw_data++));
2873 }
2874 }
2875 WREG32(RLC_UCODE_ADDR, 0);
2877 r600_rlc_start(rdev);
2879 return 0;
2880 }
2882 static void r600_enable_interrupts(struct radeon_device *rdev)
2883 {
2884 u32 ih_cntl = RREG32(IH_CNTL);
2885 u32 ih_rb_cntl = RREG32(IH_RB_CNTL);
2887 ih_cntl |= ENABLE_INTR;
2888 ih_rb_cntl |= IH_RB_ENABLE;
2889 WREG32(IH_CNTL, ih_cntl);
2890 WREG32(IH_RB_CNTL, ih_rb_cntl);
2891 rdev->ih.enabled = true;
2892 }
2894 void r600_disable_interrupts(struct radeon_device *rdev)
2895 {
2896 u32 ih_rb_cntl = RREG32(IH_RB_CNTL);
2897 u32 ih_cntl = RREG32(IH_CNTL);
2899 ih_rb_cntl &= ~IH_RB_ENABLE;
2900 ih_cntl &= ~ENABLE_INTR;
2901 WREG32(IH_RB_CNTL, ih_rb_cntl);
2902 WREG32(IH_CNTL, ih_cntl);
2903 /* set rptr, wptr to 0 */
2904 WREG32(IH_RB_RPTR, 0);
2905 WREG32(IH_RB_WPTR, 0);
2906 rdev->ih.enabled = false;
2907 }
2911 static void r600_disable_interrupt_state(struct radeon_device *rdev)
2912 {
2913 u32 tmp;
2915 WREG32(CP_INT_CNTL, CNTX_BUSY_INT_ENABLE | CNTX_EMPTY_INT_ENABLE);
2916 WREG32(GRBM_INT_CNTL, 0);
2917 WREG32(DxMODE_INT_MASK, 0);
2918 WREG32(D1GRPH_INTERRUPT_CONTROL, 0);
2919 WREG32(D2GRPH_INTERRUPT_CONTROL, 0);
2920 if (ASIC_IS_DCE3(rdev)) {
2921 WREG32(DCE3_DACA_AUTODETECT_INT_CONTROL, 0);
2922 WREG32(DCE3_DACB_AUTODETECT_INT_CONTROL, 0);
2923 tmp = RREG32(DC_HPD1_INT_CONTROL) & DC_HPDx_INT_POLARITY;
2924 WREG32(DC_HPD1_INT_CONTROL, tmp);
2925 tmp = RREG32(DC_HPD2_INT_CONTROL) & DC_HPDx_INT_POLARITY;
2926 WREG32(DC_HPD2_INT_CONTROL, tmp);
2927 tmp = RREG32(DC_HPD3_INT_CONTROL) & DC_HPDx_INT_POLARITY;
2928 WREG32(DC_HPD3_INT_CONTROL, tmp);
2929 tmp = RREG32(DC_HPD4_INT_CONTROL) & DC_HPDx_INT_POLARITY;
2930 WREG32(DC_HPD4_INT_CONTROL, tmp);
2931 if (ASIC_IS_DCE32(rdev)) {
2932 tmp = RREG32(DC_HPD5_INT_CONTROL) & DC_HPDx_INT_POLARITY;
2933 WREG32(DC_HPD5_INT_CONTROL, tmp);
2934 tmp = RREG32(DC_HPD6_INT_CONTROL) & DC_HPDx_INT_POLARITY;
2935 WREG32(DC_HPD6_INT_CONTROL, tmp);
2936 }
2937 } else {
2938 WREG32(DACA_AUTODETECT_INT_CONTROL, 0);
2939 WREG32(DACB_AUTODETECT_INT_CONTROL, 0);
2940 tmp = RREG32(DC_HOT_PLUG_DETECT1_INT_CONTROL) & DC_HOT_PLUG_DETECTx_INT_POLARITY;
2941 WREG32(DC_HOT_PLUG_DETECT1_INT_CONTROL, tmp);
2942 tmp = RREG32(DC_HOT_PLUG_DETECT2_INT_CONTROL) & DC_HOT_PLUG_DETECTx_INT_POLARITY;
2943 WREG32(DC_HOT_PLUG_DETECT2_INT_CONTROL, tmp);
2944 tmp = RREG32(DC_HOT_PLUG_DETECT3_INT_CONTROL) & DC_HOT_PLUG_DETECTx_INT_POLARITY;
2945 WREG32(DC_HOT_PLUG_DETECT3_INT_CONTROL, tmp);
2946 }
2947 }
2949 int r600_irq_init(struct radeon_device *rdev)
2950 {
2951 int ret = 0;
2952 int rb_bufsz;
2953 u32 interrupt_cntl, ih_cntl, ih_rb_cntl;
2955 /* allocate ring */
2956 ret = r600_ih_ring_alloc(rdev);
2957 if (ret)
2958 return ret;
2960 /* disable irqs */
2961 r600_disable_interrupts(rdev);
2963 /* init rlc */
2964 ret = r600_rlc_init(rdev);
2965 if (ret) {
2966 r600_ih_ring_fini(rdev);
2967 return ret;
2968 }
2970 /* setup interrupt control */
2971 /* set dummy read address to ring address */
2972 WREG32(INTERRUPT_CNTL2, rdev->ih.gpu_addr >> 8);
2973 interrupt_cntl = RREG32(INTERRUPT_CNTL);
2974 /* IH_DUMMY_RD_OVERRIDE=0 - dummy read disabled with msi, enabled without msi
2975  * IH_DUMMY_RD_OVERRIDE=1 - dummy read controlled by IH_DUMMY_RD_EN
2976  */
2977 interrupt_cntl &= ~IH_DUMMY_RD_OVERRIDE;
2978 /* IH_REQ_NONSNOOP_EN=1 if ring is in non-cacheable memory, e.g., vram */
2979 interrupt_cntl &= ~IH_REQ_NONSNOOP_EN;
2980 WREG32(INTERRUPT_CNTL, interrupt_cntl);
2982 WREG32(IH_RB_BASE, rdev->ih.gpu_addr >> 8);
2983 rb_bufsz = drm_order(rdev->ih.ring_size / 4);
2985 ih_rb_cntl = (IH_WPTR_OVERFLOW_ENABLE |
2986 IH_WPTR_OVERFLOW_CLEAR |
2987 (rb_bufsz << 1));
2989 if (rdev->wb.enabled)
2990 ih_rb_cntl |= IH_WPTR_WRITEBACK_ENABLE;
2992 /* set the writeback address whether it's enabled or not */
2993 WREG32(IH_RB_WPTR_ADDR_LO, (rdev->wb.gpu_addr + R600_WB_IH_WPTR_OFFSET) & 0xFFFFFFFC);
2994 WREG32(IH_RB_WPTR_ADDR_HI, upper_32_bits(rdev->wb.gpu_addr + R600_WB_IH_WPTR_OFFSET) & 0xFF);
2996 WREG32(IH_RB_CNTL, ih_rb_cntl);
2998 /* set rptr, wptr to 0 */
2999 WREG32(IH_RB_RPTR, 0);
3000 WREG32(IH_RB_WPTR, 0);
3002 /* Default settings for IH_CNTL (disabled at first) */
3003 ih_cntl = MC_WRREQ_CREDIT(0x10) | MC_WR_CLEAN_CNT(0x10);
3004 /* RPTR_REARM only works if msi's are enabled */
3005 if (rdev->msi_enabled)
3006 ih_cntl |= RPTR_REARM;
3007 WREG32(IH_CNTL, ih_cntl);
3009 /* force the active interrupt state to all disabled */
3010 if (rdev->family >= CHIP_CEDAR)
3011 evergreen_disable_interrupt_state(rdev);
3012 else
3013 r600_disable_interrupt_state(rdev);
3015 /* enable irqs */
3016 r600_enable_interrupts(rdev);
3018 return ret;
3019 }
3021 void r600_irq_suspend(struct radeon_device *rdev)
3022 {
3023 r600_irq_disable(rdev);
3024 r600_rlc_stop(rdev);
3025 }
3027 void r600_irq_fini(struct radeon_device *rdev)
3028 {
3029 r600_irq_suspend(rdev);
3030 r600_ih_ring_fini(rdev);
3031 }
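/* r600_irq_set() below rebuilds every interrupt-enable register from the
 * software state in rdev->irq: it first snapshots the current HDMI/HPD
 * control values with their enable bits masked off, ORs an enable back in
 * for each requested source, and finally writes the whole set out, so one
 * call always reflects exactly what the driver currently wants. */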
3033 int r600_irq_set(struct radeon_device *rdev)
3034 {
3035 u32 cp_int_cntl = CNTX_BUSY_INT_ENABLE | CNTX_EMPTY_INT_ENABLE;
3036 u32 mode_int = 0;
3037 u32 hpd1, hpd2, hpd3, hpd4 = 0, hpd5 = 0, hpd6 = 0;
3038 u32 grbm_int_cntl = 0;
3039 u32 hdmi1, hdmi2;
3040 u32 d1grph = 0, d2grph = 0;
3042 if (!rdev->irq.installed) {
3043 WARN(1, "Can't enable IRQ/MSI because no handler is installed\n");
3044 return -EINVAL;
3045 }
3046 /* don't enable anything if the ih is disabled */
3047 if (!rdev->ih.enabled) {
3048 r600_disable_interrupts(rdev);
3049 /* force the active interrupt state to all disabled */
3050 r600_disable_interrupt_state(rdev);
3051 return 0;
3052 }
3054 hdmi1 = RREG32(R600_HDMI_BLOCK1 + R600_HDMI_CNTL) & ~R600_HDMI_INT_EN;
3055 if (ASIC_IS_DCE3(rdev)) {
3056 hdmi2 = RREG32(R600_HDMI_BLOCK3 + R600_HDMI_CNTL) & ~R600_HDMI_INT_EN;
3057 hpd1 = RREG32(DC_HPD1_INT_CONTROL) & ~DC_HPDx_INT_EN;
3058 hpd2 = RREG32(DC_HPD2_INT_CONTROL) & ~DC_HPDx_INT_EN;
3059 hpd3 = RREG32(DC_HPD3_INT_CONTROL) & ~DC_HPDx_INT_EN;
3060 hpd4 = RREG32(DC_HPD4_INT_CONTROL) & ~DC_HPDx_INT_EN;
3061 if (ASIC_IS_DCE32(rdev)) {
3062 hpd5 = RREG32(DC_HPD5_INT_CONTROL) & ~DC_HPDx_INT_EN;
3063 hpd6 = RREG32(DC_HPD6_INT_CONTROL) & ~DC_HPDx_INT_EN;
3064 }
3065 } else {
3066 hdmi2 = RREG32(R600_HDMI_BLOCK2 + R600_HDMI_CNTL) & ~R600_HDMI_INT_EN;
3067 hpd1 = RREG32(DC_HOT_PLUG_DETECT1_INT_CONTROL) & ~DC_HPDx_INT_EN;
3068 hpd2 = RREG32(DC_HOT_PLUG_DETECT2_INT_CONTROL) & ~DC_HPDx_INT_EN;
3069 hpd3 = RREG32(DC_HOT_PLUG_DETECT3_INT_CONTROL) & ~DC_HPDx_INT_EN;
3070 }
3072 if (rdev->irq.sw_int) {
3073 DRM_DEBUG("r600_irq_set: sw int\n");
3074 cp_int_cntl |= RB_INT_ENABLE;
3075 cp_int_cntl |= TIME_STAMP_INT_ENABLE;
3076 }
3077 if (rdev->irq.crtc_vblank_int[0] ||
3078 rdev->irq.pflip[0]) {
3079 DRM_DEBUG("r600_irq_set: vblank 0\n");
3080 mode_int |= D1MODE_VBLANK_INT_MASK;
3081 }
3082 if (rdev->irq.crtc_vblank_int[1] ||
3083 rdev->irq.pflip[1]) {
3084 DRM_DEBUG("r600_irq_set: vblank 1\n");
3085 mode_int |= D2MODE_VBLANK_INT_MASK;
3086 }
3087 if (rdev->irq.hpd[0]) {
3088 DRM_DEBUG("r600_irq_set: hpd 1\n");
3089 hpd1 |= DC_HPDx_INT_EN;
3090 }
3091 if (rdev->irq.hpd[1]) {
3092 DRM_DEBUG("r600_irq_set: hpd 2\n");
3093 hpd2 |= DC_HPDx_INT_EN;
3094 }
3095 if (rdev->irq.hpd[2]) {
3096 DRM_DEBUG("r600_irq_set: hpd 3\n");
3097 hpd3 |= DC_HPDx_INT_EN;
3098 }
3099 if (rdev->irq.hpd[3]) {
3100 DRM_DEBUG("r600_irq_set: hpd 4\n");
3101 hpd4 |= DC_HPDx_INT_EN;
3102 }
3103 if (rdev->irq.hpd[4]) {
3104 DRM_DEBUG("r600_irq_set: hpd 5\n");
3105 hpd5 |= DC_HPDx_INT_EN;
3106 }
3107 if (rdev->irq.hpd[5]) {
3108 DRM_DEBUG("r600_irq_set: hpd 6\n");
3109 hpd6 |= DC_HPDx_INT_EN;
3110 }
3111 if (rdev->irq.hdmi[0]) {
3112 DRM_DEBUG("r600_irq_set: hdmi 1\n");
3113 hdmi1 |= R600_HDMI_INT_EN;
3114 }
3115 if (rdev->irq.hdmi[1]) {
3116 DRM_DEBUG("r600_irq_set: hdmi 2\n");
3117 hdmi2 |= R600_HDMI_INT_EN;
3118 }
3119 if (rdev->irq.gui_idle) {
3120 DRM_DEBUG("gui idle\n");
3121 grbm_int_cntl |= GUI_IDLE_INT_ENABLE;
3122 }
3124 WREG32(CP_INT_CNTL, cp_int_cntl);
3125 WREG32(DxMODE_INT_MASK, mode_int);
3126 WREG32(D1GRPH_INTERRUPT_CONTROL, d1grph);
3127 WREG32(D2GRPH_INTERRUPT_CONTROL, d2grph);
3128 WREG32(GRBM_INT_CNTL, grbm_int_cntl);
3129 WREG32(R600_HDMI_BLOCK1 + R600_HDMI_CNTL, hdmi1);
3130 if (ASIC_IS_DCE3(rdev)) {
3131 WREG32(R600_HDMI_BLOCK3 + R600_HDMI_CNTL, hdmi2);
3132 WREG32(DC_HPD1_INT_CONTROL, hpd1);
3133 WREG32(DC_HPD2_INT_CONTROL, hpd2);
3134 WREG32(DC_HPD3_INT_CONTROL, hpd3);
3135 WREG32(DC_HPD4_INT_CONTROL, hpd4);
3136 if (ASIC_IS_DCE32(rdev)) {
3137 WREG32(DC_HPD5_INT_CONTROL, hpd5);
3138 WREG32(DC_HPD6_INT_CONTROL, hpd6);
3139 }
3140 } else {
3141 WREG32(R600_HDMI_BLOCK2 + R600_HDMI_CNTL, hdmi2);
3142 WREG32(DC_HOT_PLUG_DETECT1_INT_CONTROL, hpd1);
3143 WREG32(DC_HOT_PLUG_DETECT2_INT_CONTROL, hpd2);
3144 WREG32(DC_HOT_PLUG_DETECT3_INT_CONTROL, hpd3);
3145 }
3147 return 0;
3148 }
3150 static void r600_irq_ack(struct radeon_device *rdev)
3151 {
3152 u32 tmp;
3154 if (ASIC_IS_DCE3(rdev)) {
3155 rdev->irq.stat_regs.r600.disp_int = RREG32(DCE3_DISP_INTERRUPT_STATUS);
3156 rdev->irq.stat_regs.r600.disp_int_cont = RREG32(DCE3_DISP_INTERRUPT_STATUS_CONTINUE);
3157 rdev->irq.stat_regs.r600.disp_int_cont2 = RREG32(DCE3_DISP_INTERRUPT_STATUS_CONTINUE2);
3158 } else {
3159 rdev->irq.stat_regs.r600.disp_int = RREG32(DISP_INTERRUPT_STATUS);
3160 rdev->irq.stat_regs.r600.disp_int_cont = RREG32(DISP_INTERRUPT_STATUS_CONTINUE);
3161 rdev->irq.stat_regs.r600.disp_int_cont2 = 0;
3162 }
3163 rdev->irq.stat_regs.r600.d1grph_int = RREG32(D1GRPH_INTERRUPT_STATUS);
3164 rdev->irq.stat_regs.r600.d2grph_int = RREG32(D2GRPH_INTERRUPT_STATUS);
3166 if (rdev->irq.stat_regs.r600.d1grph_int & DxGRPH_PFLIP_INT_OCCURRED)
3167 WREG32(D1GRPH_INTERRUPT_STATUS, DxGRPH_PFLIP_INT_CLEAR);
3168 if (rdev->irq.stat_regs.r600.d2grph_int & DxGRPH_PFLIP_INT_OCCURRED)
3169 WREG32(D2GRPH_INTERRUPT_STATUS, DxGRPH_PFLIP_INT_CLEAR);
3170 if (rdev->irq.stat_regs.r600.disp_int & LB_D1_VBLANK_INTERRUPT)
3171 WREG32(D1MODE_VBLANK_STATUS, DxMODE_VBLANK_ACK);
3172 if (rdev->irq.stat_regs.r600.disp_int & LB_D1_VLINE_INTERRUPT)
3173 WREG32(D1MODE_VLINE_STATUS, DxMODE_VLINE_ACK);
3174 if (rdev->irq.stat_regs.r600.disp_int & LB_D2_VBLANK_INTERRUPT)
3175 WREG32(D2MODE_VBLANK_STATUS, DxMODE_VBLANK_ACK);
3176 if (rdev->irq.stat_regs.r600.disp_int & LB_D2_VLINE_INTERRUPT)
3177 WREG32(D2MODE_VLINE_STATUS, DxMODE_VLINE_ACK);
3178 if (rdev->irq.stat_regs.r600.disp_int & DC_HPD1_INTERRUPT) {
3179 if (ASIC_IS_DCE3(rdev)) {
3180 tmp = RREG32(DC_HPD1_INT_CONTROL);
3181 tmp |= DC_HPDx_INT_ACK;
3182 WREG32(DC_HPD1_INT_CONTROL, tmp);
3183 } else {
3184 tmp = RREG32(DC_HOT_PLUG_DETECT1_INT_CONTROL);
3185 tmp |= DC_HPDx_INT_ACK;
3186 WREG32(DC_HOT_PLUG_DETECT1_INT_CONTROL, tmp);
3187 }
3188 }
3189 if (rdev->irq.stat_regs.r600.disp_int & DC_HPD2_INTERRUPT) {
3190 if (ASIC_IS_DCE3(rdev)) {
3191 tmp = RREG32(DC_HPD2_INT_CONTROL);
3192 tmp |= DC_HPDx_INT_ACK;
3193 WREG32(DC_HPD2_INT_CONTROL, tmp);
3194 } else {
3195 tmp = RREG32(DC_HOT_PLUG_DETECT2_INT_CONTROL);
3196 tmp |= DC_HPDx_INT_ACK;
3197 WREG32(DC_HOT_PLUG_DETECT2_INT_CONTROL, tmp);
3198 }
3199 }
3200 if (rdev->irq.stat_regs.r600.disp_int_cont & DC_HPD3_INTERRUPT) {
3201 if (ASIC_IS_DCE3(rdev)) {
3202 tmp = RREG32(DC_HPD3_INT_CONTROL);
3203 tmp |= DC_HPDx_INT_ACK;
3204 WREG32(DC_HPD3_INT_CONTROL, tmp);
3205 } else {
3206 tmp = RREG32(DC_HOT_PLUG_DETECT3_INT_CONTROL);
3207 tmp |= DC_HPDx_INT_ACK;
3208 WREG32(DC_HOT_PLUG_DETECT3_INT_CONTROL, tmp);
3209 }
3210 }
3211 if (rdev->irq.stat_regs.r600.disp_int_cont & DC_HPD4_INTERRUPT) {
3212 tmp = RREG32(DC_HPD4_INT_CONTROL);
3213 tmp |= DC_HPDx_INT_ACK;
3214 WREG32(DC_HPD4_INT_CONTROL, tmp);
3215 }
3216 if (ASIC_IS_DCE32(rdev)) {
3217 if (rdev->irq.stat_regs.r600.disp_int_cont2 & DC_HPD5_INTERRUPT) {
3218 tmp = RREG32(DC_HPD5_INT_CONTROL);
3219 tmp |= DC_HPDx_INT_ACK;
3220 WREG32(DC_HPD5_INT_CONTROL, tmp);
3221 }
3222 if (rdev->irq.stat_regs.r600.disp_int_cont2 & DC_HPD6_INTERRUPT) {
3223 tmp = RREG32(DC_HPD6_INT_CONTROL);
3224 tmp |= DC_HPDx_INT_ACK;
3225 WREG32(DC_HPD6_INT_CONTROL, tmp);
3226 }
3227 }
3228 if (RREG32(R600_HDMI_BLOCK1 + R600_HDMI_STATUS) & R600_HDMI_INT_PENDING) {
3229 WREG32_P(R600_HDMI_BLOCK1 + R600_HDMI_CNTL, R600_HDMI_INT_ACK, ~R600_HDMI_INT_ACK);
3230 }
3231 if (ASIC_IS_DCE3(rdev)) {
3232 if (RREG32(R600_HDMI_BLOCK3 + R600_HDMI_STATUS) & R600_HDMI_INT_PENDING) {
3233 WREG32_P(R600_HDMI_BLOCK3 + R600_HDMI_CNTL, R600_HDMI_INT_ACK, ~R600_HDMI_INT_ACK);
3234 }
3235 } else {
3236 if (RREG32(R600_HDMI_BLOCK2 + R600_HDMI_STATUS) & R600_HDMI_INT_PENDING) {
3237 WREG32_P(R600_HDMI_BLOCK2 + R600_HDMI_CNTL, R600_HDMI_INT_ACK, ~R600_HDMI_INT_ACK);
3238 }
3239 }
3240 }
3242 void r600_irq_disable(struct radeon_device *rdev)
3243 {
3244 r600_disable_interrupts(rdev);
3245 /* Wait and acknowledge irq */
3246 mdelay(1);
3247 r600_irq_ack(rdev);
3248 r600_disable_interrupt_state(rdev);
3249 }
3251 static u32 r600_get_ih_wptr(struct radeon_device *rdev)
3252 {
3253 u32 wptr, tmp;
3255 if (rdev->wb.enabled)
3256 wptr = le32_to_cpu(rdev->wb.wb[R600_WB_IH_WPTR_OFFSET/4]);
3257 else
3258 wptr = RREG32(IH_RB_WPTR);
3260 if (wptr & RB_OVERFLOW) {
3261 /* When a ring buffer overflow happens, start parsing interrupts
3262  * from the last not overwritten vector (wptr + 16). Hopefully
3263  * this should allow us to catch up.
3264  */
3265 dev_warn(rdev->dev, "IH ring buffer overflow (0x%08X, %d, %d)\n",
3266 wptr, rdev->ih.rptr, (wptr + 16) + rdev->ih.ptr_mask);
3267 rdev->ih.rptr = (wptr + 16) & rdev->ih.ptr_mask;
3268 tmp = RREG32(IH_RB_CNTL);
3269 tmp |= IH_WPTR_OVERFLOW_CLEAR;
3270 WREG32(IH_RB_CNTL, tmp);
3271 }
3272 return (wptr & rdev->ih.ptr_mask);
3273 }
3275 /*        r600 IV Ring
3276  * Each IV ring entry is 128 bits:
3277  * [7:0]    - interrupt source id
3278  * [31:8]   - reserved
3279  * [59:32]  - interrupt source data
3280  * [127:60] - reserved
3281  *
3282  * The basic interrupt vector entries
3283  * are decoded as follows:
3284  * src_id  src_data  description
3285  *      1         0  D1 vblank
3286  *      1         1  D1 vline
3287  *      5         0  D2 vblank
3288  *      5         1  D2 vline
3289  *     19         0  FP Hot plug detection A
3290  *     19         1  FP Hot plug detection B
3291  *     19         2  DAC A auto-detection
3292  *     19         3  DAC B auto-detection
3293  *     21         4  HDMI block A
3294  *     21         5  HDMI block B
3295  *    176         -  CP_INT RB
3296  *    177         -  CP_INT IB1
3297  *    178         -  CP_INT IB2
3298  *    181         -  EOP Interrupt
3299  *    233         -  GUI Idle
3300  *
3301  * Note, these are based on r600 and may need to be
3302  * adjusted or added to on newer asics
3303  */
3305 int r600_irq_process(struct radeon_device *rdev)
3306 {
3307 u32 wptr;
3308 u32 rptr;
3309 u32 src_id, src_data;
3310 u32 ring_index;
3311 unsigned long flags;
3312 bool queue_hotplug = false;
3314 if (!rdev->ih.enabled || rdev->shutdown)
3315 return IRQ_NONE;
3317 /* No MSIs, need a dummy read to flush PCI DMAs */
3318 if (!rdev->msi_enabled)
3319 RREG32(IH_RB_WPTR);
3321 wptr = r600_get_ih_wptr(rdev);
3322 rptr = rdev->ih.rptr;
3323 DRM_DEBUG("r600_irq_process start: rptr %d, wptr %d\n", rptr, wptr);
3325 spin_lock_irqsave(&rdev->ih.lock, flags);
3327 if (rptr == wptr) {
3328 spin_unlock_irqrestore(&rdev->ih.lock, flags);
3329 return IRQ_NONE;
3330 }
3332 restart_ih:
3333 /* Order reading of wptr vs. reading of IH ring data */
3334 rmb();
3336 /* display interrupts */
3337 r600_irq_ack(rdev);
3339 rdev->ih.wptr = wptr;
3340 while (rptr != wptr) {
3341 /* wptr/rptr are in bytes! */
3342 ring_index = rptr / 4;
3343 src_id = le32_to_cpu(rdev->ih.ring[ring_index]) & 0xff;
3344 src_data = le32_to_cpu(rdev->ih.ring[ring_index + 1]) & 0xfffffff;
3346 switch (src_id) {
3347 case 1: /* D1 vblank/vline */
3348 switch (src_data) {
3349 case 0: /* D1 vblank */
3350 if (rdev->irq.stat_regs.r600.disp_int & LB_D1_VBLANK_INTERRUPT) {
3351 if (rdev->irq.crtc_vblank_int[0]) {
3352 drm_handle_vblank(rdev->ddev, 0);
3353 rdev->pm.vblank_sync = true;
3354 wake_up(&rdev->irq.vblank_queue);
3355 }
3356 if (rdev->irq.pflip[0])
3357 radeon_crtc_handle_flip(rdev, 0);
3358 rdev->irq.stat_regs.r600.disp_int &= ~LB_D1_VBLANK_INTERRUPT;
3359 DRM_DEBUG("IH: D1 vblank\n");
3362 case 1: /* D1 vline */
3363 if (rdev->irq.stat_regs.r600.disp_int & LB_D1_VLINE_INTERRUPT) {
3364 rdev->irq.stat_regs.r600.disp_int &= ~LB_D1_VLINE_INTERRUPT;
3365 DRM_DEBUG("IH: D1 vline\n");
3369 DRM_DEBUG("Unhandled interrupt: %d %d\n", src_id, src_data);
3373 case 5: /* D2 vblank/vline */
3375 case 0: /* D2 vblank */
3376 if (rdev->irq.stat_regs.r600.disp_int & LB_D2_VBLANK_INTERRUPT) {
3377 if (rdev->irq.crtc_vblank_int[1]) {
3378 drm_handle_vblank(rdev->ddev, 1);
3379 rdev->pm.vblank_sync = true;
3380 wake_up(&rdev->irq.vblank_queue);
3381 }
3382 if (rdev->irq.pflip[1])
3383 radeon_crtc_handle_flip(rdev, 1);
3384 rdev->irq.stat_regs.r600.disp_int &= ~LB_D2_VBLANK_INTERRUPT;
3385 DRM_DEBUG("IH: D2 vblank\n");
3388 case 1: /* D1 vline */
3389 if (rdev->irq.stat_regs.r600.disp_int & LB_D2_VLINE_INTERRUPT) {
3390 rdev->irq.stat_regs.r600.disp_int &= ~LB_D2_VLINE_INTERRUPT;
3391 DRM_DEBUG("IH: D2 vline\n");
3395 DRM_DEBUG("Unhandled interrupt: %d %d\n", src_id, src_data);
3399 case 19: /* HPD/DAC hotplug */
3402 if (rdev->irq.stat_regs.r600.disp_int & DC_HPD1_INTERRUPT) {
3403 rdev->irq.stat_regs.r600.disp_int &= ~DC_HPD1_INTERRUPT;
3404 queue_hotplug = true;
3405 DRM_DEBUG("IH: HPD1\n");
3409 if (rdev->irq.stat_regs.r600.disp_int & DC_HPD2_INTERRUPT) {
3410 rdev->irq.stat_regs.r600.disp_int &= ~DC_HPD2_INTERRUPT;
3411 queue_hotplug = true;
3412 DRM_DEBUG("IH: HPD2\n");
3416 if (rdev->irq.stat_regs.r600.disp_int_cont & DC_HPD3_INTERRUPT) {
3417 rdev->irq.stat_regs.r600.disp_int_cont &= ~DC_HPD3_INTERRUPT;
3418 queue_hotplug = true;
3419 DRM_DEBUG("IH: HPD3\n");
3423 if (rdev->irq.stat_regs.r600.disp_int_cont & DC_HPD4_INTERRUPT) {
3424 rdev->irq.stat_regs.r600.disp_int_cont &= ~DC_HPD4_INTERRUPT;
3425 queue_hotplug = true;
3426 DRM_DEBUG("IH: HPD4\n");
3430 if (rdev->irq.stat_regs.r600.disp_int_cont2 & DC_HPD5_INTERRUPT) {
3431 rdev->irq.stat_regs.r600.disp_int_cont2 &= ~DC_HPD5_INTERRUPT;
3432 queue_hotplug = true;
3433 DRM_DEBUG("IH: HPD5\n");
3437 if (rdev->irq.stat_regs.r600.disp_int_cont2 & DC_HPD6_INTERRUPT) {
3438 rdev->irq.stat_regs.r600.disp_int_cont2 &= ~DC_HPD6_INTERRUPT;
3439 queue_hotplug = true;
3440 DRM_DEBUG("IH: HPD6\n");
3444 DRM_DEBUG("Unhandled interrupt: %d %d\n", src_id, src_data);
3449 DRM_DEBUG("IH: HDMI: 0x%x\n", src_data);
3450 r600_audio_schedule_polling(rdev);
3452 case 176: /* CP_INT in ring buffer */
3453 case 177: /* CP_INT in IB1 */
3454 case 178: /* CP_INT in IB2 */
3455 DRM_DEBUG("IH: CP int: 0x%08x\n", src_data);
3456 radeon_fence_process(rdev);
3457 break;
3458 case 181: /* CP EOP event */
3459 DRM_DEBUG("IH: CP EOP\n");
3460 radeon_fence_process(rdev);
3461 break;
3462 case 233: /* GUI IDLE */
3463 DRM_DEBUG("IH: GUI idle\n");
3464 rdev->pm.gui_idle = true;
3465 wake_up(&rdev->irq.idle_queue);
3466 break;
3467 default:
3468 DRM_DEBUG("Unhandled interrupt: %d %d\n", src_id, src_data);
3469 break;
3470 }
3472 /* wptr/rptr are in bytes! */
3473 rptr += 16;
3474 rptr &= rdev->ih.ptr_mask;
3475 }
3476 /* make sure wptr hasn't changed while processing */
3477 wptr = r600_get_ih_wptr(rdev);
3478 if (wptr != rdev->ih.wptr)
3479 goto restart_ih;
3480 if (queue_hotplug)
3481 schedule_work(&rdev->hotplug_work);
3482 rdev->ih.rptr = rptr;
3483 WREG32(IH_RB_RPTR, rdev->ih.rptr);
3484 spin_unlock_irqrestore(&rdev->ih.lock, flags);
3485 return IRQ_HANDLED;
3486 }
3488 /*
3489  * Debugfs info
3490  */
3491 #if defined(CONFIG_DEBUG_FS)
3493 static int r600_debugfs_cp_ring_info(struct seq_file *m, void *data)
3494 {
3495 struct drm_info_node *node = (struct drm_info_node *) m->private;
3496 struct drm_device *dev = node->minor->dev;
3497 struct radeon_device *rdev = dev->dev_private;
3498 unsigned count, i, j;
3500 radeon_ring_free_size(rdev);
3501 count = (rdev->cp.ring_size / 4) - rdev->cp.ring_free_dw;
3502 seq_printf(m, "CP_STAT 0x%08x\n", RREG32(CP_STAT));
3503 seq_printf(m, "CP_RB_WPTR 0x%08x\n", RREG32(CP_RB_WPTR));
3504 seq_printf(m, "CP_RB_RPTR 0x%08x\n", RREG32(CP_RB_RPTR));
3505 seq_printf(m, "driver's copy of the CP_RB_WPTR 0x%08x\n", rdev->cp.wptr);
3506 seq_printf(m, "driver's copy of the CP_RB_RPTR 0x%08x\n", rdev->cp.rptr);
3507 seq_printf(m, "%u free dwords in ring\n", rdev->cp.ring_free_dw);
3508 seq_printf(m, "%u dwords in ring\n", count);
3510 for (j = 0; j <= count; j++) {
3511 seq_printf(m, "r[%04d]=0x%08x\n", i, rdev->cp.ring[i]);
3512 i = (i + 1) & rdev->cp.ptr_mask;
3513 }
3514 return 0;
3515 }
3517 static int r600_debugfs_mc_info(struct seq_file *m, void *data)
3518 {
3519 struct drm_info_node *node = (struct drm_info_node *) m->private;
3520 struct drm_device *dev = node->minor->dev;
3521 struct radeon_device *rdev = dev->dev_private;
3523 DREG32_SYS(m, rdev, R_000E50_SRBM_STATUS);
3524 DREG32_SYS(m, rdev, VM_L2_STATUS);
3525 return 0;
3526 }
3528 static struct drm_info_list r600_mc_info_list[] = {
3529 {"r600_mc_info", r600_debugfs_mc_info, 0, NULL},
3530 {"r600_ring_info", r600_debugfs_cp_ring_info, 0, NULL},
3534 int r600_debugfs_mc_info_init(struct radeon_device *rdev)
3535 {
3536 #if defined(CONFIG_DEBUG_FS)
3537 return radeon_debugfs_add_files(rdev, r600_mc_info_list, ARRAY_SIZE(r600_mc_info_list));
3538 #else
3539 return 0;
3540 #endif
3541 }
3543 /**
3544  * r600_ioctl_wait_idle - flush host path cache on wait idle ioctl
3545  * rdev: radeon device structure
3546  * bo: buffer object struct which userspace is waiting for idle
3547  *
3548  * Some R6XX/R7XX chips don't seem to take into account an HDP flush
3549  * performed through the ring buffer, which leads to corruption in
3550  * rendering, see http://bugzilla.kernel.org/show_bug.cgi?id=15186; to
3551  * avoid this we directly perform the HDP flush by writing the register
3552  * through MMIO.
3553 void r600_ioctl_wait_idle(struct radeon_device *rdev, struct radeon_bo *bo)
3554 {
3555 /* r7xx hw bug. Write to HDP_DEBUG1 followed by fb read
3556  * rather than write to HDP_REG_COHERENCY_FLUSH_CNTL.
3557  * This seems to cause problems on some AGP cards. Just use the old
3558  * method for them.
3559  */
3560 if ((rdev->family >= CHIP_RV770) && (rdev->family <= CHIP_RV740) &&
3561 rdev->vram_scratch.ptr && !(rdev->flags & RADEON_IS_AGP)) {
3562 void __iomem *ptr = (void *)rdev->vram_scratch.ptr;
3563 u32 tmp;
3565 WREG32(HDP_DEBUG1, 0);
3566 tmp = readl((void __iomem *)ptr);
3567 } else
3568 WREG32(R_005480_HDP_MEM_COHERENCY_FLUSH_CNTL, 0x1);
3569 }
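/* r600_set_pcie_lanes() below follows the usual reconfig sequence: map
 * the requested lane count onto an LC_LINK_WIDTH_X* encoding, bail out on
 * IGP/X2/non-PCIE parts or when the width is already current, write the
 * new width together with RECONFIG_NOW, then poll the target/current
 * profile register until the transition completes. */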
3571 void r600_set_pcie_lanes(struct radeon_device *rdev, int lanes)
3572 {
3573 u32 link_width_cntl, mask, target_reg;
3575 if (rdev->flags & RADEON_IS_IGP)
3576 return;
3578 if (!(rdev->flags & RADEON_IS_PCIE))
3579 return;
3581 /* x2 cards have a special sequence */
3582 if (ASIC_IS_X2(rdev))
3583 return;
3585 /* FIXME wait for idle */
3587 switch (lanes) {
3588 case 0:
3589 mask = RADEON_PCIE_LC_LINK_WIDTH_X0;
3590 break;
3591 case 1:
3592 mask = RADEON_PCIE_LC_LINK_WIDTH_X1;
3593 break;
3594 case 2:
3595 mask = RADEON_PCIE_LC_LINK_WIDTH_X2;
3596 break;
3597 case 4:
3598 mask = RADEON_PCIE_LC_LINK_WIDTH_X4;
3599 break;
3600 case 8:
3601 mask = RADEON_PCIE_LC_LINK_WIDTH_X8;
3602 break;
3603 case 12:
3604 mask = RADEON_PCIE_LC_LINK_WIDTH_X12;
3605 break;
3606 case 16:
3607 default:
3608 mask = RADEON_PCIE_LC_LINK_WIDTH_X16;
3609 break;
3610 }
3612 link_width_cntl = RREG32_PCIE_P(RADEON_PCIE_LC_LINK_WIDTH_CNTL);
3614 if ((link_width_cntl & RADEON_PCIE_LC_LINK_WIDTH_RD_MASK) ==
3615 (mask << RADEON_PCIE_LC_LINK_WIDTH_RD_SHIFT))
3616 return;
3618 if (link_width_cntl & R600_PCIE_LC_UPCONFIGURE_DIS)
3619 return;
3621 link_width_cntl &= ~(RADEON_PCIE_LC_LINK_WIDTH_MASK |
3622 RADEON_PCIE_LC_RECONFIG_NOW |
3623 R600_PCIE_LC_RENEGOTIATE_EN |
3624 R600_PCIE_LC_RECONFIG_ARC_MISSING_ESCAPE);
3625 link_width_cntl |= mask;
3627 WREG32_PCIE_P(RADEON_PCIE_LC_LINK_WIDTH_CNTL, link_width_cntl);
3629 /* some northbridges can renegotiate the link rather than requiring
3630 * a complete re-config.
3631 * e.g., AMD 780/790 northbridges (pci ids: 0x5956, 0x5957, 0x5958, etc.)
3633 if (link_width_cntl & R600_PCIE_LC_RENEGOTIATION_SUPPORT)
3634 link_width_cntl |= R600_PCIE_LC_RENEGOTIATE_EN | R600_PCIE_LC_UPCONFIGURE_SUPPORT;
3636 link_width_cntl |= R600_PCIE_LC_RECONFIG_ARC_MISSING_ESCAPE;
3638 WREG32_PCIE_P(RADEON_PCIE_LC_LINK_WIDTH_CNTL, (link_width_cntl |
3639 RADEON_PCIE_LC_RECONFIG_NOW));
3641 if (rdev->family >= CHIP_RV770)
3642 target_reg = R700_TARGET_AND_CURRENT_PROFILE_INDEX;
3643 else
3644 target_reg = R600_TARGET_AND_CURRENT_PROFILE_INDEX;
3646 /* wait for lane set to complete */
3647 link_width_cntl = RREG32(target_reg);
3648 while (link_width_cntl == 0xffffffff)
3649 link_width_cntl = RREG32(target_reg);
3651 }
3653 int r600_get_pcie_lanes(struct radeon_device *rdev)
3654 {
3655 u32 link_width_cntl;
3657 if (rdev->flags & RADEON_IS_IGP)
3658 return 0;
3660 if (!(rdev->flags & RADEON_IS_PCIE))
3661 return 0;
3663 /* x2 cards have a special sequence */
3664 if (ASIC_IS_X2(rdev))
3665 return 0;
3667 /* FIXME wait for idle */
3669 link_width_cntl = RREG32_PCIE_P(RADEON_PCIE_LC_LINK_WIDTH_CNTL);
3671 switch ((link_width_cntl & RADEON_PCIE_LC_LINK_WIDTH_RD_MASK) >> RADEON_PCIE_LC_LINK_WIDTH_RD_SHIFT) {
3672 case RADEON_PCIE_LC_LINK_WIDTH_X0:
3673 return 0;
3674 case RADEON_PCIE_LC_LINK_WIDTH_X1:
3675 return 1;
3676 case RADEON_PCIE_LC_LINK_WIDTH_X2:
3677 return 2;
3678 case RADEON_PCIE_LC_LINK_WIDTH_X4:
3679 return 4;
3680 case RADEON_PCIE_LC_LINK_WIDTH_X8:
3681 return 8;
3682 case RADEON_PCIE_LC_LINK_WIDTH_X16:
3683 default:
3684 return 16;
3685 }
3686 }
3688 static void r600_pcie_gen2_enable(struct radeon_device *rdev)
3689 {
3690 u32 link_width_cntl, lanes, speed_cntl, training_cntl, tmp;
3691 u16 link_cntl2;
3693 if (radeon_pcie_gen2 == 0)
3694 return;
3696 if (rdev->flags & RADEON_IS_IGP)
3697 return;
3699 if (!(rdev->flags & RADEON_IS_PCIE))
3700 return;
3702 /* x2 cards have a special sequence */
3703 if (ASIC_IS_X2(rdev))
3704 return;
3706 /* only RV6xx+ chips are supported */
3707 if (rdev->family <= CHIP_R600)
3708 return;
3710 /* 55 nm r6xx asics */
3711 if ((rdev->family == CHIP_RV670) ||
3712 (rdev->family == CHIP_RV620) ||
3713 (rdev->family == CHIP_RV635)) {
3714 /* advertise upconfig capability */
3715 link_width_cntl = RREG32_PCIE_P(PCIE_LC_LINK_WIDTH_CNTL);
3716 link_width_cntl &= ~LC_UPCONFIGURE_DIS;
3717 WREG32_PCIE_P(PCIE_LC_LINK_WIDTH_CNTL, link_width_cntl);
3718 link_width_cntl = RREG32_PCIE_P(PCIE_LC_LINK_WIDTH_CNTL);
3719 if (link_width_cntl & LC_RENEGOTIATION_SUPPORT) {
3720 lanes = (link_width_cntl & LC_LINK_WIDTH_RD_MASK) >> LC_LINK_WIDTH_RD_SHIFT;
3721 link_width_cntl &= ~(LC_LINK_WIDTH_MASK |
3722 LC_RECONFIG_ARC_MISSING_ESCAPE);
3723 link_width_cntl |= lanes | LC_RECONFIG_NOW | LC_RENEGOTIATE_EN;
3724 WREG32_PCIE_P(PCIE_LC_LINK_WIDTH_CNTL, link_width_cntl);
3725 } else {
3726 link_width_cntl |= LC_UPCONFIGURE_DIS;
3727 WREG32_PCIE_P(PCIE_LC_LINK_WIDTH_CNTL, link_width_cntl);
3728 }
3729 }
3731 speed_cntl = RREG32_PCIE_P(PCIE_LC_SPEED_CNTL);
3732 if ((speed_cntl & LC_OTHER_SIDE_EVER_SENT_GEN2) &&
3733 (speed_cntl & LC_OTHER_SIDE_SUPPORTS_GEN2)) {
3735 /* 55 nm r6xx asics */
3736 if ((rdev->family == CHIP_RV670) ||
3737 (rdev->family == CHIP_RV620) ||
3738 (rdev->family == CHIP_RV635)) {
3739 WREG32(MM_CFGREGS_CNTL, 0x8);
3740 link_cntl2 = RREG32(0x4088);
3741 WREG32(MM_CFGREGS_CNTL, 0);
3742 /* not supported yet */
3743 if (link_cntl2 & SELECTABLE_DEEMPHASIS)
3744 return;
3745 }
3747 speed_cntl &= ~LC_SPEED_CHANGE_ATTEMPTS_ALLOWED_MASK;
3748 speed_cntl |= (0x3 << LC_SPEED_CHANGE_ATTEMPTS_ALLOWED_SHIFT);
3749 speed_cntl &= ~LC_VOLTAGE_TIMER_SEL_MASK;
3750 speed_cntl &= ~LC_FORCE_DIS_HW_SPEED_CHANGE;
3751 speed_cntl |= LC_FORCE_EN_HW_SPEED_CHANGE;
3752 WREG32_PCIE_P(PCIE_LC_SPEED_CNTL, speed_cntl);
3754 tmp = RREG32(0x541c);
3755 WREG32(0x541c, tmp | 0x8);
3756 WREG32(MM_CFGREGS_CNTL, MM_WR_TO_CFG_EN);
3757 link_cntl2 = RREG16(0x4088);
3758 link_cntl2 &= ~TARGET_LINK_SPEED_MASK;
3759 link_cntl2 |= 0x2;
3760 WREG16(0x4088, link_cntl2);
3761 WREG32(MM_CFGREGS_CNTL, 0);
3763 if ((rdev->family == CHIP_RV670) ||
3764 (rdev->family == CHIP_RV620) ||
3765 (rdev->family == CHIP_RV635)) {
3766 training_cntl = RREG32_PCIE_P(PCIE_LC_TRAINING_CNTL);
3767 training_cntl &= ~LC_POINT_7_PLUS_EN;
3768 WREG32_PCIE_P(PCIE_LC_TRAINING_CNTL, training_cntl);
3770 speed_cntl = RREG32_PCIE_P(PCIE_LC_SPEED_CNTL);
3771 speed_cntl &= ~LC_TARGET_LINK_SPEED_OVERRIDE_EN;
3772 WREG32_PCIE_P(PCIE_LC_SPEED_CNTL, speed_cntl);
3773 }
3775 speed_cntl = RREG32_PCIE_P(PCIE_LC_SPEED_CNTL);
3776 speed_cntl |= LC_GEN2_EN_STRAP;
3777 WREG32_PCIE_P(PCIE_LC_SPEED_CNTL, speed_cntl);
3779 } else {
3780 link_width_cntl = RREG32_PCIE_P(PCIE_LC_LINK_WIDTH_CNTL);
3781 /* XXX: only disable it if gen1 bridge vendor == 0x111d or 0x1106 */
3782 if (1)
3783 link_width_cntl |= LC_UPCONFIGURE_DIS;
3784 else
3785 link_width_cntl &= ~LC_UPCONFIGURE_DIS;
3786 WREG32_PCIE_P(PCIE_LC_LINK_WIDTH_CNTL, link_width_cntl);
3787 }
3788 }