drm/radeon: fix & improve ih ring handling v3
[linux-2.6-block.git] / drivers / gpu / drm / radeon / radeon_device.c
1 /*
2  * Copyright 2008 Advanced Micro Devices, Inc.
3  * Copyright 2008 Red Hat Inc.
4  * Copyright 2009 Jerome Glisse.
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a
7  * copy of this software and associated documentation files (the "Software"),
8  * to deal in the Software without restriction, including without limitation
9  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10  * and/or sell copies of the Software, and to permit persons to whom the
11  * Software is furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be included in
14  * all copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
19  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
20  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22  * OTHER DEALINGS IN THE SOFTWARE.
23  *
24  * Authors: Dave Airlie
25  *          Alex Deucher
26  *          Jerome Glisse
27  */
28 #include <linux/console.h>
29 #include <linux/slab.h>
30 #include <drm/drmP.h>
31 #include <drm/drm_crtc_helper.h>
32 #include <drm/radeon_drm.h>
33 #include <linux/vgaarb.h>
34 #include <linux/vga_switcheroo.h>
35 #include <linux/efi.h>
36 #include "radeon_reg.h"
37 #include "radeon.h"
38 #include "atom.h"
39
40 static const char radeon_family_name[][16] = {
41         "R100",
42         "RV100",
43         "RS100",
44         "RV200",
45         "RS200",
46         "R200",
47         "RV250",
48         "RS300",
49         "RV280",
50         "R300",
51         "R350",
52         "RV350",
53         "RV380",
54         "R420",
55         "R423",
56         "RV410",
57         "RS400",
58         "RS480",
59         "RS600",
60         "RS690",
61         "RS740",
62         "RV515",
63         "R520",
64         "RV530",
65         "RV560",
66         "RV570",
67         "R580",
68         "R600",
69         "RV610",
70         "RV630",
71         "RV670",
72         "RV620",
73         "RV635",
74         "RS780",
75         "RS880",
76         "RV770",
77         "RV730",
78         "RV710",
79         "RV740",
80         "CEDAR",
81         "REDWOOD",
82         "JUNIPER",
83         "CYPRESS",
84         "HEMLOCK",
85         "PALM",
86         "SUMO",
87         "SUMO2",
88         "BARTS",
89         "TURKS",
90         "CAICOS",
91         "CAYMAN",
92         "ARUBA",
93         "TAHITI",
94         "PITCAIRN",
95         "VERDE",
96         "LAST",
97 };
98
99 /*
100  * Clear GPU surface registers.
101  */
102 void radeon_surface_init(struct radeon_device *rdev)
103 {
104         /* FIXME: check this out */
105         if (rdev->family < CHIP_R600) {
106                 int i;
107
108                 for (i = 0; i < RADEON_GEM_MAX_SURFACES; i++) {
109                         if (rdev->surface_regs[i].bo)
110                                 radeon_bo_get_surface_reg(rdev->surface_regs[i].bo);
111                         else
112                                 radeon_clear_surface_reg(rdev, i);
113                 }
114                 /* enable surfaces */
115                 WREG32(RADEON_SURFACE_CNTL, 0);
116         }
117 }
118
119 /*
120  * GPU scratch registers helpers function.
121  */
122 void radeon_scratch_init(struct radeon_device *rdev)
123 {
124         int i;
125
126         /* FIXME: check this out */
127         if (rdev->family < CHIP_R300) {
128                 rdev->scratch.num_reg = 5;
129         } else {
130                 rdev->scratch.num_reg = 7;
131         }
132         rdev->scratch.reg_base = RADEON_SCRATCH_REG0;
133         for (i = 0; i < rdev->scratch.num_reg; i++) {
134                 rdev->scratch.free[i] = true;
135                 rdev->scratch.reg[i] = rdev->scratch.reg_base + (i * 4);
136         }
137 }
138
139 int radeon_scratch_get(struct radeon_device *rdev, uint32_t *reg)
140 {
141         int i;
142
143         for (i = 0; i < rdev->scratch.num_reg; i++) {
144                 if (rdev->scratch.free[i]) {
145                         rdev->scratch.free[i] = false;
146                         *reg = rdev->scratch.reg[i];
147                         return 0;
148                 }
149         }
150         return -EINVAL;
151 }
152
153 void radeon_scratch_free(struct radeon_device *rdev, uint32_t reg)
154 {
155         int i;
156
157         for (i = 0; i < rdev->scratch.num_reg; i++) {
158                 if (rdev->scratch.reg[i] == reg) {
159                         rdev->scratch.free[i] = true;
160                         return;
161                 }
162         }
163 }
164
165 void radeon_wb_disable(struct radeon_device *rdev)
166 {
167         int r;
168
169         if (rdev->wb.wb_obj) {
170                 r = radeon_bo_reserve(rdev->wb.wb_obj, false);
171                 if (unlikely(r != 0))
172                         return;
173                 radeon_bo_kunmap(rdev->wb.wb_obj);
174                 radeon_bo_unpin(rdev->wb.wb_obj);
175                 radeon_bo_unreserve(rdev->wb.wb_obj);
176         }
177         rdev->wb.enabled = false;
178 }
179
180 void radeon_wb_fini(struct radeon_device *rdev)
181 {
182         radeon_wb_disable(rdev);
183         if (rdev->wb.wb_obj) {
184                 radeon_bo_unref(&rdev->wb.wb_obj);
185                 rdev->wb.wb = NULL;
186                 rdev->wb.wb_obj = NULL;
187         }
188 }
189
190 int radeon_wb_init(struct radeon_device *rdev)
191 {
192         int r;
193
194         if (rdev->wb.wb_obj == NULL) {
195                 r = radeon_bo_create(rdev, RADEON_GPU_PAGE_SIZE, PAGE_SIZE, true,
196                                      RADEON_GEM_DOMAIN_GTT, NULL, &rdev->wb.wb_obj);
197                 if (r) {
198                         dev_warn(rdev->dev, "(%d) create WB bo failed\n", r);
199                         return r;
200                 }
201         }
202         r = radeon_bo_reserve(rdev->wb.wb_obj, false);
203         if (unlikely(r != 0)) {
204                 radeon_wb_fini(rdev);
205                 return r;
206         }
207         r = radeon_bo_pin(rdev->wb.wb_obj, RADEON_GEM_DOMAIN_GTT,
208                           &rdev->wb.gpu_addr);
209         if (r) {
210                 radeon_bo_unreserve(rdev->wb.wb_obj);
211                 dev_warn(rdev->dev, "(%d) pin WB bo failed\n", r);
212                 radeon_wb_fini(rdev);
213                 return r;
214         }
215         r = radeon_bo_kmap(rdev->wb.wb_obj, (void **)&rdev->wb.wb);
216         radeon_bo_unreserve(rdev->wb.wb_obj);
217         if (r) {
218                 dev_warn(rdev->dev, "(%d) map WB bo failed\n", r);
219                 radeon_wb_fini(rdev);
220                 return r;
221         }
222
223         /* clear wb memory */
224         memset((char *)rdev->wb.wb, 0, RADEON_GPU_PAGE_SIZE);
225         /* disable event_write fences */
226         rdev->wb.use_event = false;
227         /* disabled via module param */
228         if (radeon_no_wb == 1) {
229                 rdev->wb.enabled = false;
230         } else {
231                 if (rdev->flags & RADEON_IS_AGP) {
232                         /* often unreliable on AGP */
233                         rdev->wb.enabled = false;
234                 } else if (rdev->family < CHIP_R300) {
235                         /* often unreliable on pre-r300 */
236                         rdev->wb.enabled = false;
237                 } else {
238                         rdev->wb.enabled = true;
239                         /* event_write fences are only available on r600+ */
240                         if (rdev->family >= CHIP_R600) {
241                                 rdev->wb.use_event = true;
242                         }
243                 }
244         }
245         /* always use writeback/events on NI, APUs */
246         if (rdev->family >= CHIP_PALM) {
247                 rdev->wb.enabled = true;
248                 rdev->wb.use_event = true;
249         }
250
251         dev_info(rdev->dev, "WB %sabled\n", rdev->wb.enabled ? "en" : "dis");
252
253         return 0;
254 }
255
256 /**
257  * radeon_vram_location - try to find VRAM location
258  * @rdev: radeon device structure holding all necessary informations
259  * @mc: memory controller structure holding memory informations
260  * @base: base address at which to put VRAM
261  *
262  * Function will place try to place VRAM at base address provided
263  * as parameter (which is so far either PCI aperture address or
264  * for IGP TOM base address).
265  *
266  * If there is not enough space to fit the unvisible VRAM in the 32bits
267  * address space then we limit the VRAM size to the aperture.
268  *
269  * If we are using AGP and if the AGP aperture doesn't allow us to have
270  * room for all the VRAM than we restrict the VRAM to the PCI aperture
271  * size and print a warning.
272  *
273  * This function will never fails, worst case are limiting VRAM.
274  *
275  * Note: GTT start, end, size should be initialized before calling this
276  * function on AGP platform.
277  *
278  * Note: We don't explicitly enforce VRAM start to be aligned on VRAM size,
279  * this shouldn't be a problem as we are using the PCI aperture as a reference.
280  * Otherwise this would be needed for rv280, all r3xx, and all r4xx, but
281  * not IGP.
282  *
283  * Note: we use mc_vram_size as on some board we need to program the mc to
284  * cover the whole aperture even if VRAM size is inferior to aperture size
285  * Novell bug 204882 + along with lots of ubuntu ones
286  *
287  * Note: when limiting vram it's safe to overwritte real_vram_size because
288  * we are not in case where real_vram_size is inferior to mc_vram_size (ie
289  * note afected by bogus hw of Novell bug 204882 + along with lots of ubuntu
290  * ones)
291  *
292  * Note: IGP TOM addr should be the same as the aperture addr, we don't
293  * explicitly check for that thought.
294  *
295  * FIXME: when reducing VRAM size align new size on power of 2.
296  */
297 void radeon_vram_location(struct radeon_device *rdev, struct radeon_mc *mc, u64 base)
298 {
299         mc->vram_start = base;
300         if (mc->mc_vram_size > (0xFFFFFFFF - base + 1)) {
301                 dev_warn(rdev->dev, "limiting VRAM to PCI aperture size\n");
302                 mc->real_vram_size = mc->aper_size;
303                 mc->mc_vram_size = mc->aper_size;
304         }
305         mc->vram_end = mc->vram_start + mc->mc_vram_size - 1;
306         if (rdev->flags & RADEON_IS_AGP && mc->vram_end > mc->gtt_start && mc->vram_start <= mc->gtt_end) {
307                 dev_warn(rdev->dev, "limiting VRAM to PCI aperture size\n");
308                 mc->real_vram_size = mc->aper_size;
309                 mc->mc_vram_size = mc->aper_size;
310         }
311         mc->vram_end = mc->vram_start + mc->mc_vram_size - 1;
312         if (radeon_vram_limit && radeon_vram_limit < mc->real_vram_size)
313                 mc->real_vram_size = radeon_vram_limit;
314         dev_info(rdev->dev, "VRAM: %lluM 0x%016llX - 0x%016llX (%lluM used)\n",
315                         mc->mc_vram_size >> 20, mc->vram_start,
316                         mc->vram_end, mc->real_vram_size >> 20);
317 }
318
319 /**
320  * radeon_gtt_location - try to find GTT location
321  * @rdev: radeon device structure holding all necessary informations
322  * @mc: memory controller structure holding memory informations
323  *
324  * Function will place try to place GTT before or after VRAM.
325  *
326  * If GTT size is bigger than space left then we ajust GTT size.
327  * Thus function will never fails.
328  *
329  * FIXME: when reducing GTT size align new size on power of 2.
330  */
331 void radeon_gtt_location(struct radeon_device *rdev, struct radeon_mc *mc)
332 {
333         u64 size_af, size_bf;
334
335         size_af = ((0xFFFFFFFF - mc->vram_end) + mc->gtt_base_align) & ~mc->gtt_base_align;
336         size_bf = mc->vram_start & ~mc->gtt_base_align;
337         if (size_bf > size_af) {
338                 if (mc->gtt_size > size_bf) {
339                         dev_warn(rdev->dev, "limiting GTT\n");
340                         mc->gtt_size = size_bf;
341                 }
342                 mc->gtt_start = (mc->vram_start & ~mc->gtt_base_align) - mc->gtt_size;
343         } else {
344                 if (mc->gtt_size > size_af) {
345                         dev_warn(rdev->dev, "limiting GTT\n");
346                         mc->gtt_size = size_af;
347                 }
348                 mc->gtt_start = (mc->vram_end + 1 + mc->gtt_base_align) & ~mc->gtt_base_align;
349         }
350         mc->gtt_end = mc->gtt_start + mc->gtt_size - 1;
351         dev_info(rdev->dev, "GTT: %lluM 0x%016llX - 0x%016llX\n",
352                         mc->gtt_size >> 20, mc->gtt_start, mc->gtt_end);
353 }
354
355 /*
356  * GPU helpers function.
357  */
358 bool radeon_card_posted(struct radeon_device *rdev)
359 {
360         uint32_t reg;
361
362         if (efi_enabled && rdev->pdev->subsystem_vendor == PCI_VENDOR_ID_APPLE)
363                 return false;
364
365         /* first check CRTCs */
366         if (ASIC_IS_DCE41(rdev)) {
367                 reg = RREG32(EVERGREEN_CRTC_CONTROL + EVERGREEN_CRTC0_REGISTER_OFFSET) |
368                         RREG32(EVERGREEN_CRTC_CONTROL + EVERGREEN_CRTC1_REGISTER_OFFSET);
369                 if (reg & EVERGREEN_CRTC_MASTER_EN)
370                         return true;
371         } else if (ASIC_IS_DCE4(rdev)) {
372                 reg = RREG32(EVERGREEN_CRTC_CONTROL + EVERGREEN_CRTC0_REGISTER_OFFSET) |
373                         RREG32(EVERGREEN_CRTC_CONTROL + EVERGREEN_CRTC1_REGISTER_OFFSET) |
374                         RREG32(EVERGREEN_CRTC_CONTROL + EVERGREEN_CRTC2_REGISTER_OFFSET) |
375                         RREG32(EVERGREEN_CRTC_CONTROL + EVERGREEN_CRTC3_REGISTER_OFFSET) |
376                         RREG32(EVERGREEN_CRTC_CONTROL + EVERGREEN_CRTC4_REGISTER_OFFSET) |
377                         RREG32(EVERGREEN_CRTC_CONTROL + EVERGREEN_CRTC5_REGISTER_OFFSET);
378                 if (reg & EVERGREEN_CRTC_MASTER_EN)
379                         return true;
380         } else if (ASIC_IS_AVIVO(rdev)) {
381                 reg = RREG32(AVIVO_D1CRTC_CONTROL) |
382                       RREG32(AVIVO_D2CRTC_CONTROL);
383                 if (reg & AVIVO_CRTC_EN) {
384                         return true;
385                 }
386         } else {
387                 reg = RREG32(RADEON_CRTC_GEN_CNTL) |
388                       RREG32(RADEON_CRTC2_GEN_CNTL);
389                 if (reg & RADEON_CRTC_EN) {
390                         return true;
391                 }
392         }
393
394         /* then check MEM_SIZE, in case the crtcs are off */
395         if (rdev->family >= CHIP_R600)
396                 reg = RREG32(R600_CONFIG_MEMSIZE);
397         else
398                 reg = RREG32(RADEON_CONFIG_MEMSIZE);
399
400         if (reg)
401                 return true;
402
403         return false;
404
405 }
406
407 void radeon_update_bandwidth_info(struct radeon_device *rdev)
408 {
409         fixed20_12 a;
410         u32 sclk = rdev->pm.current_sclk;
411         u32 mclk = rdev->pm.current_mclk;
412
413         /* sclk/mclk in Mhz */
414         a.full = dfixed_const(100);
415         rdev->pm.sclk.full = dfixed_const(sclk);
416         rdev->pm.sclk.full = dfixed_div(rdev->pm.sclk, a);
417         rdev->pm.mclk.full = dfixed_const(mclk);
418         rdev->pm.mclk.full = dfixed_div(rdev->pm.mclk, a);
419
420         if (rdev->flags & RADEON_IS_IGP) {
421                 a.full = dfixed_const(16);
422                 /* core_bandwidth = sclk(Mhz) * 16 */
423                 rdev->pm.core_bandwidth.full = dfixed_div(rdev->pm.sclk, a);
424         }
425 }
426
427 bool radeon_boot_test_post_card(struct radeon_device *rdev)
428 {
429         if (radeon_card_posted(rdev))
430                 return true;
431
432         if (rdev->bios) {
433                 DRM_INFO("GPU not posted. posting now...\n");
434                 if (rdev->is_atom_bios)
435                         atom_asic_init(rdev->mode_info.atom_context);
436                 else
437                         radeon_combios_asic_init(rdev->ddev);
438                 return true;
439         } else {
440                 dev_err(rdev->dev, "Card not posted and no BIOS - ignoring\n");
441                 return false;
442         }
443 }
444
445 int radeon_dummy_page_init(struct radeon_device *rdev)
446 {
447         if (rdev->dummy_page.page)
448                 return 0;
449         rdev->dummy_page.page = alloc_page(GFP_DMA32 | GFP_KERNEL | __GFP_ZERO);
450         if (rdev->dummy_page.page == NULL)
451                 return -ENOMEM;
452         rdev->dummy_page.addr = pci_map_page(rdev->pdev, rdev->dummy_page.page,
453                                         0, PAGE_SIZE, PCI_DMA_BIDIRECTIONAL);
454         if (pci_dma_mapping_error(rdev->pdev, rdev->dummy_page.addr)) {
455                 dev_err(&rdev->pdev->dev, "Failed to DMA MAP the dummy page\n");
456                 __free_page(rdev->dummy_page.page);
457                 rdev->dummy_page.page = NULL;
458                 return -ENOMEM;
459         }
460         return 0;
461 }
462
463 void radeon_dummy_page_fini(struct radeon_device *rdev)
464 {
465         if (rdev->dummy_page.page == NULL)
466                 return;
467         pci_unmap_page(rdev->pdev, rdev->dummy_page.addr,
468                         PAGE_SIZE, PCI_DMA_BIDIRECTIONAL);
469         __free_page(rdev->dummy_page.page);
470         rdev->dummy_page.page = NULL;
471 }
472
473
474 /* ATOM accessor methods */
475 static uint32_t cail_pll_read(struct card_info *info, uint32_t reg)
476 {
477         struct radeon_device *rdev = info->dev->dev_private;
478         uint32_t r;
479
480         r = rdev->pll_rreg(rdev, reg);
481         return r;
482 }
483
484 static void cail_pll_write(struct card_info *info, uint32_t reg, uint32_t val)
485 {
486         struct radeon_device *rdev = info->dev->dev_private;
487
488         rdev->pll_wreg(rdev, reg, val);
489 }
490
491 static uint32_t cail_mc_read(struct card_info *info, uint32_t reg)
492 {
493         struct radeon_device *rdev = info->dev->dev_private;
494         uint32_t r;
495
496         r = rdev->mc_rreg(rdev, reg);
497         return r;
498 }
499
500 static void cail_mc_write(struct card_info *info, uint32_t reg, uint32_t val)
501 {
502         struct radeon_device *rdev = info->dev->dev_private;
503
504         rdev->mc_wreg(rdev, reg, val);
505 }
506
507 static void cail_reg_write(struct card_info *info, uint32_t reg, uint32_t val)
508 {
509         struct radeon_device *rdev = info->dev->dev_private;
510
511         WREG32(reg*4, val);
512 }
513
514 static uint32_t cail_reg_read(struct card_info *info, uint32_t reg)
515 {
516         struct radeon_device *rdev = info->dev->dev_private;
517         uint32_t r;
518
519         r = RREG32(reg*4);
520         return r;
521 }
522
523 static void cail_ioreg_write(struct card_info *info, uint32_t reg, uint32_t val)
524 {
525         struct radeon_device *rdev = info->dev->dev_private;
526
527         WREG32_IO(reg*4, val);
528 }
529
530 static uint32_t cail_ioreg_read(struct card_info *info, uint32_t reg)
531 {
532         struct radeon_device *rdev = info->dev->dev_private;
533         uint32_t r;
534
535         r = RREG32_IO(reg*4);
536         return r;
537 }
538
539 int radeon_atombios_init(struct radeon_device *rdev)
540 {
541         struct card_info *atom_card_info =
542             kzalloc(sizeof(struct card_info), GFP_KERNEL);
543
544         if (!atom_card_info)
545                 return -ENOMEM;
546
547         rdev->mode_info.atom_card_info = atom_card_info;
548         atom_card_info->dev = rdev->ddev;
549         atom_card_info->reg_read = cail_reg_read;
550         atom_card_info->reg_write = cail_reg_write;
551         /* needed for iio ops */
552         if (rdev->rio_mem) {
553                 atom_card_info->ioreg_read = cail_ioreg_read;
554                 atom_card_info->ioreg_write = cail_ioreg_write;
555         } else {
556                 DRM_ERROR("Unable to find PCI I/O BAR; using MMIO for ATOM IIO\n");
557                 atom_card_info->ioreg_read = cail_reg_read;
558                 atom_card_info->ioreg_write = cail_reg_write;
559         }
560         atom_card_info->mc_read = cail_mc_read;
561         atom_card_info->mc_write = cail_mc_write;
562         atom_card_info->pll_read = cail_pll_read;
563         atom_card_info->pll_write = cail_pll_write;
564
565         rdev->mode_info.atom_context = atom_parse(atom_card_info, rdev->bios);
566         mutex_init(&rdev->mode_info.atom_context->mutex);
567         radeon_atom_initialize_bios_scratch_regs(rdev->ddev);
568         atom_allocate_fb_scratch(rdev->mode_info.atom_context);
569         return 0;
570 }
571
572 void radeon_atombios_fini(struct radeon_device *rdev)
573 {
574         if (rdev->mode_info.atom_context) {
575                 kfree(rdev->mode_info.atom_context->scratch);
576                 kfree(rdev->mode_info.atom_context);
577         }
578         kfree(rdev->mode_info.atom_card_info);
579 }
580
581 int radeon_combios_init(struct radeon_device *rdev)
582 {
583         radeon_combios_initialize_bios_scratch_regs(rdev->ddev);
584         return 0;
585 }
586
587 void radeon_combios_fini(struct radeon_device *rdev)
588 {
589 }
590
591 /* if we get transitioned to only one device, tak VGA back */
592 static unsigned int radeon_vga_set_decode(void *cookie, bool state)
593 {
594         struct radeon_device *rdev = cookie;
595         radeon_vga_set_state(rdev, state);
596         if (state)
597                 return VGA_RSRC_LEGACY_IO | VGA_RSRC_LEGACY_MEM |
598                        VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
599         else
600                 return VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
601 }
602
603 void radeon_check_arguments(struct radeon_device *rdev)
604 {
605         /* vramlimit must be a power of two */
606         switch (radeon_vram_limit) {
607         case 0:
608         case 4:
609         case 8:
610         case 16:
611         case 32:
612         case 64:
613         case 128:
614         case 256:
615         case 512:
616         case 1024:
617         case 2048:
618         case 4096:
619                 break;
620         default:
621                 dev_warn(rdev->dev, "vram limit (%d) must be a power of 2\n",
622                                 radeon_vram_limit);
623                 radeon_vram_limit = 0;
624                 break;
625         }
626         radeon_vram_limit = radeon_vram_limit << 20;
627         /* gtt size must be power of two and greater or equal to 32M */
628         switch (radeon_gart_size) {
629         case 4:
630         case 8:
631         case 16:
632                 dev_warn(rdev->dev, "gart size (%d) too small forcing to 512M\n",
633                                 radeon_gart_size);
634                 radeon_gart_size = 512;
635                 break;
636         case 32:
637         case 64:
638         case 128:
639         case 256:
640         case 512:
641         case 1024:
642         case 2048:
643         case 4096:
644                 break;
645         default:
646                 dev_warn(rdev->dev, "gart size (%d) must be a power of 2\n",
647                                 radeon_gart_size);
648                 radeon_gart_size = 512;
649                 break;
650         }
651         rdev->mc.gtt_size = radeon_gart_size * 1024 * 1024;
652         /* AGP mode can only be -1, 1, 2, 4, 8 */
653         switch (radeon_agpmode) {
654         case -1:
655         case 0:
656         case 1:
657         case 2:
658         case 4:
659         case 8:
660                 break;
661         default:
662                 dev_warn(rdev->dev, "invalid AGP mode %d (valid mode: "
663                                 "-1, 0, 1, 2, 4, 8)\n", radeon_agpmode);
664                 radeon_agpmode = 0;
665                 break;
666         }
667 }
668
669 static void radeon_switcheroo_set_state(struct pci_dev *pdev, enum vga_switcheroo_state state)
670 {
671         struct drm_device *dev = pci_get_drvdata(pdev);
672         pm_message_t pmm = { .event = PM_EVENT_SUSPEND };
673         if (state == VGA_SWITCHEROO_ON) {
674                 printk(KERN_INFO "radeon: switched on\n");
675                 /* don't suspend or resume card normally */
676                 dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
677                 radeon_resume_kms(dev);
678                 dev->switch_power_state = DRM_SWITCH_POWER_ON;
679                 drm_kms_helper_poll_enable(dev);
680         } else {
681                 printk(KERN_INFO "radeon: switched off\n");
682                 drm_kms_helper_poll_disable(dev);
683                 dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
684                 radeon_suspend_kms(dev, pmm);
685                 dev->switch_power_state = DRM_SWITCH_POWER_OFF;
686         }
687 }
688
689 static bool radeon_switcheroo_can_switch(struct pci_dev *pdev)
690 {
691         struct drm_device *dev = pci_get_drvdata(pdev);
692         bool can_switch;
693
694         spin_lock(&dev->count_lock);
695         can_switch = (dev->open_count == 0);
696         spin_unlock(&dev->count_lock);
697         return can_switch;
698 }
699
700 static const struct vga_switcheroo_client_ops radeon_switcheroo_ops = {
701         .set_gpu_state = radeon_switcheroo_set_state,
702         .reprobe = NULL,
703         .can_switch = radeon_switcheroo_can_switch,
704 };
705
706 int radeon_device_init(struct radeon_device *rdev,
707                        struct drm_device *ddev,
708                        struct pci_dev *pdev,
709                        uint32_t flags)
710 {
711         int r, i;
712         int dma_bits;
713
714         rdev->shutdown = false;
715         rdev->dev = &pdev->dev;
716         rdev->ddev = ddev;
717         rdev->pdev = pdev;
718         rdev->flags = flags;
719         rdev->family = flags & RADEON_FAMILY_MASK;
720         rdev->is_atom_bios = false;
721         rdev->usec_timeout = RADEON_MAX_USEC_TIMEOUT;
722         rdev->mc.gtt_size = radeon_gart_size * 1024 * 1024;
723         rdev->accel_working = false;
724
725         DRM_INFO("initializing kernel modesetting (%s 0x%04X:0x%04X 0x%04X:0x%04X).\n",
726                 radeon_family_name[rdev->family], pdev->vendor, pdev->device,
727                 pdev->subsystem_vendor, pdev->subsystem_device);
728
729         /* mutex initialization are all done here so we
730          * can recall function without having locking issues */
731         radeon_mutex_init(&rdev->cs_mutex);
732         mutex_init(&rdev->ring_lock);
733         mutex_init(&rdev->dc_hw_i2c_mutex);
734         atomic_set(&rdev->ih.lock, 0);
735         mutex_init(&rdev->gem.mutex);
736         mutex_init(&rdev->pm.mutex);
737         init_rwsem(&rdev->pm.mclk_lock);
738         init_waitqueue_head(&rdev->irq.vblank_queue);
739         init_waitqueue_head(&rdev->irq.idle_queue);
740         r = radeon_gem_init(rdev);
741         if (r)
742                 return r;
743         /* initialize vm here */
744         rdev->vm_manager.use_bitmap = 1;
745         rdev->vm_manager.max_pfn = 1 << 20;
746         INIT_LIST_HEAD(&rdev->vm_manager.lru_vm);
747
748         /* Set asic functions */
749         r = radeon_asic_init(rdev);
750         if (r)
751                 return r;
752         radeon_check_arguments(rdev);
753
754         /* all of the newer IGP chips have an internal gart
755          * However some rs4xx report as AGP, so remove that here.
756          */
757         if ((rdev->family >= CHIP_RS400) &&
758             (rdev->flags & RADEON_IS_IGP)) {
759                 rdev->flags &= ~RADEON_IS_AGP;
760         }
761
762         if (rdev->flags & RADEON_IS_AGP && radeon_agpmode == -1) {
763                 radeon_agp_disable(rdev);
764         }
765
766         /* set DMA mask + need_dma32 flags.
767          * PCIE - can handle 40-bits.
768          * IGP - can handle 40-bits
769          * AGP - generally dma32 is safest
770          * PCI - dma32 for legacy pci gart, 40 bits on newer asics
771          */
772         rdev->need_dma32 = false;
773         if (rdev->flags & RADEON_IS_AGP)
774                 rdev->need_dma32 = true;
775         if ((rdev->flags & RADEON_IS_PCI) &&
776             (rdev->family < CHIP_RS400))
777                 rdev->need_dma32 = true;
778
779         dma_bits = rdev->need_dma32 ? 32 : 40;
780         r = pci_set_dma_mask(rdev->pdev, DMA_BIT_MASK(dma_bits));
781         if (r) {
782                 rdev->need_dma32 = true;
783                 dma_bits = 32;
784                 printk(KERN_WARNING "radeon: No suitable DMA available.\n");
785         }
786         r = pci_set_consistent_dma_mask(rdev->pdev, DMA_BIT_MASK(dma_bits));
787         if (r) {
788                 pci_set_consistent_dma_mask(rdev->pdev, DMA_BIT_MASK(32));
789                 printk(KERN_WARNING "radeon: No coherent DMA available.\n");
790         }
791
792         /* Registers mapping */
793         /* TODO: block userspace mapping of io register */
794         rdev->rmmio_base = pci_resource_start(rdev->pdev, 2);
795         rdev->rmmio_size = pci_resource_len(rdev->pdev, 2);
796         rdev->rmmio = ioremap(rdev->rmmio_base, rdev->rmmio_size);
797         if (rdev->rmmio == NULL) {
798                 return -ENOMEM;
799         }
800         DRM_INFO("register mmio base: 0x%08X\n", (uint32_t)rdev->rmmio_base);
801         DRM_INFO("register mmio size: %u\n", (unsigned)rdev->rmmio_size);
802
803         /* io port mapping */
804         for (i = 0; i < DEVICE_COUNT_RESOURCE; i++) {
805                 if (pci_resource_flags(rdev->pdev, i) & IORESOURCE_IO) {
806                         rdev->rio_mem_size = pci_resource_len(rdev->pdev, i);
807                         rdev->rio_mem = pci_iomap(rdev->pdev, i, rdev->rio_mem_size);
808                         break;
809                 }
810         }
811         if (rdev->rio_mem == NULL)
812                 DRM_ERROR("Unable to find PCI I/O BAR\n");
813
814         /* if we have > 1 VGA cards, then disable the radeon VGA resources */
815         /* this will fail for cards that aren't VGA class devices, just
816          * ignore it */
817         vga_client_register(rdev->pdev, rdev, NULL, radeon_vga_set_decode);
818         vga_switcheroo_register_client(rdev->pdev, &radeon_switcheroo_ops);
819
820         r = radeon_init(rdev);
821         if (r)
822                 return r;
823
824         if (rdev->flags & RADEON_IS_AGP && !rdev->accel_working) {
825                 /* Acceleration not working on AGP card try again
826                  * with fallback to PCI or PCIE GART
827                  */
828                 radeon_asic_reset(rdev);
829                 radeon_fini(rdev);
830                 radeon_agp_disable(rdev);
831                 r = radeon_init(rdev);
832                 if (r)
833                         return r;
834         }
835         if ((radeon_testing & 1)) {
836                 radeon_test_moves(rdev);
837         }
838         if ((radeon_testing & 2)) {
839                 radeon_test_syncing(rdev);
840         }
841         if (radeon_benchmarking) {
842                 radeon_benchmark(rdev, radeon_benchmarking);
843         }
844         return 0;
845 }
846
847 static void radeon_debugfs_remove_files(struct radeon_device *rdev);
848
849 void radeon_device_fini(struct radeon_device *rdev)
850 {
851         DRM_INFO("radeon: finishing device.\n");
852         rdev->shutdown = true;
853         /* evict vram memory */
854         radeon_bo_evict_vram(rdev);
855         radeon_fini(rdev);
856         vga_switcheroo_unregister_client(rdev->pdev);
857         vga_client_register(rdev->pdev, NULL, NULL, NULL);
858         if (rdev->rio_mem)
859                 pci_iounmap(rdev->pdev, rdev->rio_mem);
860         rdev->rio_mem = NULL;
861         iounmap(rdev->rmmio);
862         rdev->rmmio = NULL;
863         radeon_debugfs_remove_files(rdev);
864 }
865
866
867 /*
868  * Suspend & resume.
869  */
870 int radeon_suspend_kms(struct drm_device *dev, pm_message_t state)
871 {
872         struct radeon_device *rdev;
873         struct drm_crtc *crtc;
874         struct drm_connector *connector;
875         int i, r;
876
877         if (dev == NULL || dev->dev_private == NULL) {
878                 return -ENODEV;
879         }
880         if (state.event == PM_EVENT_PRETHAW) {
881                 return 0;
882         }
883         rdev = dev->dev_private;
884
885         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
886                 return 0;
887
888         drm_kms_helper_poll_disable(dev);
889
890         /* turn off display hw */
891         list_for_each_entry(connector, &dev->mode_config.connector_list, head) {
892                 drm_helper_connector_dpms(connector, DRM_MODE_DPMS_OFF);
893         }
894
895         /* unpin the front buffers */
896         list_for_each_entry(crtc, &dev->mode_config.crtc_list, head) {
897                 struct radeon_framebuffer *rfb = to_radeon_framebuffer(crtc->fb);
898                 struct radeon_bo *robj;
899
900                 if (rfb == NULL || rfb->obj == NULL) {
901                         continue;
902                 }
903                 robj = gem_to_radeon_bo(rfb->obj);
904                 /* don't unpin kernel fb objects */
905                 if (!radeon_fbdev_robj_is_fb(rdev, robj)) {
906                         r = radeon_bo_reserve(robj, false);
907                         if (r == 0) {
908                                 radeon_bo_unpin(robj);
909                                 radeon_bo_unreserve(robj);
910                         }
911                 }
912         }
913         /* evict vram memory */
914         radeon_bo_evict_vram(rdev);
915
916         mutex_lock(&rdev->ring_lock);
917         /* wait for gpu to finish processing current batch */
918         for (i = 0; i < RADEON_NUM_RINGS; i++)
919                 radeon_fence_wait_empty_locked(rdev, i);
920         mutex_unlock(&rdev->ring_lock);
921
922         radeon_save_bios_scratch_regs(rdev);
923
924         radeon_pm_suspend(rdev);
925         radeon_suspend(rdev);
926         radeon_hpd_fini(rdev);
927         /* evict remaining vram memory */
928         radeon_bo_evict_vram(rdev);
929
930         radeon_agp_suspend(rdev);
931
932         pci_save_state(dev->pdev);
933         if (state.event == PM_EVENT_SUSPEND) {
934                 /* Shut down the device */
935                 pci_disable_device(dev->pdev);
936                 pci_set_power_state(dev->pdev, PCI_D3hot);
937         }
938         console_lock();
939         radeon_fbdev_set_suspend(rdev, 1);
940         console_unlock();
941         return 0;
942 }
943
944 int radeon_resume_kms(struct drm_device *dev)
945 {
946         struct drm_connector *connector;
947         struct radeon_device *rdev = dev->dev_private;
948
949         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
950                 return 0;
951
952         console_lock();
953         pci_set_power_state(dev->pdev, PCI_D0);
954         pci_restore_state(dev->pdev);
955         if (pci_enable_device(dev->pdev)) {
956                 console_unlock();
957                 return -1;
958         }
959         /* resume AGP if in use */
960         radeon_agp_resume(rdev);
961         radeon_resume(rdev);
962         radeon_pm_resume(rdev);
963         radeon_restore_bios_scratch_regs(rdev);
964
965         radeon_fbdev_set_suspend(rdev, 0);
966         console_unlock();
967
968         /* init dig PHYs, disp eng pll */
969         if (rdev->is_atom_bios) {
970                 radeon_atom_encoder_init(rdev);
971                 radeon_atom_disp_eng_pll_init(rdev);
972         }
973         /* reset hpd state */
974         radeon_hpd_init(rdev);
975         /* blat the mode back in */
976         drm_helper_resume_force_mode(dev);
977         /* turn on display hw */
978         list_for_each_entry(connector, &dev->mode_config.connector_list, head) {
979                 drm_helper_connector_dpms(connector, DRM_MODE_DPMS_ON);
980         }
981
982         drm_kms_helper_poll_enable(dev);
983         return 0;
984 }
985
986 int radeon_gpu_reset(struct radeon_device *rdev)
987 {
988         int r;
989         int resched;
990
991         radeon_save_bios_scratch_regs(rdev);
992         /* block TTM */
993         resched = ttm_bo_lock_delayed_workqueue(&rdev->mman.bdev);
994         radeon_suspend(rdev);
995
996         r = radeon_asic_reset(rdev);
997         if (!r) {
998                 dev_info(rdev->dev, "GPU reset succeed\n");
999                 radeon_resume(rdev);
1000                 radeon_restore_bios_scratch_regs(rdev);
1001                 drm_helper_resume_force_mode(rdev->ddev);
1002                 ttm_bo_unlock_delayed_workqueue(&rdev->mman.bdev, resched);
1003         }
1004
1005         if (r) {
1006                 /* bad news, how to tell it to userspace ? */
1007                 dev_info(rdev->dev, "GPU reset failed\n");
1008         }
1009
1010         return r;
1011 }
1012
1013
1014 /*
1015  * Debugfs
1016  */
1017 int radeon_debugfs_add_files(struct radeon_device *rdev,
1018                              struct drm_info_list *files,
1019                              unsigned nfiles)
1020 {
1021         unsigned i;
1022
1023         for (i = 0; i < rdev->debugfs_count; i++) {
1024                 if (rdev->debugfs[i].files == files) {
1025                         /* Already registered */
1026                         return 0;
1027                 }
1028         }
1029
1030         i = rdev->debugfs_count + 1;
1031         if (i > RADEON_DEBUGFS_MAX_COMPONENTS) {
1032                 DRM_ERROR("Reached maximum number of debugfs components.\n");
1033                 DRM_ERROR("Report so we increase "
1034                           "RADEON_DEBUGFS_MAX_COMPONENTS.\n");
1035                 return -EINVAL;
1036         }
1037         rdev->debugfs[rdev->debugfs_count].files = files;
1038         rdev->debugfs[rdev->debugfs_count].num_files = nfiles;
1039         rdev->debugfs_count = i;
1040 #if defined(CONFIG_DEBUG_FS)
1041         drm_debugfs_create_files(files, nfiles,
1042                                  rdev->ddev->control->debugfs_root,
1043                                  rdev->ddev->control);
1044         drm_debugfs_create_files(files, nfiles,
1045                                  rdev->ddev->primary->debugfs_root,
1046                                  rdev->ddev->primary);
1047 #endif
1048         return 0;
1049 }
1050
1051 static void radeon_debugfs_remove_files(struct radeon_device *rdev)
1052 {
1053 #if defined(CONFIG_DEBUG_FS)
1054         unsigned i;
1055
1056         for (i = 0; i < rdev->debugfs_count; i++) {
1057                 drm_debugfs_remove_files(rdev->debugfs[i].files,
1058                                          rdev->debugfs[i].num_files,
1059                                          rdev->ddev->control);
1060                 drm_debugfs_remove_files(rdev->debugfs[i].files,
1061                                          rdev->debugfs[i].num_files,
1062                                          rdev->ddev->primary);
1063         }
1064 #endif
1065 }
1066
1067 #if defined(CONFIG_DEBUG_FS)
1068 int radeon_debugfs_init(struct drm_minor *minor)
1069 {
1070         return 0;
1071 }
1072
1073 void radeon_debugfs_cleanup(struct drm_minor *minor)
1074 {
1075 }
1076 #endif