1/*
2 * Copyright 2008 Advanced Micro Devices, Inc.
3 * Copyright 2008 Red Hat Inc.
4 * Copyright 2009 Jerome Glisse.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
19 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22 * OTHER DEALINGS IN THE SOFTWARE.
23 *
24 * Authors: Dave Airlie
25 *          Alex Deucher
26 *          Jerome Glisse
27 */
28
29#include <linux/console.h>
30#include <linux/efi.h>
31#include <linux/pci.h>
32#include <linux/pm_runtime.h>
33#include <linux/slab.h>
34#include <linux/vga_switcheroo.h>
35#include <linux/vgaarb.h>
36
37#include <drm/drm_cache.h>
38#include <drm/drm_crtc_helper.h>
39#include <drm/drm_debugfs.h>
40#include <drm/drm_device.h>
41#include <drm/drm_file.h>
42#include <drm/drm_probe_helper.h>
43#include <drm/radeon_drm.h>
44
45#include "radeon_reg.h"
46#include "radeon.h"
47#include "atom.h"
48
49static const char radeon_family_name[][16] = {
50	"R100",
51	"RV100",
52	"RS100",
53	"RV200",
54	"RS200",
55	"R200",
56	"RV250",
57	"RS300",
58	"RV280",
59	"R300",
60	"R350",
61	"RV350",
62	"RV380",
63	"R420",
64	"R423",
65	"RV410",
66	"RS400",
67	"RS480",
68	"RS600",
69	"RS690",
70	"RS740",
71	"RV515",
72	"R520",
73	"RV530",
74	"RV560",
75	"RV570",
76	"R580",
77	"R600",
78	"RV610",
79	"RV630",
80	"RV670",
81	"RV620",
82	"RV635",
83	"RS780",
84	"RS880",
85	"RV770",
86	"RV730",
87	"RV710",
88	"RV740",
89	"CEDAR",
90	"REDWOOD",
91	"JUNIPER",
92	"CYPRESS",
93	"HEMLOCK",
94	"PALM",
95	"SUMO",
96	"SUMO2",
97	"BARTS",
98	"TURKS",
99	"CAICOS",
100	"CAYMAN",
101	"ARUBA",
102	"TAHITI",
103	"PITCAIRN",
104	"VERDE",
105	"OLAND",
106	"HAINAN",
107	"BONAIRE",
108	"KAVERI",
109	"KABINI",
110	"HAWAII",
111	"MULLINS",
112	"LAST",
113};
114
115#if defined(CONFIG_VGA_SWITCHEROO)
116bool radeon_has_atpx_dgpu_power_cntl(void);
117bool radeon_is_atpx_hybrid(void);
118#else
119static inline bool radeon_has_atpx_dgpu_power_cntl(void) { return false; }
120static inline bool radeon_is_atpx_hybrid(void) { return false; }
121#endif
122
123#define RADEON_PX_QUIRK_DISABLE_PX  (1 << 0)
124
125struct radeon_px_quirk {
126	u32 chip_vendor;
127	u32 chip_device;
128	u32 subsys_vendor;
129	u32 subsys_device;
130	u32 px_quirk_flags;
131};
132
133static struct radeon_px_quirk radeon_px_quirk_list[] = {
134	/* Acer aspire 5560g (CPU: AMD A4-3305M; GPU: AMD Radeon HD 6480g + 7470m)
135	 * https://bugzilla.kernel.org/show_bug.cgi?id=74551
136	 */
137	{ PCI_VENDOR_ID_ATI, 0x6760, 0x1025, 0x0672, RADEON_PX_QUIRK_DISABLE_PX },
138	/* Asus K73TA laptop with AMD A6-3400M APU and Radeon 6550 GPU
139	 * https://bugzilla.kernel.org/show_bug.cgi?id=51381
140	 */
141	{ PCI_VENDOR_ID_ATI, 0x6741, 0x1043, 0x108c, RADEON_PX_QUIRK_DISABLE_PX },
142	/* Asus K53TK laptop with AMD A6-3420M APU and Radeon 7670m GPU
143	 * https://bugzilla.kernel.org/show_bug.cgi?id=51381
144	 */
145	{ PCI_VENDOR_ID_ATI, 0x6840, 0x1043, 0x2122, RADEON_PX_QUIRK_DISABLE_PX },
146	/* Asus K53TK laptop with AMD A6-3420M APU and Radeon 7670m GPU
147	 * https://bugs.freedesktop.org/show_bug.cgi?id=101491
148	 */
149	{ PCI_VENDOR_ID_ATI, 0x6741, 0x1043, 0x2122, RADEON_PX_QUIRK_DISABLE_PX },
150	/* Asus K73TK laptop with AMD A6-3420M APU and Radeon 7670m GPU
151	 * https://bugzilla.kernel.org/show_bug.cgi?id=51381#c52
152	 */
153	{ PCI_VENDOR_ID_ATI, 0x6840, 0x1043, 0x2123, RADEON_PX_QUIRK_DISABLE_PX },
154	{ 0, 0, 0, 0, 0 },
155};
156
157bool radeon_is_px(struct drm_device *dev)
158{
159	struct radeon_device *rdev = dev->dev_private;
160
161	if (rdev->flags & RADEON_IS_PX)
162		return true;
163	return false;
164}
165
166static void radeon_device_handle_px_quirks(struct radeon_device *rdev)
167{
168	struct radeon_px_quirk *p = radeon_px_quirk_list;
169
170	/* Apply PX quirks */
171	while (p && p->chip_device != 0) {
172		if (rdev->pdev->vendor == p->chip_vendor &&
173		    rdev->pdev->device == p->chip_device &&
174		    rdev->pdev->subsystem_vendor == p->subsys_vendor &&
175		    rdev->pdev->subsystem_device == p->subsys_device) {
176			rdev->px_quirk_flags = p->px_quirk_flags;
177			break;
178		}
179		++p;
180	}
181
182	if (rdev->px_quirk_flags & RADEON_PX_QUIRK_DISABLE_PX)
183		rdev->flags &= ~RADEON_IS_PX;
184
185	/* disable PX is the system doesn't support dGPU power control or hybrid gfx */
186	if (!radeon_is_atpx_hybrid() &&
187	    !radeon_has_atpx_dgpu_power_cntl())
188		rdev->flags &= ~RADEON_IS_PX;
189}
190
191/**
192 * radeon_program_register_sequence - program an array of registers.
193 *
194 * @rdev: radeon_device pointer
195 * @registers: pointer to the register array
196 * @array_size: size of the register array
197 *
198 * Programs an array or registers with and and or masks.
199 * This is a helper for setting golden registers.
200 */
201void radeon_program_register_sequence(struct radeon_device *rdev,
202				      const u32 *registers,
203				      const u32 array_size)
204{
205	u32 tmp, reg, and_mask, or_mask;
206	int i;
207
208	if (array_size % 3)
209		return;
210
211	for (i = 0; i < array_size; i +=3) {
212		reg = registers[i + 0];
213		and_mask = registers[i + 1];
214		or_mask = registers[i + 2];
215
216		if (and_mask == 0xffffffff) {
217			tmp = or_mask;
218		} else {
219			tmp = RREG32(reg);
220			tmp &= ~and_mask;
221			tmp |= or_mask;
222		}
223		WREG32(reg, tmp);
224	}
225}
226
227void radeon_pci_config_reset(struct radeon_device *rdev)
228{
229	pci_write_config_dword(rdev->pdev, 0x7c, RADEON_ASIC_RESET_DATA);
230}
231
232/**
233 * radeon_surface_init - Clear GPU surface registers.
234 *
235 * @rdev: radeon_device pointer
236 *
237 * Clear GPU surface registers (r1xx-r5xx).
238 */
239void radeon_surface_init(struct radeon_device *rdev)
240{
241	/* FIXME: check this out */
242	if (rdev->family < CHIP_R600) {
243		int i;
244
245		for (i = 0; i < RADEON_GEM_MAX_SURFACES; i++) {
246			if (rdev->surface_regs[i].bo)
247				radeon_bo_get_surface_reg(rdev->surface_regs[i].bo);
248			else
249				radeon_clear_surface_reg(rdev, i);
250		}
251		/* enable surfaces */
252		WREG32(RADEON_SURFACE_CNTL, 0);
253	}
254}
255
256/*
257 * GPU scratch registers helpers function.
258 */
259/**
260 * radeon_scratch_init - Init scratch register driver information.
261 *
262 * @rdev: radeon_device pointer
263 *
264 * Init CP scratch register driver information (r1xx-r5xx)
265 */
266void radeon_scratch_init(struct radeon_device *rdev)
267{
268	int i;
269
270	/* FIXME: check this out */
271	if (rdev->family < CHIP_R300) {
272		rdev->scratch.num_reg = 5;
273	} else {
274		rdev->scratch.num_reg = 7;
275	}
276	rdev->scratch.reg_base = RADEON_SCRATCH_REG0;
277	for (i = 0; i < rdev->scratch.num_reg; i++) {
278		rdev->scratch.free[i] = true;
279		rdev->scratch.reg[i] = rdev->scratch.reg_base + (i * 4);
280	}
281}
282
283/**
284 * radeon_scratch_get - Allocate a scratch register
285 *
286 * @rdev: radeon_device pointer
287 * @reg: scratch register mmio offset
288 *
289 * Allocate a CP scratch register for use by the driver (all asics).
290 * Returns 0 on success or -EINVAL on failure.
291 */
292int radeon_scratch_get(struct radeon_device *rdev, uint32_t *reg)
293{
294	int i;
295
296	for (i = 0; i < rdev->scratch.num_reg; i++) {
297		if (rdev->scratch.free[i]) {
298			rdev->scratch.free[i] = false;
299			*reg = rdev->scratch.reg[i];
300			return 0;
301		}
302	}
303	return -EINVAL;
304}
305
306/**
307 * radeon_scratch_free - Free a scratch register
308 *
309 * @rdev: radeon_device pointer
310 * @reg: scratch register mmio offset
311 *
312 * Free a CP scratch register allocated for use by the driver (all asics)
313 */
314void radeon_scratch_free(struct radeon_device *rdev, uint32_t reg)
315{
316	int i;
317
318	for (i = 0; i < rdev->scratch.num_reg; i++) {
319		if (rdev->scratch.reg[i] == reg) {
320			rdev->scratch.free[i] = true;
321			return;
322		}
323	}
324}
325
326/*
327 * GPU doorbell aperture helpers function.
328 */
329/**
330 * radeon_doorbell_init - Init doorbell driver information.
331 *
332 * @rdev: radeon_device pointer
333 *
334 * Init doorbell driver information (CIK)
335 * Returns 0 on success, error on failure.
336 */
337static int radeon_doorbell_init(struct radeon_device *rdev)
338{
339	/* doorbell bar mapping */
340	rdev->doorbell.base = pci_resource_start(rdev->pdev, 2);
341	rdev->doorbell.size = pci_resource_len(rdev->pdev, 2);
342
343	rdev->doorbell.num_doorbells = min_t(u32, rdev->doorbell.size / sizeof(u32), RADEON_MAX_DOORBELLS);
344	if (rdev->doorbell.num_doorbells == 0)
345		return -EINVAL;
346
347	rdev->doorbell.ptr = ioremap(rdev->doorbell.base, rdev->doorbell.num_doorbells * sizeof(u32));
348	if (rdev->doorbell.ptr == NULL) {
349		return -ENOMEM;
350	}
351	DRM_INFO("doorbell mmio base: 0x%08X\n", (uint32_t)rdev->doorbell.base);
352	DRM_INFO("doorbell mmio size: %u\n", (unsigned)rdev->doorbell.size);
353
354	memset(&rdev->doorbell.used, 0, sizeof(rdev->doorbell.used));
355
356	return 0;
357}
358
359/**
360 * radeon_doorbell_fini - Tear down doorbell driver information.
361 *
362 * @rdev: radeon_device pointer
363 *
364 * Tear down doorbell driver information (CIK)
365 */
366static void radeon_doorbell_fini(struct radeon_device *rdev)
367{
368	iounmap(rdev->doorbell.ptr);
369	rdev->doorbell.ptr = NULL;
370}
371
372/**
373 * radeon_doorbell_get - Allocate a doorbell entry
374 *
375 * @rdev: radeon_device pointer
376 * @doorbell: doorbell index
377 *
378 * Allocate a doorbell for use by the driver (all asics).
379 * Returns 0 on success or -EINVAL on failure.
380 */
381int radeon_doorbell_get(struct radeon_device *rdev, u32 *doorbell)
382{
383	unsigned long offset = find_first_zero_bit(rdev->doorbell.used, rdev->doorbell.num_doorbells);
384	if (offset < rdev->doorbell.num_doorbells) {
385		__set_bit(offset, rdev->doorbell.used);
386		*doorbell = offset;
387		return 0;
388	} else {
389		return -EINVAL;
390	}
391}
392
393/**
394 * radeon_doorbell_free - Free a doorbell entry
395 *
396 * @rdev: radeon_device pointer
397 * @doorbell: doorbell index
398 *
399 * Free a doorbell allocated for use by the driver (all asics)
400 */
401void radeon_doorbell_free(struct radeon_device *rdev, u32 doorbell)
402{
403	if (doorbell < rdev->doorbell.num_doorbells)
404		__clear_bit(doorbell, rdev->doorbell.used);
405}
406
407/*
408 * radeon_wb_*()
409 * Writeback is the the method by which the the GPU updates special pages
410 * in memory with the status of certain GPU events (fences, ring pointers,
411 * etc.).
412 */
413
414/**
415 * radeon_wb_disable - Disable Writeback
416 *
417 * @rdev: radeon_device pointer
418 *
419 * Disables Writeback (all asics).  Used for suspend.
420 */
421void radeon_wb_disable(struct radeon_device *rdev)
422{
423	rdev->wb.enabled = false;
424}
425
426/**
427 * radeon_wb_fini - Disable Writeback and free memory
428 *
429 * @rdev: radeon_device pointer
430 *
431 * Disables Writeback and frees the Writeback memory (all asics).
432 * Used at driver shutdown.
433 */
434void radeon_wb_fini(struct radeon_device *rdev)
435{
436	radeon_wb_disable(rdev);
437	if (rdev->wb.wb_obj) {
438		if (!radeon_bo_reserve(rdev->wb.wb_obj, false)) {
439			radeon_bo_kunmap(rdev->wb.wb_obj);
440			radeon_bo_unpin(rdev->wb.wb_obj);
441			radeon_bo_unreserve(rdev->wb.wb_obj);
442		}
443		radeon_bo_unref(&rdev->wb.wb_obj);
444		rdev->wb.wb = NULL;
445		rdev->wb.wb_obj = NULL;
446	}
447}
448
449/**
450 * radeon_wb_init- Init Writeback driver info and allocate memory
451 *
452 * @rdev: radeon_device pointer
453 *
454 * Disables Writeback and frees the Writeback memory (all asics).
455 * Used at driver startup.
456 * Returns 0 on success or an -error on failure.
457 */
458int radeon_wb_init(struct radeon_device *rdev)
459{
460	int r;
461
462	if (rdev->wb.wb_obj == NULL) {
463		r = radeon_bo_create(rdev, RADEON_GPU_PAGE_SIZE, PAGE_SIZE, true,
464				     RADEON_GEM_DOMAIN_GTT, 0, NULL, NULL,
465				     &rdev->wb.wb_obj);
466		if (r) {
467			dev_warn(rdev->dev, "(%d) create WB bo failed\n", r);
468			return r;
469		}
470		r = radeon_bo_reserve(rdev->wb.wb_obj, false);
471		if (unlikely(r != 0)) {
472			radeon_wb_fini(rdev);
473			return r;
474		}
475		r = radeon_bo_pin(rdev->wb.wb_obj, RADEON_GEM_DOMAIN_GTT,
476				&rdev->wb.gpu_addr);
477		if (r) {
478			radeon_bo_unreserve(rdev->wb.wb_obj);
479			dev_warn(rdev->dev, "(%d) pin WB bo failed\n", r);
480			radeon_wb_fini(rdev);
481			return r;
482		}
483		r = radeon_bo_kmap(rdev->wb.wb_obj, (void **)&rdev->wb.wb);
484		radeon_bo_unreserve(rdev->wb.wb_obj);
485		if (r) {
486			dev_warn(rdev->dev, "(%d) map WB bo failed\n", r);
487			radeon_wb_fini(rdev);
488			return r;
489		}
490	}
491
492	/* clear wb memory */
493	memset((char *)rdev->wb.wb, 0, RADEON_GPU_PAGE_SIZE);
494	/* disable event_write fences */
495	rdev->wb.use_event = false;
496	/* disabled via module param */
497	if (radeon_no_wb == 1) {
498		rdev->wb.enabled = false;
499	} else {
500		if (rdev->flags & RADEON_IS_AGP) {
501			/* often unreliable on AGP */
502			rdev->wb.enabled = false;
503		} else if (rdev->family < CHIP_R300) {
504			/* often unreliable on pre-r300 */
505			rdev->wb.enabled = false;
506		} else {
507			rdev->wb.enabled = true;
508			/* event_write fences are only available on r600+ */
509			if (rdev->family >= CHIP_R600) {
510				rdev->wb.use_event = true;
511			}
512		}
513	}
514	/* always use writeback/events on NI, APUs */
515	if (rdev->family >= CHIP_PALM) {
516		rdev->wb.enabled = true;
517		rdev->wb.use_event = true;
518	}
519
520	dev_info(rdev->dev, "WB %sabled\n", rdev->wb.enabled ? "en" : "dis");
521
522	return 0;
523}
524
525/**
526 * radeon_vram_location - try to find VRAM location
527 * @rdev: radeon device structure holding all necessary informations
528 * @mc: memory controller structure holding memory informations
529 * @base: base address at which to put VRAM
530 *
531 * Function will place try to place VRAM at base address provided
532 * as parameter (which is so far either PCI aperture address or
533 * for IGP TOM base address).
534 *
535 * If there is not enough space to fit the unvisible VRAM in the 32bits
536 * address space then we limit the VRAM size to the aperture.
537 *
538 * If we are using AGP and if the AGP aperture doesn't allow us to have
539 * room for all the VRAM than we restrict the VRAM to the PCI aperture
540 * size and print a warning.
541 *
542 * This function will never fails, worst case are limiting VRAM.
543 *
544 * Note: GTT start, end, size should be initialized before calling this
545 * function on AGP platform.
546 *
547 * Note: We don't explicitly enforce VRAM start to be aligned on VRAM size,
548 * this shouldn't be a problem as we are using the PCI aperture as a reference.
549 * Otherwise this would be needed for rv280, all r3xx, and all r4xx, but
550 * not IGP.
551 *
552 * Note: we use mc_vram_size as on some board we need to program the mc to
553 * cover the whole aperture even if VRAM size is inferior to aperture size
554 * Novell bug 204882 + along with lots of ubuntu ones
555 *
556 * Note: when limiting vram it's safe to overwritte real_vram_size because
557 * we are not in case where real_vram_size is inferior to mc_vram_size (ie
558 * note afected by bogus hw of Novell bug 204882 + along with lots of ubuntu
559 * ones)
560 *
561 * Note: IGP TOM addr should be the same as the aperture addr, we don't
562 * explicitly check for that thought.
563 *
564 * FIXME: when reducing VRAM size align new size on power of 2.
565 */
566void radeon_vram_location(struct radeon_device *rdev, struct radeon_mc *mc, u64 base)
567{
568	uint64_t limit = (uint64_t)radeon_vram_limit << 20;
569
570	mc->vram_start = base;
571	if (mc->mc_vram_size > (rdev->mc.mc_mask - base + 1)) {
572		dev_warn(rdev->dev, "limiting VRAM to PCI aperture size\n");
573		mc->real_vram_size = mc->aper_size;
574		mc->mc_vram_size = mc->aper_size;
575	}
576	mc->vram_end = mc->vram_start + mc->mc_vram_size - 1;
577	if (rdev->flags & RADEON_IS_AGP && mc->vram_end > mc->gtt_start && mc->vram_start <= mc->gtt_end) {
578		dev_warn(rdev->dev, "limiting VRAM to PCI aperture size\n");
579		mc->real_vram_size = mc->aper_size;
580		mc->mc_vram_size = mc->aper_size;
581	}
582	mc->vram_end = mc->vram_start + mc->mc_vram_size - 1;
583	if (limit && limit < mc->real_vram_size)
584		mc->real_vram_size = limit;
585	dev_info(rdev->dev, "VRAM: %lluM 0x%016llX - 0x%016llX (%lluM used)\n",
586			mc->mc_vram_size >> 20, mc->vram_start,
587			mc->vram_end, mc->real_vram_size >> 20);
588}
589
590/**
591 * radeon_gtt_location - try to find GTT location
592 * @rdev: radeon device structure holding all necessary informations
593 * @mc: memory controller structure holding memory informations
594 *
595 * Function will place try to place GTT before or after VRAM.
596 *
597 * If GTT size is bigger than space left then we ajust GTT size.
598 * Thus function will never fails.
599 *
600 * FIXME: when reducing GTT size align new size on power of 2.
601 */
602void radeon_gtt_location(struct radeon_device *rdev, struct radeon_mc *mc)
603{
604	u64 size_af, size_bf;
605
606	size_af = ((rdev->mc.mc_mask - mc->vram_end) + mc->gtt_base_align) & ~mc->gtt_base_align;
607	size_bf = mc->vram_start & ~mc->gtt_base_align;
608	if (size_bf > size_af) {
609		if (mc->gtt_size > size_bf) {
610			dev_warn(rdev->dev, "limiting GTT\n");
611			mc->gtt_size = size_bf;
612		}
613		mc->gtt_start = (mc->vram_start & ~mc->gtt_base_align) - mc->gtt_size;
614	} else {
615		if (mc->gtt_size > size_af) {
616			dev_warn(rdev->dev, "limiting GTT\n");
617			mc->gtt_size = size_af;
618		}
619		mc->gtt_start = (mc->vram_end + 1 + mc->gtt_base_align) & ~mc->gtt_base_align;
620	}
621	mc->gtt_end = mc->gtt_start + mc->gtt_size - 1;
622	dev_info(rdev->dev, "GTT: %lluM 0x%016llX - 0x%016llX\n",
623			mc->gtt_size >> 20, mc->gtt_start, mc->gtt_end);
624}
625
626/*
627 * GPU helpers function.
628 */
629
630/**
631 * radeon_device_is_virtual - check if we are running is a virtual environment
632 *
633 * Check if the asic has been passed through to a VM (all asics).
634 * Used at driver startup.
635 * Returns true if virtual or false if not.
636 */
637bool radeon_device_is_virtual(void)
638{
639#ifdef CONFIG_X86
640	return boot_cpu_has(X86_FEATURE_HYPERVISOR);
641#else
642	return false;
643#endif
644}
645
646/**
647 * radeon_card_posted - check if the hw has already been initialized
648 *
649 * @rdev: radeon_device pointer
650 *
651 * Check if the asic has been initialized (all asics).
652 * Used at driver startup.
653 * Returns true if initialized or false if not.
654 */
655bool radeon_card_posted(struct radeon_device *rdev)
656{
657	uint32_t reg;
658
659	/* for pass through, always force asic_init for CI */
660	if (rdev->family >= CHIP_BONAIRE &&
661	    radeon_device_is_virtual())
662		return false;
663
664	/* required for EFI mode on macbook2,1 which uses an r5xx asic */
665	if (efi_enabled(EFI_BOOT) &&
666	    (rdev->pdev->subsystem_vendor == PCI_VENDOR_ID_APPLE) &&
667	    (rdev->family < CHIP_R600))
668		return false;
669
670	if (ASIC_IS_NODCE(rdev))
671		goto check_memsize;
672
673	/* first check CRTCs */
674	if (ASIC_IS_DCE4(rdev)) {
675		reg = RREG32(EVERGREEN_CRTC_CONTROL + EVERGREEN_CRTC0_REGISTER_OFFSET) |
676			RREG32(EVERGREEN_CRTC_CONTROL + EVERGREEN_CRTC1_REGISTER_OFFSET);
677			if (rdev->num_crtc >= 4) {
678				reg |= RREG32(EVERGREEN_CRTC_CONTROL + EVERGREEN_CRTC2_REGISTER_OFFSET) |
679					RREG32(EVERGREEN_CRTC_CONTROL + EVERGREEN_CRTC3_REGISTER_OFFSET);
680			}
681			if (rdev->num_crtc >= 6) {
682				reg |= RREG32(EVERGREEN_CRTC_CONTROL + EVERGREEN_CRTC4_REGISTER_OFFSET) |
683					RREG32(EVERGREEN_CRTC_CONTROL + EVERGREEN_CRTC5_REGISTER_OFFSET);
684			}
685		if (reg & EVERGREEN_CRTC_MASTER_EN)
686			return true;
687	} else if (ASIC_IS_AVIVO(rdev)) {
688		reg = RREG32(AVIVO_D1CRTC_CONTROL) |
689		      RREG32(AVIVO_D2CRTC_CONTROL);
690		if (reg & AVIVO_CRTC_EN) {
691			return true;
692		}
693	} else {
694		reg = RREG32(RADEON_CRTC_GEN_CNTL) |
695		      RREG32(RADEON_CRTC2_GEN_CNTL);
696		if (reg & RADEON_CRTC_EN) {
697			return true;
698		}
699	}
700
701check_memsize:
702	/* then check MEM_SIZE, in case the crtcs are off */
703	if (rdev->family >= CHIP_R600)
704		reg = RREG32(R600_CONFIG_MEMSIZE);
705	else
706		reg = RREG32(RADEON_CONFIG_MEMSIZE);
707
708	if (reg)
709		return true;
710
711	return false;
712
713}
714
715/**
716 * radeon_update_bandwidth_info - update display bandwidth params
717 *
718 * @rdev: radeon_device pointer
719 *
720 * Used when sclk/mclk are switched or display modes are set.
721 * params are used to calculate display watermarks (all asics)
722 */
723void radeon_update_bandwidth_info(struct radeon_device *rdev)
724{
725	fixed20_12 a;
726	u32 sclk = rdev->pm.current_sclk;
727	u32 mclk = rdev->pm.current_mclk;
728
729	/* sclk/mclk in Mhz */
730	a.full = dfixed_const(100);
731	rdev->pm.sclk.full = dfixed_const(sclk);
732	rdev->pm.sclk.full = dfixed_div(rdev->pm.sclk, a);
733	rdev->pm.mclk.full = dfixed_const(mclk);
734	rdev->pm.mclk.full = dfixed_div(rdev->pm.mclk, a);
735
736	if (rdev->flags & RADEON_IS_IGP) {
737		a.full = dfixed_const(16);
738		/* core_bandwidth = sclk(Mhz) * 16 */
739		rdev->pm.core_bandwidth.full = dfixed_div(rdev->pm.sclk, a);
740	}
741}
742
743/**
744 * radeon_boot_test_post_card - check and possibly initialize the hw
745 *
746 * @rdev: radeon_device pointer
747 *
748 * Check if the asic is initialized and if not, attempt to initialize
749 * it (all asics).
750 * Returns true if initialized or false if not.
751 */
752bool radeon_boot_test_post_card(struct radeon_device *rdev)
753{
754	if (radeon_card_posted(rdev))
755		return true;
756
757	if (rdev->bios) {
758		DRM_INFO("GPU not posted. posting now...\n");
759		if (rdev->is_atom_bios)
760			atom_asic_init(rdev->mode_info.atom_context);
761		else
762			radeon_combios_asic_init(rdev->ddev);
763		return true;
764	} else {
765		dev_err(rdev->dev, "Card not posted and no BIOS - ignoring\n");
766		return false;
767	}
768}
769
770/**
771 * radeon_dummy_page_init - init dummy page used by the driver
772 *
773 * @rdev: radeon_device pointer
774 *
775 * Allocate the dummy page used by the driver (all asics).
776 * This dummy page is used by the driver as a filler for gart entries
777 * when pages are taken out of the GART
778 * Returns 0 on sucess, -ENOMEM on failure.
779 */
780int radeon_dummy_page_init(struct radeon_device *rdev)
781{
782	if (rdev->dummy_page.page)
783		return 0;
784	rdev->dummy_page.page = alloc_page(GFP_DMA32 | GFP_KERNEL | __GFP_ZERO);
785	if (rdev->dummy_page.page == NULL)
786		return -ENOMEM;
787	rdev->dummy_page.addr = pci_map_page(rdev->pdev, rdev->dummy_page.page,
788					0, PAGE_SIZE, PCI_DMA_BIDIRECTIONAL);
789	if (pci_dma_mapping_error(rdev->pdev, rdev->dummy_page.addr)) {
790		dev_err(&rdev->pdev->dev, "Failed to DMA MAP the dummy page\n");
791		__free_page(rdev->dummy_page.page);
792		rdev->dummy_page.page = NULL;
793		return -ENOMEM;
794	}
795	rdev->dummy_page.entry = radeon_gart_get_page_entry(rdev->dummy_page.addr,
796							    RADEON_GART_PAGE_DUMMY);
797	return 0;
798}
799
800/**
801 * radeon_dummy_page_fini - free dummy page used by the driver
802 *
803 * @rdev: radeon_device pointer
804 *
805 * Frees the dummy page used by the driver (all asics).
806 */
807void radeon_dummy_page_fini(struct radeon_device *rdev)
808{
809	if (rdev->dummy_page.page == NULL)
810		return;
811	pci_unmap_page(rdev->pdev, rdev->dummy_page.addr,
812			PAGE_SIZE, PCI_DMA_BIDIRECTIONAL);
813	__free_page(rdev->dummy_page.page);
814	rdev->dummy_page.page = NULL;
815}
816
817
818/* ATOM accessor methods */
819/*
820 * ATOM is an interpreted byte code stored in tables in the vbios.  The
821 * driver registers callbacks to access registers and the interpreter
822 * in the driver parses the tables and executes then to program specific
823 * actions (set display modes, asic init, etc.).  See radeon_atombios.c,
824 * atombios.h, and atom.c
825 */
826
827/**
828 * cail_pll_read - read PLL register
829 *
830 * @info: atom card_info pointer
831 * @reg: PLL register offset
832 *
833 * Provides a PLL register accessor for the atom interpreter (r4xx+).
834 * Returns the value of the PLL register.
835 */
836static uint32_t cail_pll_read(struct card_info *info, uint32_t reg)
837{
838	struct radeon_device *rdev = info->dev->dev_private;
839	uint32_t r;
840
841	r = rdev->pll_rreg(rdev, reg);
842	return r;
843}
844
845/**
846 * cail_pll_write - write PLL register
847 *
848 * @info: atom card_info pointer
849 * @reg: PLL register offset
850 * @val: value to write to the pll register
851 *
852 * Provides a PLL register accessor for the atom interpreter (r4xx+).
853 */
854static void cail_pll_write(struct card_info *info, uint32_t reg, uint32_t val)
855{
856	struct radeon_device *rdev = info->dev->dev_private;
857
858	rdev->pll_wreg(rdev, reg, val);
859}
860
861/**
862 * cail_mc_read - read MC (Memory Controller) register
863 *
864 * @info: atom card_info pointer
865 * @reg: MC register offset
866 *
867 * Provides an MC register accessor for the atom interpreter (r4xx+).
868 * Returns the value of the MC register.
869 */
870static uint32_t cail_mc_read(struct card_info *info, uint32_t reg)
871{
872	struct radeon_device *rdev = info->dev->dev_private;
873	uint32_t r;
874
875	r = rdev->mc_rreg(rdev, reg);
876	return r;
877}
878
879/**
880 * cail_mc_write - write MC (Memory Controller) register
881 *
882 * @info: atom card_info pointer
883 * @reg: MC register offset
884 * @val: value to write to the pll register
885 *
886 * Provides a MC register accessor for the atom interpreter (r4xx+).
887 */
888static void cail_mc_write(struct card_info *info, uint32_t reg, uint32_t val)
889{
890	struct radeon_device *rdev = info->dev->dev_private;
891
892	rdev->mc_wreg(rdev, reg, val);
893}
894
895/**
896 * cail_reg_write - write MMIO register
897 *
898 * @info: atom card_info pointer
899 * @reg: MMIO register offset
900 * @val: value to write to the pll register
901 *
902 * Provides a MMIO register accessor for the atom interpreter (r4xx+).
903 */
904static void cail_reg_write(struct card_info *info, uint32_t reg, uint32_t val)
905{
906	struct radeon_device *rdev = info->dev->dev_private;
907
908	WREG32(reg*4, val);
909}
910
911/**
912 * cail_reg_read - read MMIO register
913 *
914 * @info: atom card_info pointer
915 * @reg: MMIO register offset
916 *
917 * Provides an MMIO register accessor for the atom interpreter (r4xx+).
918 * Returns the value of the MMIO register.
919 */
920static uint32_t cail_reg_read(struct card_info *info, uint32_t reg)
921{
922	struct radeon_device *rdev = info->dev->dev_private;
923	uint32_t r;
924
925	r = RREG32(reg*4);
926	return r;
927}
928
929/**
930 * cail_ioreg_write - write IO register
931 *
932 * @info: atom card_info pointer
933 * @reg: IO register offset
934 * @val: value to write to the pll register
935 *
936 * Provides a IO register accessor for the atom interpreter (r4xx+).
937 */
938static void cail_ioreg_write(struct card_info *info, uint32_t reg, uint32_t val)
939{
940	struct radeon_device *rdev = info->dev->dev_private;
941
942	WREG32_IO(reg*4, val);
943}
944
945/**
946 * cail_ioreg_read - read IO register
947 *
948 * @info: atom card_info pointer
949 * @reg: IO register offset
950 *
951 * Provides an IO register accessor for the atom interpreter (r4xx+).
952 * Returns the value of the IO register.
953 */
954static uint32_t cail_ioreg_read(struct card_info *info, uint32_t reg)
955{
956	struct radeon_device *rdev = info->dev->dev_private;
957	uint32_t r;
958
959	r = RREG32_IO(reg*4);
960	return r;
961}
962
963/**
964 * radeon_atombios_init - init the driver info and callbacks for atombios
965 *
966 * @rdev: radeon_device pointer
967 *
968 * Initializes the driver info and register access callbacks for the
969 * ATOM interpreter (r4xx+).
970 * Returns 0 on sucess, -ENOMEM on failure.
971 * Called at driver startup.
972 */
973int radeon_atombios_init(struct radeon_device *rdev)
974{
975	struct card_info *atom_card_info =
976	    kzalloc(sizeof(struct card_info), GFP_KERNEL);
977
978	if (!atom_card_info)
979		return -ENOMEM;
980
981	rdev->mode_info.atom_card_info = atom_card_info;
982	atom_card_info->dev = rdev->ddev;
983	atom_card_info->reg_read = cail_reg_read;
984	atom_card_info->reg_write = cail_reg_write;
985	/* needed for iio ops */
986	if (rdev->rio_mem) {
987		atom_card_info->ioreg_read = cail_ioreg_read;
988		atom_card_info->ioreg_write = cail_ioreg_write;
989	} else {
990		DRM_ERROR("Unable to find PCI I/O BAR; using MMIO for ATOM IIO\n");
991		atom_card_info->ioreg_read = cail_reg_read;
992		atom_card_info->ioreg_write = cail_reg_write;
993	}
994	atom_card_info->mc_read = cail_mc_read;
995	atom_card_info->mc_write = cail_mc_write;
996	atom_card_info->pll_read = cail_pll_read;
997	atom_card_info->pll_write = cail_pll_write;
998
999	rdev->mode_info.atom_context = atom_parse(atom_card_info, rdev->bios);
1000	if (!rdev->mode_info.atom_context) {
1001		radeon_atombios_fini(rdev);
1002		return -ENOMEM;
1003	}
1004
1005	mutex_init(&rdev->mode_info.atom_context->mutex);
1006	mutex_init(&rdev->mode_info.atom_context->scratch_mutex);
1007	radeon_atom_initialize_bios_scratch_regs(rdev->ddev);
1008	atom_allocate_fb_scratch(rdev->mode_info.atom_context);
1009	return 0;
1010}
1011
1012/**
1013 * radeon_atombios_fini - free the driver info and callbacks for atombios
1014 *
1015 * @rdev: radeon_device pointer
1016 *
1017 * Frees the driver info and register access callbacks for the ATOM
1018 * interpreter (r4xx+).
1019 * Called at driver shutdown.
1020 */
1021void radeon_atombios_fini(struct radeon_device *rdev)
1022{
1023	if (rdev->mode_info.atom_context) {
1024		kfree(rdev->mode_info.atom_context->scratch);
1025		kfree(rdev->mode_info.atom_context->iio);
1026	}
1027	kfree(rdev->mode_info.atom_context);
1028	rdev->mode_info.atom_context = NULL;
1029	kfree(rdev->mode_info.atom_card_info);
1030	rdev->mode_info.atom_card_info = NULL;
1031}
1032
1033/* COMBIOS */
1034/*
1035 * COMBIOS is the bios format prior to ATOM. It provides
1036 * command tables similar to ATOM, but doesn't have a unified
1037 * parser.  See radeon_combios.c
1038 */
1039
1040/**
1041 * radeon_combios_init - init the driver info for combios
1042 *
1043 * @rdev: radeon_device pointer
1044 *
1045 * Initializes the driver info for combios (r1xx-r3xx).
1046 * Returns 0 on sucess.
1047 * Called at driver startup.
1048 */
1049int radeon_combios_init(struct radeon_device *rdev)
1050{
1051	radeon_combios_initialize_bios_scratch_regs(rdev->ddev);
1052	return 0;
1053}
1054
1055/**
1056 * radeon_combios_fini - free the driver info for combios
1057 *
1058 * @rdev: radeon_device pointer
1059 *
1060 * Frees the driver info for combios (r1xx-r3xx).
1061 * Called at driver shutdown.
1062 */
1063void radeon_combios_fini(struct radeon_device *rdev)
1064{
1065}
1066
1067/* if we get transitioned to only one device, take VGA back */
1068/**
1069 * radeon_vga_set_decode - enable/disable vga decode
1070 *
1071 * @cookie: radeon_device pointer
1072 * @state: enable/disable vga decode
1073 *
1074 * Enable/disable vga decode (all asics).
1075 * Returns VGA resource flags.
1076 */
1077static unsigned int radeon_vga_set_decode(void *cookie, bool state)
1078{
1079	struct radeon_device *rdev = cookie;
1080	radeon_vga_set_state(rdev, state);
1081	if (state)
1082		return VGA_RSRC_LEGACY_IO | VGA_RSRC_LEGACY_MEM |
1083		       VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
1084	else
1085		return VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
1086}
1087
1088/**
1089 * radeon_check_pot_argument - check that argument is a power of two
1090 *
1091 * @arg: value to check
1092 *
1093 * Validates that a certain argument is a power of two (all asics).
1094 * Returns true if argument is valid.
1095 */
1096static bool radeon_check_pot_argument(int arg)
1097{
1098	return (arg & (arg - 1)) == 0;
1099}
1100
1101/**
1102 * Determine a sensible default GART size according to ASIC family.
1103 *
1104 * @family ASIC family name
1105 */
1106static int radeon_gart_size_auto(enum radeon_family family)
1107{
1108	/* default to a larger gart size on newer asics */
1109	if (family >= CHIP_TAHITI)
1110		return 2048;
1111	else if (family >= CHIP_RV770)
1112		return 1024;
1113	else
1114		return 512;
1115}
1116
1117/**
1118 * radeon_check_arguments - validate module params
1119 *
1120 * @rdev: radeon_device pointer
1121 *
1122 * Validates certain module parameters and updates
1123 * the associated values used by the driver (all asics).
1124 */
1125static void radeon_check_arguments(struct radeon_device *rdev)
1126{
1127	/* vramlimit must be a power of two */
1128	if (!radeon_check_pot_argument(radeon_vram_limit)) {
1129		dev_warn(rdev->dev, "vram limit (%d) must be a power of 2\n",
1130				radeon_vram_limit);
1131		radeon_vram_limit = 0;
1132	}
1133
1134	if (radeon_gart_size == -1) {
1135		radeon_gart_size = radeon_gart_size_auto(rdev->family);
1136	}
1137	/* gtt size must be power of two and greater or equal to 32M */
1138	if (radeon_gart_size < 32) {
1139		dev_warn(rdev->dev, "gart size (%d) too small\n",
1140				radeon_gart_size);
1141		radeon_gart_size = radeon_gart_size_auto(rdev->family);
1142	} else if (!radeon_check_pot_argument(radeon_gart_size)) {
1143		dev_warn(rdev->dev, "gart size (%d) must be a power of 2\n",
1144				radeon_gart_size);
1145		radeon_gart_size = radeon_gart_size_auto(rdev->family);
1146	}
1147	rdev->mc.gtt_size = (uint64_t)radeon_gart_size << 20;
1148
1149	/* AGP mode can only be -1, 1, 2, 4, 8 */
1150	switch (radeon_agpmode) {
1151	case -1:
1152	case 0:
1153	case 1:
1154	case 2:
1155	case 4:
1156	case 8:
1157		break;
1158	default:
1159		dev_warn(rdev->dev, "invalid AGP mode %d (valid mode: "
1160				"-1, 0, 1, 2, 4, 8)\n", radeon_agpmode);
1161		radeon_agpmode = 0;
1162		break;
1163	}
1164
1165	if (!radeon_check_pot_argument(radeon_vm_size)) {
1166		dev_warn(rdev->dev, "VM size (%d) must be a power of 2\n",
1167			 radeon_vm_size);
1168		radeon_vm_size = 4;
1169	}
1170
1171	if (radeon_vm_size < 1) {
1172		dev_warn(rdev->dev, "VM size (%d) too small, min is 1GB\n",
1173			 radeon_vm_size);
1174		radeon_vm_size = 4;
1175	}
1176
1177	/*
1178	 * Max GPUVM size for Cayman, SI and CI are 40 bits.
1179	 */
1180	if (radeon_vm_size > 1024) {
1181		dev_warn(rdev->dev, "VM size (%d) too large, max is 1TB\n",
1182			 radeon_vm_size);
1183		radeon_vm_size = 4;
1184	}
1185
1186	/* defines number of bits in page table versus page directory,
1187	 * a page is 4KB so we have 12 bits offset, minimum 9 bits in the
1188	 * page table and the remaining bits are in the page directory */
1189	if (radeon_vm_block_size == -1) {
1190
1191		/* Total bits covered by PD + PTs */
1192		unsigned bits = ilog2(radeon_vm_size) + 18;
1193
1194		/* Make sure the PD is 4K in size up to 8GB address space.
1195		   Above that split equal between PD and PTs */
1196		if (radeon_vm_size <= 8)
1197			radeon_vm_block_size = bits - 9;
1198		else
1199			radeon_vm_block_size = (bits + 3) / 2;
1200
1201	} else if (radeon_vm_block_size < 9) {
1202		dev_warn(rdev->dev, "VM page table size (%d) too small\n",
1203			 radeon_vm_block_size);
1204		radeon_vm_block_size = 9;
1205	}
1206
1207	if (radeon_vm_block_size > 24 ||
1208	    (radeon_vm_size * 1024) < (1ull << radeon_vm_block_size)) {
1209		dev_warn(rdev->dev, "VM page table size (%d) too large\n",
1210			 radeon_vm_block_size);
1211		radeon_vm_block_size = 9;
1212	}
1213}
1214
1215/**
1216 * radeon_switcheroo_set_state - set switcheroo state
1217 *
1218 * @pdev: pci dev pointer
1219 * @state: vga_switcheroo state
1220 *
1221 * Callback for the switcheroo driver.  Suspends or resumes the
1222 * the asics before or after it is powered up using ACPI methods.
1223 */
1224static void radeon_switcheroo_set_state(struct pci_dev *pdev, enum vga_switcheroo_state state)
1225{
1226	struct drm_device *dev = pci_get_drvdata(pdev);
1227
1228	if (radeon_is_px(dev) && state == VGA_SWITCHEROO_OFF)
1229		return;
1230
1231	if (state == VGA_SWITCHEROO_ON) {
1232		pr_info("radeon: switched on\n");
1233		/* don't suspend or resume card normally */
1234		dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
1235
1236		radeon_resume_kms(dev, true, true);
1237
1238		dev->switch_power_state = DRM_SWITCH_POWER_ON;
1239		drm_kms_helper_poll_enable(dev);
1240	} else {
1241		pr_info("radeon: switched off\n");
1242		drm_kms_helper_poll_disable(dev);
1243		dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
1244		radeon_suspend_kms(dev, true, true, false);
1245		dev->switch_power_state = DRM_SWITCH_POWER_OFF;
1246	}
1247}
1248
1249/**
1250 * radeon_switcheroo_can_switch - see if switcheroo state can change
1251 *
1252 * @pdev: pci dev pointer
1253 *
1254 * Callback for the switcheroo driver.  Check of the switcheroo
1255 * state can be changed.
1256 * Returns true if the state can be changed, false if not.
1257 */
1258static bool radeon_switcheroo_can_switch(struct pci_dev *pdev)
1259{
1260	struct drm_device *dev = pci_get_drvdata(pdev);
1261
1262	/*
1263	 * FIXME: open_count is protected by drm_global_mutex but that would lead to
1264	 * locking inversion with the driver load path. And the access here is
1265	 * completely racy anyway. So don't bother with locking for now.
1266	 */
1267	return atomic_read(&dev->open_count) == 0;
1268}
1269
1270static const struct vga_switcheroo_client_ops radeon_switcheroo_ops = {
1271	.set_gpu_state = radeon_switcheroo_set_state,
1272	.reprobe = NULL,
1273	.can_switch = radeon_switcheroo_can_switch,
1274};
1275
1276/**
1277 * radeon_device_init - initialize the driver
1278 *
1279 * @rdev: radeon_device pointer
1280 * @pdev: drm dev pointer
1281 * @pdev: pci dev pointer
1282 * @flags: driver flags
1283 *
1284 * Initializes the driver info and hw (all asics).
1285 * Returns 0 for success or an error on failure.
1286 * Called at driver startup.
1287 */
1288int radeon_device_init(struct radeon_device *rdev,
1289		       struct drm_device *ddev,
1290		       struct pci_dev *pdev,
1291		       uint32_t flags)
1292{
1293	int r, i;
1294	int dma_bits;
1295	bool runtime = false;
1296
1297	rdev->shutdown = false;
1298	rdev->dev = &pdev->dev;
1299	rdev->ddev = ddev;
1300	rdev->pdev = pdev;
1301	rdev->flags = flags;
1302	rdev->family = flags & RADEON_FAMILY_MASK;
1303	rdev->is_atom_bios = false;
1304	rdev->usec_timeout = RADEON_MAX_USEC_TIMEOUT;
1305	rdev->mc.gtt_size = 512 * 1024 * 1024;
1306	rdev->accel_working = false;
1307	/* set up ring ids */
1308	for (i = 0; i < RADEON_NUM_RINGS; i++) {
1309		rdev->ring[i].idx = i;
1310	}
1311	rdev->fence_context = dma_fence_context_alloc(RADEON_NUM_RINGS);
1312
1313	DRM_INFO("initializing kernel modesetting (%s 0x%04X:0x%04X 0x%04X:0x%04X 0x%02X).\n",
1314		 radeon_family_name[rdev->family], pdev->vendor, pdev->device,
1315		 pdev->subsystem_vendor, pdev->subsystem_device, pdev->revision);
1316
1317	/* mutex initialization are all done here so we
1318	 * can recall function without having locking issues */
1319	mutex_init(&rdev->ring_lock);
1320	mutex_init(&rdev->dc_hw_i2c_mutex);
1321	atomic_set(&rdev->ih.lock, 0);
1322	mutex_init(&rdev->gem.mutex);
1323	mutex_init(&rdev->pm.mutex);
1324	mutex_init(&rdev->gpu_clock_mutex);
1325	mutex_init(&rdev->srbm_mutex);
1326	init_rwsem(&rdev->pm.mclk_lock);
1327	init_rwsem(&rdev->exclusive_lock);
1328	init_waitqueue_head(&rdev->irq.vblank_queue);
1329	r = radeon_gem_init(rdev);
1330	if (r)
1331		return r;
1332
1333	radeon_check_arguments(rdev);
1334	/* Adjust VM size here.
1335	 * Max GPUVM size for cayman+ is 40 bits.
1336	 */
1337	rdev->vm_manager.max_pfn = radeon_vm_size << 18;
1338
1339	/* Set asic functions */
1340	r = radeon_asic_init(rdev);
1341	if (r)
1342		return r;
1343
1344	/* all of the newer IGP chips have an internal gart
1345	 * However some rs4xx report as AGP, so remove that here.
1346	 */
1347	if ((rdev->family >= CHIP_RS400) &&
1348	    (rdev->flags & RADEON_IS_IGP)) {
1349		rdev->flags &= ~RADEON_IS_AGP;
1350	}
1351
1352	if (rdev->flags & RADEON_IS_AGP && radeon_agpmode == -1) {
1353		radeon_agp_disable(rdev);
1354	}
1355
1356	/* Set the internal MC address mask
1357	 * This is the max address of the GPU's
1358	 * internal address space.
1359	 */
1360	if (rdev->family >= CHIP_CAYMAN)
1361		rdev->mc.mc_mask = 0xffffffffffULL; /* 40 bit MC */
1362	else if (rdev->family >= CHIP_CEDAR)
1363		rdev->mc.mc_mask = 0xfffffffffULL; /* 36 bit MC */
1364	else
1365		rdev->mc.mc_mask = 0xffffffffULL; /* 32 bit MC */
1366
1367	/* set DMA mask.
1368	 * PCIE - can handle 40-bits.
1369	 * IGP - can handle 40-bits
1370	 * AGP - generally dma32 is safest
1371	 * PCI - dma32 for legacy pci gart, 40 bits on newer asics
1372	 */
1373	dma_bits = 40;
1374	if (rdev->flags & RADEON_IS_AGP)
1375		dma_bits = 32;
1376	if ((rdev->flags & RADEON_IS_PCI) &&
1377	    (rdev->family <= CHIP_RS740))
1378		dma_bits = 32;
1379#ifdef CONFIG_PPC64
1380	if (rdev->family == CHIP_CEDAR)
1381		dma_bits = 32;
1382#endif
1383
1384	r = dma_set_mask_and_coherent(&rdev->pdev->dev, DMA_BIT_MASK(dma_bits));
1385	if (r) {
1386		pr_warn("radeon: No suitable DMA available\n");
1387		return r;
1388	}
1389	rdev->need_swiotlb = drm_need_swiotlb(dma_bits);
1390
1391	/* Registers mapping */
1392	/* TODO: block userspace mapping of io register */
1393	spin_lock_init(&rdev->mmio_idx_lock);
1394	spin_lock_init(&rdev->smc_idx_lock);
1395	spin_lock_init(&rdev->pll_idx_lock);
1396	spin_lock_init(&rdev->mc_idx_lock);
1397	spin_lock_init(&rdev->pcie_idx_lock);
1398	spin_lock_init(&rdev->pciep_idx_lock);
1399	spin_lock_init(&rdev->pif_idx_lock);
1400	spin_lock_init(&rdev->cg_idx_lock);
1401	spin_lock_init(&rdev->uvd_idx_lock);
1402	spin_lock_init(&rdev->rcu_idx_lock);
1403	spin_lock_init(&rdev->didt_idx_lock);
1404	spin_lock_init(&rdev->end_idx_lock);
1405	if (rdev->family >= CHIP_BONAIRE) {
1406		rdev->rmmio_base = pci_resource_start(rdev->pdev, 5);
1407		rdev->rmmio_size = pci_resource_len(rdev->pdev, 5);
1408	} else {
1409		rdev->rmmio_base = pci_resource_start(rdev->pdev, 2);
1410		rdev->rmmio_size = pci_resource_len(rdev->pdev, 2);
1411	}
1412	rdev->rmmio = ioremap(rdev->rmmio_base, rdev->rmmio_size);
1413	if (rdev->rmmio == NULL)
1414		return -ENOMEM;
1415
1416	/* doorbell bar mapping */
1417	if (rdev->family >= CHIP_BONAIRE)
1418		radeon_doorbell_init(rdev);
1419
1420	/* io port mapping */
1421	for (i = 0; i < DEVICE_COUNT_RESOURCE; i++) {
1422		if (pci_resource_flags(rdev->pdev, i) & IORESOURCE_IO) {
1423			rdev->rio_mem_size = pci_resource_len(rdev->pdev, i);
1424			rdev->rio_mem = pci_iomap(rdev->pdev, i, rdev->rio_mem_size);
1425			break;
1426		}
1427	}
1428	if (rdev->rio_mem == NULL)
1429		DRM_ERROR("Unable to find PCI I/O BAR\n");
1430
1431	if (rdev->flags & RADEON_IS_PX)
1432		radeon_device_handle_px_quirks(rdev);
1433
1434	/* if we have > 1 VGA cards, then disable the radeon VGA resources */
1435	/* this will fail for cards that aren't VGA class devices, just
1436	 * ignore it */
1437	vga_client_register(rdev->pdev, rdev, NULL, radeon_vga_set_decode);
1438
1439	if (rdev->flags & RADEON_IS_PX)
1440		runtime = true;
1441	if (!pci_is_thunderbolt_attached(rdev->pdev))
1442		vga_switcheroo_register_client(rdev->pdev,
1443					       &radeon_switcheroo_ops, runtime);
1444	if (runtime)
1445		vga_switcheroo_init_domain_pm_ops(rdev->dev, &rdev->vga_pm_domain);
1446
1447	r = radeon_init(rdev);
1448	if (r)
1449		goto failed;
1450
1451	r = radeon_gem_debugfs_init(rdev);
1452	if (r) {
1453		DRM_ERROR("registering gem debugfs failed (%d).\n", r);
1454	}
1455
1456	r = radeon_mst_debugfs_init(rdev);
1457	if (r) {
1458		DRM_ERROR("registering mst debugfs failed (%d).\n", r);
1459	}
1460
1461	if (rdev->flags & RADEON_IS_AGP && !rdev->accel_working) {
1462		/* Acceleration not working on AGP card try again
1463		 * with fallback to PCI or PCIE GART
1464		 */
1465		radeon_asic_reset(rdev);
1466		radeon_fini(rdev);
1467		radeon_agp_disable(rdev);
1468		r = radeon_init(rdev);
1469		if (r)
1470			goto failed;
1471	}
1472
1473	r = radeon_ib_ring_tests(rdev);
1474	if (r)
1475		DRM_ERROR("ib ring test failed (%d).\n", r);
1476
1477	/*
1478	 * Turks/Thames GPU will freeze whole laptop if DPM is not restarted
1479	 * after the CP ring have chew one packet at least. Hence here we stop
1480	 * and restart DPM after the radeon_ib_ring_tests().
1481	 */
1482	if (rdev->pm.dpm_enabled &&
1483	    (rdev->pm.pm_method == PM_METHOD_DPM) &&
1484	    (rdev->family == CHIP_TURKS) &&
1485	    (rdev->flags & RADEON_IS_MOBILITY)) {
1486		mutex_lock(&rdev->pm.mutex);
1487		radeon_dpm_disable(rdev);
1488		radeon_dpm_enable(rdev);
1489		mutex_unlock(&rdev->pm.mutex);
1490	}
1491
1492	if ((radeon_testing & 1)) {
1493		if (rdev->accel_working)
1494			radeon_test_moves(rdev);
1495		else
1496			DRM_INFO("radeon: acceleration disabled, skipping move tests\n");
1497	}
1498	if ((radeon_testing & 2)) {
1499		if (rdev->accel_working)
1500			radeon_test_syncing(rdev);
1501		else
1502			DRM_INFO("radeon: acceleration disabled, skipping sync tests\n");
1503	}
1504	if (radeon_benchmarking) {
1505		if (rdev->accel_working)
1506			radeon_benchmark(rdev, radeon_benchmarking);
1507		else
1508			DRM_INFO("radeon: acceleration disabled, skipping benchmarks\n");
1509	}
1510	return 0;
1511
1512failed:
1513	/* balance pm_runtime_get_sync() in radeon_driver_unload_kms() */
1514	if (radeon_is_px(ddev))
1515		pm_runtime_put_noidle(ddev->dev);
1516	if (runtime)
1517		vga_switcheroo_fini_domain_pm_ops(rdev->dev);
1518	return r;
1519}
1520
1521/**
1522 * radeon_device_fini - tear down the driver
1523 *
1524 * @rdev: radeon_device pointer
1525 *
1526 * Tear down the driver info (all asics).
1527 * Called at driver shutdown.
1528 */
1529void radeon_device_fini(struct radeon_device *rdev)
1530{
1531	DRM_INFO("radeon: finishing device.\n");
1532	rdev->shutdown = true;
1533	/* evict vram memory */
1534	radeon_bo_evict_vram(rdev);
1535	radeon_fini(rdev);
1536	if (!pci_is_thunderbolt_attached(rdev->pdev))
1537		vga_switcheroo_unregister_client(rdev->pdev);
1538	if (rdev->flags & RADEON_IS_PX)
1539		vga_switcheroo_fini_domain_pm_ops(rdev->dev);
1540	vga_client_register(rdev->pdev, NULL, NULL, NULL);
1541	if (rdev->rio_mem)
1542		pci_iounmap(rdev->pdev, rdev->rio_mem);
1543	rdev->rio_mem = NULL;
1544	iounmap(rdev->rmmio);
1545	rdev->rmmio = NULL;
1546	if (rdev->family >= CHIP_BONAIRE)
1547		radeon_doorbell_fini(rdev);
1548}
1549
1550
1551/*
1552 * Suspend & resume.
1553 */
1554/**
1555 * radeon_suspend_kms - initiate device suspend
1556 *
1557 * @pdev: drm dev pointer
1558 * @state: suspend state
1559 *
1560 * Puts the hw in the suspend state (all asics).
1561 * Returns 0 for success or an error on failure.
1562 * Called at driver suspend.
1563 */
1564int radeon_suspend_kms(struct drm_device *dev, bool suspend,
1565		       bool fbcon, bool freeze)
1566{
1567	struct radeon_device *rdev;
1568	struct drm_crtc *crtc;
1569	struct drm_connector *connector;
1570	int i, r;
1571
1572	if (dev == NULL || dev->dev_private == NULL) {
1573		return -ENODEV;
1574	}
1575
1576	rdev = dev->dev_private;
1577
1578	if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
1579		return 0;
1580
1581	drm_kms_helper_poll_disable(dev);
1582
1583	drm_modeset_lock_all(dev);
1584	/* turn off display hw */
1585	list_for_each_entry(connector, &dev->mode_config.connector_list, head) {
1586		drm_helper_connector_dpms(connector, DRM_MODE_DPMS_OFF);
1587	}
1588	drm_modeset_unlock_all(dev);
1589
1590	/* unpin the front buffers and cursors */
1591	list_for_each_entry(crtc, &dev->mode_config.crtc_list, head) {
1592		struct radeon_crtc *radeon_crtc = to_radeon_crtc(crtc);
1593		struct drm_framebuffer *fb = crtc->primary->fb;
1594		struct radeon_bo *robj;
1595
1596		if (radeon_crtc->cursor_bo) {
1597			struct radeon_bo *robj = gem_to_radeon_bo(radeon_crtc->cursor_bo);
1598			r = radeon_bo_reserve(robj, false);
1599			if (r == 0) {
1600				radeon_bo_unpin(robj);
1601				radeon_bo_unreserve(robj);
1602			}
1603		}
1604
1605		if (fb == NULL || fb->obj[0] == NULL) {
1606			continue;
1607		}
1608		robj = gem_to_radeon_bo(fb->obj[0]);
1609		/* don't unpin kernel fb objects */
1610		if (!radeon_fbdev_robj_is_fb(rdev, robj)) {
1611			r = radeon_bo_reserve(robj, false);
1612			if (r == 0) {
1613				radeon_bo_unpin(robj);
1614				radeon_bo_unreserve(robj);
1615			}
1616		}
1617	}
1618	/* evict vram memory */
1619	radeon_bo_evict_vram(rdev);
1620
1621	/* wait for gpu to finish processing current batch */
1622	for (i = 0; i < RADEON_NUM_RINGS; i++) {
1623		r = radeon_fence_wait_empty(rdev, i);
1624		if (r) {
1625			/* delay GPU reset to resume */
1626			radeon_fence_driver_force_completion(rdev, i);
1627		} else {
1628			/* finish executing delayed work */
1629			flush_delayed_work(&rdev->fence_drv[i].lockup_work);
1630		}
1631	}
1632
1633	radeon_save_bios_scratch_regs(rdev);
1634
1635	radeon_suspend(rdev);
1636	radeon_hpd_fini(rdev);
1637	/* evict remaining vram memory
1638	 * This second call to evict vram is to evict the gart page table
1639	 * using the CPU.
1640	 */
1641	radeon_bo_evict_vram(rdev);
1642
1643	radeon_agp_suspend(rdev);
1644
1645	pci_save_state(dev->pdev);
1646	if (freeze && rdev->family >= CHIP_CEDAR && !(rdev->flags & RADEON_IS_IGP)) {
1647		rdev->asic->asic_reset(rdev, true);
1648		pci_restore_state(dev->pdev);
1649	} else if (suspend) {
1650		/* Shut down the device */
1651		pci_disable_device(dev->pdev);
1652		pci_set_power_state(dev->pdev, PCI_D3hot);
1653	}
1654
1655	if (fbcon) {
1656		console_lock();
1657		radeon_fbdev_set_suspend(rdev, 1);
1658		console_unlock();
1659	}
1660	return 0;
1661}
1662
1663/**
1664 * radeon_resume_kms - initiate device resume
1665 *
1666 * @pdev: drm dev pointer
1667 *
1668 * Bring the hw back to operating state (all asics).
1669 * Returns 0 for success or an error on failure.
1670 * Called at driver resume.
1671 */
1672int radeon_resume_kms(struct drm_device *dev, bool resume, bool fbcon)
1673{
1674	struct drm_connector *connector;
1675	struct radeon_device *rdev = dev->dev_private;
1676	struct drm_crtc *crtc;
1677	int r;
1678
1679	if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
1680		return 0;
1681
1682	if (fbcon) {
1683		console_lock();
1684	}
1685	if (resume) {
1686		pci_set_power_state(dev->pdev, PCI_D0);
1687		pci_restore_state(dev->pdev);
1688		if (pci_enable_device(dev->pdev)) {
1689			if (fbcon)
1690				console_unlock();
1691			return -1;
1692		}
1693	}
1694	/* resume AGP if in use */
1695	radeon_agp_resume(rdev);
1696	radeon_resume(rdev);
1697
1698	r = radeon_ib_ring_tests(rdev);
1699	if (r)
1700		DRM_ERROR("ib ring test failed (%d).\n", r);
1701
1702	if ((rdev->pm.pm_method == PM_METHOD_DPM) && rdev->pm.dpm_enabled) {
1703		/* do dpm late init */
1704		r = radeon_pm_late_init(rdev);
1705		if (r) {
1706			rdev->pm.dpm_enabled = false;
1707			DRM_ERROR("radeon_pm_late_init failed, disabling dpm\n");
1708		}
1709	} else {
1710		/* resume old pm late */
1711		radeon_pm_resume(rdev);
1712	}
1713
1714	radeon_restore_bios_scratch_regs(rdev);
1715
1716	/* pin cursors */
1717	list_for_each_entry(crtc, &dev->mode_config.crtc_list, head) {
1718		struct radeon_crtc *radeon_crtc = to_radeon_crtc(crtc);
1719
1720		if (radeon_crtc->cursor_bo) {
1721			struct radeon_bo *robj = gem_to_radeon_bo(radeon_crtc->cursor_bo);
1722			r = radeon_bo_reserve(robj, false);
1723			if (r == 0) {
1724				/* Only 27 bit offset for legacy cursor */
1725				r = radeon_bo_pin_restricted(robj,
1726							     RADEON_GEM_DOMAIN_VRAM,
1727							     ASIC_IS_AVIVO(rdev) ?
1728							     0 : 1 << 27,
1729							     &radeon_crtc->cursor_addr);
1730				if (r != 0)
1731					DRM_ERROR("Failed to pin cursor BO (%d)\n", r);
1732				radeon_bo_unreserve(robj);
1733			}
1734		}
1735	}
1736
1737	/* init dig PHYs, disp eng pll */
1738	if (rdev->is_atom_bios) {
1739		radeon_atom_encoder_init(rdev);
1740		radeon_atom_disp_eng_pll_init(rdev);
1741		/* turn on the BL */
1742		if (rdev->mode_info.bl_encoder) {
1743			u8 bl_level = radeon_get_backlight_level(rdev,
1744								 rdev->mode_info.bl_encoder);
1745			radeon_set_backlight_level(rdev, rdev->mode_info.bl_encoder,
1746						   bl_level);
1747		}
1748	}
1749	/* reset hpd state */
1750	radeon_hpd_init(rdev);
1751	/* blat the mode back in */
1752	if (fbcon) {
1753		drm_helper_resume_force_mode(dev);
1754		/* turn on display hw */
1755		drm_modeset_lock_all(dev);
1756		list_for_each_entry(connector, &dev->mode_config.connector_list, head) {
1757			drm_helper_connector_dpms(connector, DRM_MODE_DPMS_ON);
1758		}
1759		drm_modeset_unlock_all(dev);
1760	}
1761
1762	drm_kms_helper_poll_enable(dev);
1763
1764	/* set the power state here in case we are a PX system or headless */
1765	if ((rdev->pm.pm_method == PM_METHOD_DPM) && rdev->pm.dpm_enabled)
1766		radeon_pm_compute_clocks(rdev);
1767
1768	if (fbcon) {
1769		radeon_fbdev_set_suspend(rdev, 0);
1770		console_unlock();
1771	}
1772
1773	return 0;
1774}
1775
1776/**
1777 * radeon_gpu_reset - reset the asic
1778 *
1779 * @rdev: radeon device pointer
1780 *
1781 * Attempt the reset the GPU if it has hung (all asics).
1782 * Returns 0 for success or an error on failure.
1783 */
1784int radeon_gpu_reset(struct radeon_device *rdev)
1785{
1786	unsigned ring_sizes[RADEON_NUM_RINGS];
1787	uint32_t *ring_data[RADEON_NUM_RINGS];
1788
1789	bool saved = false;
1790
1791	int i, r;
1792	int resched;
1793
1794	down_write(&rdev->exclusive_lock);
1795
1796	if (!rdev->needs_reset) {
1797		up_write(&rdev->exclusive_lock);
1798		return 0;
1799	}
1800
1801	atomic_inc(&rdev->gpu_reset_counter);
1802
1803	radeon_save_bios_scratch_regs(rdev);
1804	/* block TTM */
1805	resched = ttm_bo_lock_delayed_workqueue(&rdev->mman.bdev);
1806	radeon_suspend(rdev);
1807	radeon_hpd_fini(rdev);
1808
1809	for (i = 0; i < RADEON_NUM_RINGS; ++i) {
1810		ring_sizes[i] = radeon_ring_backup(rdev, &rdev->ring[i],
1811						   &ring_data[i]);
1812		if (ring_sizes[i]) {
1813			saved = true;
1814			dev_info(rdev->dev, "Saved %d dwords of commands "
1815				 "on ring %d.\n", ring_sizes[i], i);
1816		}
1817	}
1818
1819	r = radeon_asic_reset(rdev);
1820	if (!r) {
1821		dev_info(rdev->dev, "GPU reset succeeded, trying to resume\n");
1822		radeon_resume(rdev);
1823	}
1824
1825	radeon_restore_bios_scratch_regs(rdev);
1826
1827	for (i = 0; i < RADEON_NUM_RINGS; ++i) {
1828		if (!r && ring_data[i]) {
1829			radeon_ring_restore(rdev, &rdev->ring[i],
1830					    ring_sizes[i], ring_data[i]);
1831		} else {
1832			radeon_fence_driver_force_completion(rdev, i);
1833			kfree(ring_data[i]);
1834		}
1835	}
1836
1837	if ((rdev->pm.pm_method == PM_METHOD_DPM) && rdev->pm.dpm_enabled) {
1838		/* do dpm late init */
1839		r = radeon_pm_late_init(rdev);
1840		if (r) {
1841			rdev->pm.dpm_enabled = false;
1842			DRM_ERROR("radeon_pm_late_init failed, disabling dpm\n");
1843		}
1844	} else {
1845		/* resume old pm late */
1846		radeon_pm_resume(rdev);
1847	}
1848
1849	/* init dig PHYs, disp eng pll */
1850	if (rdev->is_atom_bios) {
1851		radeon_atom_encoder_init(rdev);
1852		radeon_atom_disp_eng_pll_init(rdev);
1853		/* turn on the BL */
1854		if (rdev->mode_info.bl_encoder) {
1855			u8 bl_level = radeon_get_backlight_level(rdev,
1856								 rdev->mode_info.bl_encoder);
1857			radeon_set_backlight_level(rdev, rdev->mode_info.bl_encoder,
1858						   bl_level);
1859		}
1860	}
1861	/* reset hpd state */
1862	radeon_hpd_init(rdev);
1863
1864	ttm_bo_unlock_delayed_workqueue(&rdev->mman.bdev, resched);
1865
1866	rdev->in_reset = true;
1867	rdev->needs_reset = false;
1868
1869	downgrade_write(&rdev->exclusive_lock);
1870
1871	drm_helper_resume_force_mode(rdev->ddev);
1872
1873	/* set the power state here in case we are a PX system or headless */
1874	if ((rdev->pm.pm_method == PM_METHOD_DPM) && rdev->pm.dpm_enabled)
1875		radeon_pm_compute_clocks(rdev);
1876
1877	if (!r) {
1878		r = radeon_ib_ring_tests(rdev);
1879		if (r && saved)
1880			r = -EAGAIN;
1881	} else {
1882		/* bad news, how to tell it to userspace ? */
1883		dev_info(rdev->dev, "GPU reset failed\n");
1884	}
1885
1886	rdev->needs_reset = r == -EAGAIN;
1887	rdev->in_reset = false;
1888
1889	up_read(&rdev->exclusive_lock);
1890	return r;
1891}
1892
1893
1894/*
1895 * Debugfs
1896 */
1897int radeon_debugfs_add_files(struct radeon_device *rdev,
1898			     struct drm_info_list *files,
1899			     unsigned nfiles)
1900{
1901	unsigned i;
1902
1903	for (i = 0; i < rdev->debugfs_count; i++) {
1904		if (rdev->debugfs[i].files == files) {
1905			/* Already registered */
1906			return 0;
1907		}
1908	}
1909
1910	i = rdev->debugfs_count + 1;
1911	if (i > RADEON_DEBUGFS_MAX_COMPONENTS) {
1912		DRM_ERROR("Reached maximum number of debugfs components.\n");
1913		DRM_ERROR("Report so we increase "
1914			  "RADEON_DEBUGFS_MAX_COMPONENTS.\n");
1915		return -EINVAL;
1916	}
1917	rdev->debugfs[rdev->debugfs_count].files = files;
1918	rdev->debugfs[rdev->debugfs_count].num_files = nfiles;
1919	rdev->debugfs_count = i;
1920#if defined(CONFIG_DEBUG_FS)
1921	drm_debugfs_create_files(files, nfiles,
1922				 rdev->ddev->primary->debugfs_root,
1923				 rdev->ddev->primary);
1924#endif
1925	return 0;
1926}
1927