3ddae5ff41bbaad238ae2d508a041f807b58b10c
[cascardo/linux.git] / drivers / gpu / drm / amd / amdgpu / amdgpu_device.c
1 /*
2  * Copyright 2008 Advanced Micro Devices, Inc.
3  * Copyright 2008 Red Hat Inc.
4  * Copyright 2009 Jerome Glisse.
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a
7  * copy of this software and associated documentation files (the "Software"),
8  * to deal in the Software without restriction, including without limitation
9  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10  * and/or sell copies of the Software, and to permit persons to whom the
11  * Software is furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be included in
14  * all copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
19  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
20  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22  * OTHER DEALINGS IN THE SOFTWARE.
23  *
24  * Authors: Dave Airlie
25  *          Alex Deucher
26  *          Jerome Glisse
27  */
28 #include <linux/kthread.h>
29 #include <linux/console.h>
30 #include <linux/slab.h>
31 #include <linux/debugfs.h>
32 #include <drm/drmP.h>
33 #include <drm/drm_crtc_helper.h>
34 #include <drm/amdgpu_drm.h>
35 #include <linux/vgaarb.h>
36 #include <linux/vga_switcheroo.h>
37 #include <linux/efi.h>
38 #include "amdgpu.h"
39 #include "amdgpu_trace.h"
40 #include "amdgpu_i2c.h"
41 #include "atom.h"
42 #include "amdgpu_atombios.h"
43 #include "amd_pcie.h"
44 #ifdef CONFIG_DRM_AMDGPU_SI
45 #include "si.h"
46 #endif
47 #ifdef CONFIG_DRM_AMDGPU_CIK
48 #include "cik.h"
49 #endif
50 #include "vi.h"
51 #include "bif/bif_4_1_d.h"
52 #include <linux/pci.h>
53
54 static int amdgpu_debugfs_regs_init(struct amdgpu_device *adev);
55 static void amdgpu_debugfs_regs_cleanup(struct amdgpu_device *adev);
56
57 static const char *amdgpu_asic_name[] = {
58         "TAHITI",
59         "PITCAIRN",
60         "VERDE",
61         "OLAND",
62         "HAINAN",
63         "BONAIRE",
64         "KAVERI",
65         "KABINI",
66         "HAWAII",
67         "MULLINS",
68         "TOPAZ",
69         "TONGA",
70         "FIJI",
71         "CARRIZO",
72         "STONEY",
73         "POLARIS10",
74         "POLARIS11",
75         "LAST",
76 };
77
78 bool amdgpu_device_is_px(struct drm_device *dev)
79 {
80         struct amdgpu_device *adev = dev->dev_private;
81
82         if (adev->flags & AMD_IS_PX)
83                 return true;
84         return false;
85 }
86
87 /*
88  * MMIO register access helper functions.
89  */
90 uint32_t amdgpu_mm_rreg(struct amdgpu_device *adev, uint32_t reg,
91                         bool always_indirect)
92 {
93         uint32_t ret;
94
95         if ((reg * 4) < adev->rmmio_size && !always_indirect)
96                 ret = readl(((void __iomem *)adev->rmmio) + (reg * 4));
97         else {
98                 unsigned long flags;
99
100                 spin_lock_irqsave(&adev->mmio_idx_lock, flags);
101                 writel((reg * 4), ((void __iomem *)adev->rmmio) + (mmMM_INDEX * 4));
102                 ret = readl(((void __iomem *)adev->rmmio) + (mmMM_DATA * 4));
103                 spin_unlock_irqrestore(&adev->mmio_idx_lock, flags);
104         }
105         trace_amdgpu_mm_rreg(adev->pdev->device, reg, ret);
106         return ret;
107 }
108
109 void amdgpu_mm_wreg(struct amdgpu_device *adev, uint32_t reg, uint32_t v,
110                     bool always_indirect)
111 {
112         trace_amdgpu_mm_wreg(adev->pdev->device, reg, v);
113         
114         if ((reg * 4) < adev->rmmio_size && !always_indirect)
115                 writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
116         else {
117                 unsigned long flags;
118
119                 spin_lock_irqsave(&adev->mmio_idx_lock, flags);
120                 writel((reg * 4), ((void __iomem *)adev->rmmio) + (mmMM_INDEX * 4));
121                 writel(v, ((void __iomem *)adev->rmmio) + (mmMM_DATA * 4));
122                 spin_unlock_irqrestore(&adev->mmio_idx_lock, flags);
123         }
124 }
125
126 u32 amdgpu_io_rreg(struct amdgpu_device *adev, u32 reg)
127 {
128         if ((reg * 4) < adev->rio_mem_size)
129                 return ioread32(adev->rio_mem + (reg * 4));
130         else {
131                 iowrite32((reg * 4), adev->rio_mem + (mmMM_INDEX * 4));
132                 return ioread32(adev->rio_mem + (mmMM_DATA * 4));
133         }
134 }
135
136 void amdgpu_io_wreg(struct amdgpu_device *adev, u32 reg, u32 v)
137 {
138
139         if ((reg * 4) < adev->rio_mem_size)
140                 iowrite32(v, adev->rio_mem + (reg * 4));
141         else {
142                 iowrite32((reg * 4), adev->rio_mem + (mmMM_INDEX * 4));
143                 iowrite32(v, adev->rio_mem + (mmMM_DATA * 4));
144         }
145 }
146
147 /**
148  * amdgpu_mm_rdoorbell - read a doorbell dword
149  *
150  * @adev: amdgpu_device pointer
151  * @index: doorbell index
152  *
153  * Returns the value in the doorbell aperture at the
154  * requested doorbell index (CIK).
155  */
156 u32 amdgpu_mm_rdoorbell(struct amdgpu_device *adev, u32 index)
157 {
158         if (index < adev->doorbell.num_doorbells) {
159                 return readl(adev->doorbell.ptr + index);
160         } else {
161                 DRM_ERROR("reading beyond doorbell aperture: 0x%08x!\n", index);
162                 return 0;
163         }
164 }
165
166 /**
167  * amdgpu_mm_wdoorbell - write a doorbell dword
168  *
169  * @adev: amdgpu_device pointer
170  * @index: doorbell index
171  * @v: value to write
172  *
173  * Writes @v to the doorbell aperture at the
174  * requested doorbell index (CIK).
175  */
176 void amdgpu_mm_wdoorbell(struct amdgpu_device *adev, u32 index, u32 v)
177 {
178         if (index < adev->doorbell.num_doorbells) {
179                 writel(v, adev->doorbell.ptr + index);
180         } else {
181                 DRM_ERROR("writing beyond doorbell aperture: 0x%08x!\n", index);
182         }
183 }
184
185 /**
186  * amdgpu_invalid_rreg - dummy reg read function
187  *
188  * @adev: amdgpu device pointer
189  * @reg: offset of register
190  *
191  * Dummy register read function.  Used for register blocks
192  * that certain asics don't have (all asics).
193  * Returns the value in the register.
194  */
195 static uint32_t amdgpu_invalid_rreg(struct amdgpu_device *adev, uint32_t reg)
196 {
197         DRM_ERROR("Invalid callback to read register 0x%04X\n", reg);
198         BUG();
199         return 0;
200 }
201
202 /**
203  * amdgpu_invalid_wreg - dummy reg write function
204  *
205  * @adev: amdgpu device pointer
206  * @reg: offset of register
207  * @v: value to write to the register
208  *
209  * Dummy register read function.  Used for register blocks
210  * that certain asics don't have (all asics).
211  */
212 static void amdgpu_invalid_wreg(struct amdgpu_device *adev, uint32_t reg, uint32_t v)
213 {
214         DRM_ERROR("Invalid callback to write register 0x%04X with 0x%08X\n",
215                   reg, v);
216         BUG();
217 }
218
219 /**
220  * amdgpu_block_invalid_rreg - dummy reg read function
221  *
222  * @adev: amdgpu device pointer
223  * @block: offset of instance
224  * @reg: offset of register
225  *
226  * Dummy register read function.  Used for register blocks
227  * that certain asics don't have (all asics).
228  * Returns the value in the register.
229  */
230 static uint32_t amdgpu_block_invalid_rreg(struct amdgpu_device *adev,
231                                           uint32_t block, uint32_t reg)
232 {
233         DRM_ERROR("Invalid callback to read register 0x%04X in block 0x%04X\n",
234                   reg, block);
235         BUG();
236         return 0;
237 }
238
239 /**
240  * amdgpu_block_invalid_wreg - dummy reg write function
241  *
242  * @adev: amdgpu device pointer
243  * @block: offset of instance
244  * @reg: offset of register
245  * @v: value to write to the register
246  *
247  * Dummy register read function.  Used for register blocks
248  * that certain asics don't have (all asics).
249  */
250 static void amdgpu_block_invalid_wreg(struct amdgpu_device *adev,
251                                       uint32_t block,
252                                       uint32_t reg, uint32_t v)
253 {
254         DRM_ERROR("Invalid block callback to write register 0x%04X in block 0x%04X with 0x%08X\n",
255                   reg, block, v);
256         BUG();
257 }
258
259 static int amdgpu_vram_scratch_init(struct amdgpu_device *adev)
260 {
261         int r;
262
263         if (adev->vram_scratch.robj == NULL) {
264                 r = amdgpu_bo_create(adev, AMDGPU_GPU_PAGE_SIZE,
265                                      PAGE_SIZE, true, AMDGPU_GEM_DOMAIN_VRAM,
266                                      AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED,
267                                      NULL, NULL, &adev->vram_scratch.robj);
268                 if (r) {
269                         return r;
270                 }
271         }
272
273         r = amdgpu_bo_reserve(adev->vram_scratch.robj, false);
274         if (unlikely(r != 0))
275                 return r;
276         r = amdgpu_bo_pin(adev->vram_scratch.robj,
277                           AMDGPU_GEM_DOMAIN_VRAM, &adev->vram_scratch.gpu_addr);
278         if (r) {
279                 amdgpu_bo_unreserve(adev->vram_scratch.robj);
280                 return r;
281         }
282         r = amdgpu_bo_kmap(adev->vram_scratch.robj,
283                                 (void **)&adev->vram_scratch.ptr);
284         if (r)
285                 amdgpu_bo_unpin(adev->vram_scratch.robj);
286         amdgpu_bo_unreserve(adev->vram_scratch.robj);
287
288         return r;
289 }
290
291 static void amdgpu_vram_scratch_fini(struct amdgpu_device *adev)
292 {
293         int r;
294
295         if (adev->vram_scratch.robj == NULL) {
296                 return;
297         }
298         r = amdgpu_bo_reserve(adev->vram_scratch.robj, false);
299         if (likely(r == 0)) {
300                 amdgpu_bo_kunmap(adev->vram_scratch.robj);
301                 amdgpu_bo_unpin(adev->vram_scratch.robj);
302                 amdgpu_bo_unreserve(adev->vram_scratch.robj);
303         }
304         amdgpu_bo_unref(&adev->vram_scratch.robj);
305 }
306
307 /**
308  * amdgpu_program_register_sequence - program an array of registers.
309  *
310  * @adev: amdgpu_device pointer
311  * @registers: pointer to the register array
312  * @array_size: size of the register array
313  *
314  * Programs an array or registers with and and or masks.
315  * This is a helper for setting golden registers.
316  */
317 void amdgpu_program_register_sequence(struct amdgpu_device *adev,
318                                       const u32 *registers,
319                                       const u32 array_size)
320 {
321         u32 tmp, reg, and_mask, or_mask;
322         int i;
323
324         if (array_size % 3)
325                 return;
326
327         for (i = 0; i < array_size; i +=3) {
328                 reg = registers[i + 0];
329                 and_mask = registers[i + 1];
330                 or_mask = registers[i + 2];
331
332                 if (and_mask == 0xffffffff) {
333                         tmp = or_mask;
334                 } else {
335                         tmp = RREG32(reg);
336                         tmp &= ~and_mask;
337                         tmp |= or_mask;
338                 }
339                 WREG32(reg, tmp);
340         }
341 }
342
343 void amdgpu_pci_config_reset(struct amdgpu_device *adev)
344 {
345         pci_write_config_dword(adev->pdev, 0x7c, AMDGPU_ASIC_RESET_DATA);
346 }
347
348 /*
349  * GPU doorbell aperture helpers function.
350  */
351 /**
352  * amdgpu_doorbell_init - Init doorbell driver information.
353  *
354  * @adev: amdgpu_device pointer
355  *
356  * Init doorbell driver information (CIK)
357  * Returns 0 on success, error on failure.
358  */
359 static int amdgpu_doorbell_init(struct amdgpu_device *adev)
360 {
361         /* doorbell bar mapping */
362         adev->doorbell.base = pci_resource_start(adev->pdev, 2);
363         adev->doorbell.size = pci_resource_len(adev->pdev, 2);
364
365         adev->doorbell.num_doorbells = min_t(u32, adev->doorbell.size / sizeof(u32),
366                                              AMDGPU_DOORBELL_MAX_ASSIGNMENT+1);
367         if (adev->doorbell.num_doorbells == 0)
368                 return -EINVAL;
369
370         adev->doorbell.ptr = ioremap(adev->doorbell.base, adev->doorbell.num_doorbells * sizeof(u32));
371         if (adev->doorbell.ptr == NULL) {
372                 return -ENOMEM;
373         }
374         DRM_INFO("doorbell mmio base: 0x%08X\n", (uint32_t)adev->doorbell.base);
375         DRM_INFO("doorbell mmio size: %u\n", (unsigned)adev->doorbell.size);
376
377         return 0;
378 }
379
380 /**
381  * amdgpu_doorbell_fini - Tear down doorbell driver information.
382  *
383  * @adev: amdgpu_device pointer
384  *
385  * Tear down doorbell driver information (CIK)
386  */
387 static void amdgpu_doorbell_fini(struct amdgpu_device *adev)
388 {
389         iounmap(adev->doorbell.ptr);
390         adev->doorbell.ptr = NULL;
391 }
392
393 /**
394  * amdgpu_doorbell_get_kfd_info - Report doorbell configuration required to
395  *                                setup amdkfd
396  *
397  * @adev: amdgpu_device pointer
398  * @aperture_base: output returning doorbell aperture base physical address
399  * @aperture_size: output returning doorbell aperture size in bytes
400  * @start_offset: output returning # of doorbell bytes reserved for amdgpu.
401  *
402  * amdgpu and amdkfd share the doorbell aperture. amdgpu sets it up,
403  * takes doorbells required for its own rings and reports the setup to amdkfd.
404  * amdgpu reserved doorbells are at the start of the doorbell aperture.
405  */
406 void amdgpu_doorbell_get_kfd_info(struct amdgpu_device *adev,
407                                 phys_addr_t *aperture_base,
408                                 size_t *aperture_size,
409                                 size_t *start_offset)
410 {
411         /*
412          * The first num_doorbells are used by amdgpu.
413          * amdkfd takes whatever's left in the aperture.
414          */
415         if (adev->doorbell.size > adev->doorbell.num_doorbells * sizeof(u32)) {
416                 *aperture_base = adev->doorbell.base;
417                 *aperture_size = adev->doorbell.size;
418                 *start_offset = adev->doorbell.num_doorbells * sizeof(u32);
419         } else {
420                 *aperture_base = 0;
421                 *aperture_size = 0;
422                 *start_offset = 0;
423         }
424 }
425
426 /*
427  * amdgpu_wb_*()
428  * Writeback is the the method by which the the GPU updates special pages
429  * in memory with the status of certain GPU events (fences, ring pointers,
430  * etc.).
431  */
432
433 /**
434  * amdgpu_wb_fini - Disable Writeback and free memory
435  *
436  * @adev: amdgpu_device pointer
437  *
438  * Disables Writeback and frees the Writeback memory (all asics).
439  * Used at driver shutdown.
440  */
441 static void amdgpu_wb_fini(struct amdgpu_device *adev)
442 {
443         if (adev->wb.wb_obj) {
444                 if (!amdgpu_bo_reserve(adev->wb.wb_obj, false)) {
445                         amdgpu_bo_kunmap(adev->wb.wb_obj);
446                         amdgpu_bo_unpin(adev->wb.wb_obj);
447                         amdgpu_bo_unreserve(adev->wb.wb_obj);
448                 }
449                 amdgpu_bo_unref(&adev->wb.wb_obj);
450                 adev->wb.wb = NULL;
451                 adev->wb.wb_obj = NULL;
452         }
453 }
454
455 /**
456  * amdgpu_wb_init- Init Writeback driver info and allocate memory
457  *
458  * @adev: amdgpu_device pointer
459  *
460  * Disables Writeback and frees the Writeback memory (all asics).
461  * Used at driver startup.
462  * Returns 0 on success or an -error on failure.
463  */
464 static int amdgpu_wb_init(struct amdgpu_device *adev)
465 {
466         int r;
467
468         if (adev->wb.wb_obj == NULL) {
469                 r = amdgpu_bo_create(adev, AMDGPU_MAX_WB * 4, PAGE_SIZE, true,
470                                      AMDGPU_GEM_DOMAIN_GTT, 0,  NULL, NULL,
471                                      &adev->wb.wb_obj);
472                 if (r) {
473                         dev_warn(adev->dev, "(%d) create WB bo failed\n", r);
474                         return r;
475                 }
476                 r = amdgpu_bo_reserve(adev->wb.wb_obj, false);
477                 if (unlikely(r != 0)) {
478                         amdgpu_wb_fini(adev);
479                         return r;
480                 }
481                 r = amdgpu_bo_pin(adev->wb.wb_obj, AMDGPU_GEM_DOMAIN_GTT,
482                                 &adev->wb.gpu_addr);
483                 if (r) {
484                         amdgpu_bo_unreserve(adev->wb.wb_obj);
485                         dev_warn(adev->dev, "(%d) pin WB bo failed\n", r);
486                         amdgpu_wb_fini(adev);
487                         return r;
488                 }
489                 r = amdgpu_bo_kmap(adev->wb.wb_obj, (void **)&adev->wb.wb);
490                 amdgpu_bo_unreserve(adev->wb.wb_obj);
491                 if (r) {
492                         dev_warn(adev->dev, "(%d) map WB bo failed\n", r);
493                         amdgpu_wb_fini(adev);
494                         return r;
495                 }
496
497                 adev->wb.num_wb = AMDGPU_MAX_WB;
498                 memset(&adev->wb.used, 0, sizeof(adev->wb.used));
499
500                 /* clear wb memory */
501                 memset((char *)adev->wb.wb, 0, AMDGPU_GPU_PAGE_SIZE);
502         }
503
504         return 0;
505 }
506
507 /**
508  * amdgpu_wb_get - Allocate a wb entry
509  *
510  * @adev: amdgpu_device pointer
511  * @wb: wb index
512  *
513  * Allocate a wb slot for use by the driver (all asics).
514  * Returns 0 on success or -EINVAL on failure.
515  */
516 int amdgpu_wb_get(struct amdgpu_device *adev, u32 *wb)
517 {
518         unsigned long offset = find_first_zero_bit(adev->wb.used, adev->wb.num_wb);
519         if (offset < adev->wb.num_wb) {
520                 __set_bit(offset, adev->wb.used);
521                 *wb = offset;
522                 return 0;
523         } else {
524                 return -EINVAL;
525         }
526 }
527
528 /**
529  * amdgpu_wb_free - Free a wb entry
530  *
531  * @adev: amdgpu_device pointer
532  * @wb: wb index
533  *
534  * Free a wb slot allocated for use by the driver (all asics)
535  */
536 void amdgpu_wb_free(struct amdgpu_device *adev, u32 wb)
537 {
538         if (wb < adev->wb.num_wb)
539                 __clear_bit(wb, adev->wb.used);
540 }
541
542 /**
543  * amdgpu_vram_location - try to find VRAM location
544  * @adev: amdgpu device structure holding all necessary informations
545  * @mc: memory controller structure holding memory informations
546  * @base: base address at which to put VRAM
547  *
548  * Function will place try to place VRAM at base address provided
549  * as parameter (which is so far either PCI aperture address or
550  * for IGP TOM base address).
551  *
552  * If there is not enough space to fit the unvisible VRAM in the 32bits
553  * address space then we limit the VRAM size to the aperture.
554  *
555  * Note: We don't explicitly enforce VRAM start to be aligned on VRAM size,
556  * this shouldn't be a problem as we are using the PCI aperture as a reference.
557  * Otherwise this would be needed for rv280, all r3xx, and all r4xx, but
558  * not IGP.
559  *
560  * Note: we use mc_vram_size as on some board we need to program the mc to
561  * cover the whole aperture even if VRAM size is inferior to aperture size
562  * Novell bug 204882 + along with lots of ubuntu ones
563  *
564  * Note: when limiting vram it's safe to overwritte real_vram_size because
565  * we are not in case where real_vram_size is inferior to mc_vram_size (ie
566  * note afected by bogus hw of Novell bug 204882 + along with lots of ubuntu
567  * ones)
568  *
569  * Note: IGP TOM addr should be the same as the aperture addr, we don't
570  * explicitly check for that thought.
571  *
572  * FIXME: when reducing VRAM size align new size on power of 2.
573  */
574 void amdgpu_vram_location(struct amdgpu_device *adev, struct amdgpu_mc *mc, u64 base)
575 {
576         uint64_t limit = (uint64_t)amdgpu_vram_limit << 20;
577
578         mc->vram_start = base;
579         if (mc->mc_vram_size > (adev->mc.mc_mask - base + 1)) {
580                 dev_warn(adev->dev, "limiting VRAM to PCI aperture size\n");
581                 mc->real_vram_size = mc->aper_size;
582                 mc->mc_vram_size = mc->aper_size;
583         }
584         mc->vram_end = mc->vram_start + mc->mc_vram_size - 1;
585         if (limit && limit < mc->real_vram_size)
586                 mc->real_vram_size = limit;
587         dev_info(adev->dev, "VRAM: %lluM 0x%016llX - 0x%016llX (%lluM used)\n",
588                         mc->mc_vram_size >> 20, mc->vram_start,
589                         mc->vram_end, mc->real_vram_size >> 20);
590 }
591
592 /**
593  * amdgpu_gtt_location - try to find GTT location
594  * @adev: amdgpu device structure holding all necessary informations
595  * @mc: memory controller structure holding memory informations
596  *
597  * Function will place try to place GTT before or after VRAM.
598  *
599  * If GTT size is bigger than space left then we ajust GTT size.
600  * Thus function will never fails.
601  *
602  * FIXME: when reducing GTT size align new size on power of 2.
603  */
604 void amdgpu_gtt_location(struct amdgpu_device *adev, struct amdgpu_mc *mc)
605 {
606         u64 size_af, size_bf;
607
608         size_af = ((adev->mc.mc_mask - mc->vram_end) + mc->gtt_base_align) & ~mc->gtt_base_align;
609         size_bf = mc->vram_start & ~mc->gtt_base_align;
610         if (size_bf > size_af) {
611                 if (mc->gtt_size > size_bf) {
612                         dev_warn(adev->dev, "limiting GTT\n");
613                         mc->gtt_size = size_bf;
614                 }
615                 mc->gtt_start = (mc->vram_start & ~mc->gtt_base_align) - mc->gtt_size;
616         } else {
617                 if (mc->gtt_size > size_af) {
618                         dev_warn(adev->dev, "limiting GTT\n");
619                         mc->gtt_size = size_af;
620                 }
621                 mc->gtt_start = (mc->vram_end + 1 + mc->gtt_base_align) & ~mc->gtt_base_align;
622         }
623         mc->gtt_end = mc->gtt_start + mc->gtt_size - 1;
624         dev_info(adev->dev, "GTT: %lluM 0x%016llX - 0x%016llX\n",
625                         mc->gtt_size >> 20, mc->gtt_start, mc->gtt_end);
626 }
627
628 /*
629  * GPU helpers function.
630  */
631 /**
632  * amdgpu_card_posted - check if the hw has already been initialized
633  *
634  * @adev: amdgpu_device pointer
635  *
636  * Check if the asic has been initialized (all asics).
637  * Used at driver startup.
638  * Returns true if initialized or false if not.
639  */
640 bool amdgpu_card_posted(struct amdgpu_device *adev)
641 {
642         uint32_t reg;
643
644         /* then check MEM_SIZE, in case the crtcs are off */
645         reg = RREG32(mmCONFIG_MEMSIZE);
646
647         if (reg)
648                 return true;
649
650         return false;
651
652 }
653
654 /**
655  * amdgpu_dummy_page_init - init dummy page used by the driver
656  *
657  * @adev: amdgpu_device pointer
658  *
659  * Allocate the dummy page used by the driver (all asics).
660  * This dummy page is used by the driver as a filler for gart entries
661  * when pages are taken out of the GART
662  * Returns 0 on sucess, -ENOMEM on failure.
663  */
664 int amdgpu_dummy_page_init(struct amdgpu_device *adev)
665 {
666         if (adev->dummy_page.page)
667                 return 0;
668         adev->dummy_page.page = alloc_page(GFP_DMA32 | GFP_KERNEL | __GFP_ZERO);
669         if (adev->dummy_page.page == NULL)
670                 return -ENOMEM;
671         adev->dummy_page.addr = pci_map_page(adev->pdev, adev->dummy_page.page,
672                                         0, PAGE_SIZE, PCI_DMA_BIDIRECTIONAL);
673         if (pci_dma_mapping_error(adev->pdev, adev->dummy_page.addr)) {
674                 dev_err(&adev->pdev->dev, "Failed to DMA MAP the dummy page\n");
675                 __free_page(adev->dummy_page.page);
676                 adev->dummy_page.page = NULL;
677                 return -ENOMEM;
678         }
679         return 0;
680 }
681
682 /**
683  * amdgpu_dummy_page_fini - free dummy page used by the driver
684  *
685  * @adev: amdgpu_device pointer
686  *
687  * Frees the dummy page used by the driver (all asics).
688  */
689 void amdgpu_dummy_page_fini(struct amdgpu_device *adev)
690 {
691         if (adev->dummy_page.page == NULL)
692                 return;
693         pci_unmap_page(adev->pdev, adev->dummy_page.addr,
694                         PAGE_SIZE, PCI_DMA_BIDIRECTIONAL);
695         __free_page(adev->dummy_page.page);
696         adev->dummy_page.page = NULL;
697 }
698
699
700 /* ATOM accessor methods */
701 /*
702  * ATOM is an interpreted byte code stored in tables in the vbios.  The
703  * driver registers callbacks to access registers and the interpreter
704  * in the driver parses the tables and executes then to program specific
705  * actions (set display modes, asic init, etc.).  See amdgpu_atombios.c,
706  * atombios.h, and atom.c
707  */
708
709 /**
710  * cail_pll_read - read PLL register
711  *
712  * @info: atom card_info pointer
713  * @reg: PLL register offset
714  *
715  * Provides a PLL register accessor for the atom interpreter (r4xx+).
716  * Returns the value of the PLL register.
717  */
718 static uint32_t cail_pll_read(struct card_info *info, uint32_t reg)
719 {
720         return 0;
721 }
722
723 /**
724  * cail_pll_write - write PLL register
725  *
726  * @info: atom card_info pointer
727  * @reg: PLL register offset
728  * @val: value to write to the pll register
729  *
730  * Provides a PLL register accessor for the atom interpreter (r4xx+).
731  */
732 static void cail_pll_write(struct card_info *info, uint32_t reg, uint32_t val)
733 {
734
735 }
736
737 /**
738  * cail_mc_read - read MC (Memory Controller) register
739  *
740  * @info: atom card_info pointer
741  * @reg: MC register offset
742  *
743  * Provides an MC register accessor for the atom interpreter (r4xx+).
744  * Returns the value of the MC register.
745  */
746 static uint32_t cail_mc_read(struct card_info *info, uint32_t reg)
747 {
748         return 0;
749 }
750
751 /**
752  * cail_mc_write - write MC (Memory Controller) register
753  *
754  * @info: atom card_info pointer
755  * @reg: MC register offset
756  * @val: value to write to the pll register
757  *
758  * Provides a MC register accessor for the atom interpreter (r4xx+).
759  */
760 static void cail_mc_write(struct card_info *info, uint32_t reg, uint32_t val)
761 {
762
763 }
764
765 /**
766  * cail_reg_write - write MMIO register
767  *
768  * @info: atom card_info pointer
769  * @reg: MMIO register offset
770  * @val: value to write to the pll register
771  *
772  * Provides a MMIO register accessor for the atom interpreter (r4xx+).
773  */
774 static void cail_reg_write(struct card_info *info, uint32_t reg, uint32_t val)
775 {
776         struct amdgpu_device *adev = info->dev->dev_private;
777
778         WREG32(reg, val);
779 }
780
781 /**
782  * cail_reg_read - read MMIO register
783  *
784  * @info: atom card_info pointer
785  * @reg: MMIO register offset
786  *
787  * Provides an MMIO register accessor for the atom interpreter (r4xx+).
788  * Returns the value of the MMIO register.
789  */
790 static uint32_t cail_reg_read(struct card_info *info, uint32_t reg)
791 {
792         struct amdgpu_device *adev = info->dev->dev_private;
793         uint32_t r;
794
795         r = RREG32(reg);
796         return r;
797 }
798
799 /**
800  * cail_ioreg_write - write IO register
801  *
802  * @info: atom card_info pointer
803  * @reg: IO register offset
804  * @val: value to write to the pll register
805  *
806  * Provides a IO register accessor for the atom interpreter (r4xx+).
807  */
808 static void cail_ioreg_write(struct card_info *info, uint32_t reg, uint32_t val)
809 {
810         struct amdgpu_device *adev = info->dev->dev_private;
811
812         WREG32_IO(reg, val);
813 }
814
815 /**
816  * cail_ioreg_read - read IO register
817  *
818  * @info: atom card_info pointer
819  * @reg: IO register offset
820  *
821  * Provides an IO register accessor for the atom interpreter (r4xx+).
822  * Returns the value of the IO register.
823  */
824 static uint32_t cail_ioreg_read(struct card_info *info, uint32_t reg)
825 {
826         struct amdgpu_device *adev = info->dev->dev_private;
827         uint32_t r;
828
829         r = RREG32_IO(reg);
830         return r;
831 }
832
833 /**
834  * amdgpu_atombios_fini - free the driver info and callbacks for atombios
835  *
836  * @adev: amdgpu_device pointer
837  *
838  * Frees the driver info and register access callbacks for the ATOM
839  * interpreter (r4xx+).
840  * Called at driver shutdown.
841  */
842 static void amdgpu_atombios_fini(struct amdgpu_device *adev)
843 {
844         if (adev->mode_info.atom_context) {
845                 kfree(adev->mode_info.atom_context->scratch);
846                 kfree(adev->mode_info.atom_context->iio);
847         }
848         kfree(adev->mode_info.atom_context);
849         adev->mode_info.atom_context = NULL;
850         kfree(adev->mode_info.atom_card_info);
851         adev->mode_info.atom_card_info = NULL;
852 }
853
854 /**
855  * amdgpu_atombios_init - init the driver info and callbacks for atombios
856  *
857  * @adev: amdgpu_device pointer
858  *
859  * Initializes the driver info and register access callbacks for the
860  * ATOM interpreter (r4xx+).
861  * Returns 0 on sucess, -ENOMEM on failure.
862  * Called at driver startup.
863  */
864 static int amdgpu_atombios_init(struct amdgpu_device *adev)
865 {
866         struct card_info *atom_card_info =
867             kzalloc(sizeof(struct card_info), GFP_KERNEL);
868
869         if (!atom_card_info)
870                 return -ENOMEM;
871
872         adev->mode_info.atom_card_info = atom_card_info;
873         atom_card_info->dev = adev->ddev;
874         atom_card_info->reg_read = cail_reg_read;
875         atom_card_info->reg_write = cail_reg_write;
876         /* needed for iio ops */
877         if (adev->rio_mem) {
878                 atom_card_info->ioreg_read = cail_ioreg_read;
879                 atom_card_info->ioreg_write = cail_ioreg_write;
880         } else {
881                 DRM_ERROR("Unable to find PCI I/O BAR; using MMIO for ATOM IIO\n");
882                 atom_card_info->ioreg_read = cail_reg_read;
883                 atom_card_info->ioreg_write = cail_reg_write;
884         }
885         atom_card_info->mc_read = cail_mc_read;
886         atom_card_info->mc_write = cail_mc_write;
887         atom_card_info->pll_read = cail_pll_read;
888         atom_card_info->pll_write = cail_pll_write;
889
890         adev->mode_info.atom_context = amdgpu_atom_parse(atom_card_info, adev->bios);
891         if (!adev->mode_info.atom_context) {
892                 amdgpu_atombios_fini(adev);
893                 return -ENOMEM;
894         }
895
896         mutex_init(&adev->mode_info.atom_context->mutex);
897         amdgpu_atombios_scratch_regs_init(adev);
898         amdgpu_atom_allocate_fb_scratch(adev->mode_info.atom_context);
899         return 0;
900 }
901
902 /* if we get transitioned to only one device, take VGA back */
903 /**
904  * amdgpu_vga_set_decode - enable/disable vga decode
905  *
906  * @cookie: amdgpu_device pointer
907  * @state: enable/disable vga decode
908  *
909  * Enable/disable vga decode (all asics).
910  * Returns VGA resource flags.
911  */
912 static unsigned int amdgpu_vga_set_decode(void *cookie, bool state)
913 {
914         struct amdgpu_device *adev = cookie;
915         amdgpu_asic_set_vga_state(adev, state);
916         if (state)
917                 return VGA_RSRC_LEGACY_IO | VGA_RSRC_LEGACY_MEM |
918                        VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
919         else
920                 return VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
921 }
922
923 /**
924  * amdgpu_check_pot_argument - check that argument is a power of two
925  *
926  * @arg: value to check
927  *
928  * Validates that a certain argument is a power of two (all asics).
929  * Returns true if argument is valid.
930  */
931 static bool amdgpu_check_pot_argument(int arg)
932 {
933         return (arg & (arg - 1)) == 0;
934 }
935
936 /**
937  * amdgpu_check_arguments - validate module params
938  *
939  * @adev: amdgpu_device pointer
940  *
941  * Validates certain module parameters and updates
942  * the associated values used by the driver (all asics).
943  */
944 static void amdgpu_check_arguments(struct amdgpu_device *adev)
945 {
946         if (amdgpu_sched_jobs < 4) {
947                 dev_warn(adev->dev, "sched jobs (%d) must be at least 4\n",
948                          amdgpu_sched_jobs);
949                 amdgpu_sched_jobs = 4;
950         } else if (!amdgpu_check_pot_argument(amdgpu_sched_jobs)){
951                 dev_warn(adev->dev, "sched jobs (%d) must be a power of 2\n",
952                          amdgpu_sched_jobs);
953                 amdgpu_sched_jobs = roundup_pow_of_two(amdgpu_sched_jobs);
954         }
955
956         if (amdgpu_gart_size != -1) {
957                 /* gtt size must be greater or equal to 32M */
958                 if (amdgpu_gart_size < 32) {
959                         dev_warn(adev->dev, "gart size (%d) too small\n",
960                                  amdgpu_gart_size);
961                         amdgpu_gart_size = -1;
962                 }
963         }
964
965         if (!amdgpu_check_pot_argument(amdgpu_vm_size)) {
966                 dev_warn(adev->dev, "VM size (%d) must be a power of 2\n",
967                          amdgpu_vm_size);
968                 amdgpu_vm_size = 8;
969         }
970
971         if (amdgpu_vm_size < 1) {
972                 dev_warn(adev->dev, "VM size (%d) too small, min is 1GB\n",
973                          amdgpu_vm_size);
974                 amdgpu_vm_size = 8;
975         }
976
977         /*
978          * Max GPUVM size for Cayman, SI and CI are 40 bits.
979          */
980         if (amdgpu_vm_size > 1024) {
981                 dev_warn(adev->dev, "VM size (%d) too large, max is 1TB\n",
982                          amdgpu_vm_size);
983                 amdgpu_vm_size = 8;
984         }
985
986         /* defines number of bits in page table versus page directory,
987          * a page is 4KB so we have 12 bits offset, minimum 9 bits in the
988          * page table and the remaining bits are in the page directory */
989         if (amdgpu_vm_block_size == -1) {
990
991                 /* Total bits covered by PD + PTs */
992                 unsigned bits = ilog2(amdgpu_vm_size) + 18;
993
994                 /* Make sure the PD is 4K in size up to 8GB address space.
995                    Above that split equal between PD and PTs */
996                 if (amdgpu_vm_size <= 8)
997                         amdgpu_vm_block_size = bits - 9;
998                 else
999                         amdgpu_vm_block_size = (bits + 3) / 2;
1000
1001         } else if (amdgpu_vm_block_size < 9) {
1002                 dev_warn(adev->dev, "VM page table size (%d) too small\n",
1003                          amdgpu_vm_block_size);
1004                 amdgpu_vm_block_size = 9;
1005         }
1006
1007         if (amdgpu_vm_block_size > 24 ||
1008             (amdgpu_vm_size * 1024) < (1ull << amdgpu_vm_block_size)) {
1009                 dev_warn(adev->dev, "VM page table size (%d) too large\n",
1010                          amdgpu_vm_block_size);
1011                 amdgpu_vm_block_size = 9;
1012         }
1013 }
1014
1015 /**
1016  * amdgpu_switcheroo_set_state - set switcheroo state
1017  *
1018  * @pdev: pci dev pointer
1019  * @state: vga_switcheroo state
1020  *
1021  * Callback for the switcheroo driver.  Suspends or resumes the
1022  * the asics before or after it is powered up using ACPI methods.
1023  */
1024 static void amdgpu_switcheroo_set_state(struct pci_dev *pdev, enum vga_switcheroo_state state)
1025 {
1026         struct drm_device *dev = pci_get_drvdata(pdev);
1027
1028         if (amdgpu_device_is_px(dev) && state == VGA_SWITCHEROO_OFF)
1029                 return;
1030
1031         if (state == VGA_SWITCHEROO_ON) {
1032                 unsigned d3_delay = dev->pdev->d3_delay;
1033
1034                 printk(KERN_INFO "amdgpu: switched on\n");
1035                 /* don't suspend or resume card normally */
1036                 dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
1037
1038                 amdgpu_device_resume(dev, true, true);
1039
1040                 dev->pdev->d3_delay = d3_delay;
1041
1042                 dev->switch_power_state = DRM_SWITCH_POWER_ON;
1043                 drm_kms_helper_poll_enable(dev);
1044         } else {
1045                 printk(KERN_INFO "amdgpu: switched off\n");
1046                 drm_kms_helper_poll_disable(dev);
1047                 dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
1048                 amdgpu_device_suspend(dev, true, true);
1049                 dev->switch_power_state = DRM_SWITCH_POWER_OFF;
1050         }
1051 }
1052
1053 /**
1054  * amdgpu_switcheroo_can_switch - see if switcheroo state can change
1055  *
1056  * @pdev: pci dev pointer
1057  *
1058  * Callback for the switcheroo driver.  Check of the switcheroo
1059  * state can be changed.
1060  * Returns true if the state can be changed, false if not.
1061  */
1062 static bool amdgpu_switcheroo_can_switch(struct pci_dev *pdev)
1063 {
1064         struct drm_device *dev = pci_get_drvdata(pdev);
1065
1066         /*
1067         * FIXME: open_count is protected by drm_global_mutex but that would lead to
1068         * locking inversion with the driver load path. And the access here is
1069         * completely racy anyway. So don't bother with locking for now.
1070         */
1071         return dev->open_count == 0;
1072 }
1073
1074 static const struct vga_switcheroo_client_ops amdgpu_switcheroo_ops = {
1075         .set_gpu_state = amdgpu_switcheroo_set_state,
1076         .reprobe = NULL,
1077         .can_switch = amdgpu_switcheroo_can_switch,
1078 };
1079
1080 int amdgpu_set_clockgating_state(struct amdgpu_device *adev,
1081                                   enum amd_ip_block_type block_type,
1082                                   enum amd_clockgating_state state)
1083 {
1084         int i, r = 0;
1085
1086         for (i = 0; i < adev->num_ip_blocks; i++) {
1087                 if (!adev->ip_block_status[i].valid)
1088                         continue;
1089                 if (adev->ip_blocks[i].type == block_type) {
1090                         r = adev->ip_blocks[i].funcs->set_clockgating_state((void *)adev,
1091                                                                             state);
1092                         if (r)
1093                                 return r;
1094                         break;
1095                 }
1096         }
1097         return r;
1098 }
1099
1100 int amdgpu_set_powergating_state(struct amdgpu_device *adev,
1101                                   enum amd_ip_block_type block_type,
1102                                   enum amd_powergating_state state)
1103 {
1104         int i, r = 0;
1105
1106         for (i = 0; i < adev->num_ip_blocks; i++) {
1107                 if (!adev->ip_block_status[i].valid)
1108                         continue;
1109                 if (adev->ip_blocks[i].type == block_type) {
1110                         r = adev->ip_blocks[i].funcs->set_powergating_state((void *)adev,
1111                                                                             state);
1112                         if (r)
1113                                 return r;
1114                         break;
1115                 }
1116         }
1117         return r;
1118 }
1119
1120 int amdgpu_wait_for_idle(struct amdgpu_device *adev,
1121                          enum amd_ip_block_type block_type)
1122 {
1123         int i, r;
1124
1125         for (i = 0; i < adev->num_ip_blocks; i++) {
1126                 if (!adev->ip_block_status[i].valid)
1127                         continue;
1128                 if (adev->ip_blocks[i].type == block_type) {
1129                         r = adev->ip_blocks[i].funcs->wait_for_idle((void *)adev);
1130                         if (r)
1131                                 return r;
1132                         break;
1133                 }
1134         }
1135         return 0;
1136
1137 }
1138
1139 bool amdgpu_is_idle(struct amdgpu_device *adev,
1140                     enum amd_ip_block_type block_type)
1141 {
1142         int i;
1143
1144         for (i = 0; i < adev->num_ip_blocks; i++) {
1145                 if (!adev->ip_block_status[i].valid)
1146                         continue;
1147                 if (adev->ip_blocks[i].type == block_type)
1148                         return adev->ip_blocks[i].funcs->is_idle((void *)adev);
1149         }
1150         return true;
1151
1152 }
1153
1154 const struct amdgpu_ip_block_version * amdgpu_get_ip_block(
1155                                         struct amdgpu_device *adev,
1156                                         enum amd_ip_block_type type)
1157 {
1158         int i;
1159
1160         for (i = 0; i < adev->num_ip_blocks; i++)
1161                 if (adev->ip_blocks[i].type == type)
1162                         return &adev->ip_blocks[i];
1163
1164         return NULL;
1165 }
1166
1167 /**
1168  * amdgpu_ip_block_version_cmp
1169  *
1170  * @adev: amdgpu_device pointer
1171  * @type: enum amd_ip_block_type
1172  * @major: major version
1173  * @minor: minor version
1174  *
1175  * return 0 if equal or greater
1176  * return 1 if smaller or the ip_block doesn't exist
1177  */
1178 int amdgpu_ip_block_version_cmp(struct amdgpu_device *adev,
1179                                 enum amd_ip_block_type type,
1180                                 u32 major, u32 minor)
1181 {
1182         const struct amdgpu_ip_block_version *ip_block;
1183         ip_block = amdgpu_get_ip_block(adev, type);
1184
1185         if (ip_block && ((ip_block->major > major) ||
1186                         ((ip_block->major == major) &&
1187                         (ip_block->minor >= minor))))
1188                 return 0;
1189
1190         return 1;
1191 }
1192
1193 static void amdgpu_whether_enable_virtual_display(struct amdgpu_device *adev)
1194 {
1195         adev->enable_virtual_display = false;
1196
1197         if (amdgpu_virtual_display) {
1198                 struct drm_device *ddev = adev->ddev;
1199                 const char *pci_address_name = pci_name(ddev->pdev);
1200                 char *pciaddstr, *pciaddstr_tmp, *pciaddname;
1201
1202                 pciaddstr = kstrdup(amdgpu_virtual_display, GFP_KERNEL);
1203                 pciaddstr_tmp = pciaddstr;
1204                 while ((pciaddname = strsep(&pciaddstr_tmp, ";"))) {
1205                         if (!strcmp(pci_address_name, pciaddname)) {
1206                                 adev->enable_virtual_display = true;
1207                                 break;
1208                         }
1209                 }
1210
1211                 DRM_INFO("virtual display string:%s, %s:virtual_display:%d\n",
1212                                  amdgpu_virtual_display, pci_address_name,
1213                                  adev->enable_virtual_display);
1214
1215                 kfree(pciaddstr);
1216         }
1217 }
1218
1219 static int amdgpu_early_init(struct amdgpu_device *adev)
1220 {
1221         int i, r;
1222
1223         amdgpu_whether_enable_virtual_display(adev);
1224
1225         switch (adev->asic_type) {
1226         case CHIP_TOPAZ:
1227         case CHIP_TONGA:
1228         case CHIP_FIJI:
1229         case CHIP_POLARIS11:
1230         case CHIP_POLARIS10:
1231         case CHIP_CARRIZO:
1232         case CHIP_STONEY:
1233                 if (adev->asic_type == CHIP_CARRIZO || adev->asic_type == CHIP_STONEY)
1234                         adev->family = AMDGPU_FAMILY_CZ;
1235                 else
1236                         adev->family = AMDGPU_FAMILY_VI;
1237
1238                 r = vi_set_ip_blocks(adev);
1239                 if (r)
1240                         return r;
1241                 break;
1242 #ifdef CONFIG_DRM_AMDGPU_SI
1243         case CHIP_VERDE:
1244         case CHIP_TAHITI:
1245         case CHIP_PITCAIRN:
1246         case CHIP_OLAND:
1247         case CHIP_HAINAN:
1248                 adev->family = AMDGPU_FAMILY_SI;
1249                 r = si_set_ip_blocks(adev);
1250                 if (r)
1251                         return r;
1252                 break;
1253 #endif
1254 #ifdef CONFIG_DRM_AMDGPU_CIK
1255         case CHIP_BONAIRE:
1256         case CHIP_HAWAII:
1257         case CHIP_KAVERI:
1258         case CHIP_KABINI:
1259         case CHIP_MULLINS:
1260                 if ((adev->asic_type == CHIP_BONAIRE) || (adev->asic_type == CHIP_HAWAII))
1261                         adev->family = AMDGPU_FAMILY_CI;
1262                 else
1263                         adev->family = AMDGPU_FAMILY_KV;
1264
1265                 r = cik_set_ip_blocks(adev);
1266                 if (r)
1267                         return r;
1268                 break;
1269 #endif
1270         default:
1271                 /* FIXME: not supported yet */
1272                 return -EINVAL;
1273         }
1274
1275         adev->ip_block_status = kcalloc(adev->num_ip_blocks,
1276                                         sizeof(struct amdgpu_ip_block_status), GFP_KERNEL);
1277         if (adev->ip_block_status == NULL)
1278                 return -ENOMEM;
1279
1280         if (adev->ip_blocks == NULL) {
1281                 DRM_ERROR("No IP blocks found!\n");
1282                 return r;
1283         }
1284
1285         for (i = 0; i < adev->num_ip_blocks; i++) {
1286                 if ((amdgpu_ip_block_mask & (1 << i)) == 0) {
1287                         DRM_ERROR("disabled ip block: %d\n", i);
1288                         adev->ip_block_status[i].valid = false;
1289                 } else {
1290                         if (adev->ip_blocks[i].funcs->early_init) {
1291                                 r = adev->ip_blocks[i].funcs->early_init((void *)adev);
1292                                 if (r == -ENOENT) {
1293                                         adev->ip_block_status[i].valid = false;
1294                                 } else if (r) {
1295                                         DRM_ERROR("early_init of IP block <%s> failed %d\n", adev->ip_blocks[i].funcs->name, r);
1296                                         return r;
1297                                 } else {
1298                                         adev->ip_block_status[i].valid = true;
1299                                 }
1300                         } else {
1301                                 adev->ip_block_status[i].valid = true;
1302                         }
1303                 }
1304         }
1305
1306         adev->cg_flags &= amdgpu_cg_mask;
1307         adev->pg_flags &= amdgpu_pg_mask;
1308
1309         return 0;
1310 }
1311
1312 static int amdgpu_init(struct amdgpu_device *adev)
1313 {
1314         int i, r;
1315
1316         for (i = 0; i < adev->num_ip_blocks; i++) {
1317                 if (!adev->ip_block_status[i].valid)
1318                         continue;
1319                 r = adev->ip_blocks[i].funcs->sw_init((void *)adev);
1320                 if (r) {
1321                         DRM_ERROR("sw_init of IP block <%s> failed %d\n", adev->ip_blocks[i].funcs->name, r);
1322                         return r;
1323                 }
1324                 adev->ip_block_status[i].sw = true;
1325                 /* need to do gmc hw init early so we can allocate gpu mem */
1326                 if (adev->ip_blocks[i].type == AMD_IP_BLOCK_TYPE_GMC) {
1327                         r = amdgpu_vram_scratch_init(adev);
1328                         if (r) {
1329                                 DRM_ERROR("amdgpu_vram_scratch_init failed %d\n", r);
1330                                 return r;
1331                         }
1332                         r = adev->ip_blocks[i].funcs->hw_init((void *)adev);
1333                         if (r) {
1334                                 DRM_ERROR("hw_init %d failed %d\n", i, r);
1335                                 return r;
1336                         }
1337                         r = amdgpu_wb_init(adev);
1338                         if (r) {
1339                                 DRM_ERROR("amdgpu_wb_init failed %d\n", r);
1340                                 return r;
1341                         }
1342                         adev->ip_block_status[i].hw = true;
1343                 }
1344         }
1345
1346         for (i = 0; i < adev->num_ip_blocks; i++) {
1347                 if (!adev->ip_block_status[i].sw)
1348                         continue;
1349                 /* gmc hw init is done early */
1350                 if (adev->ip_blocks[i].type == AMD_IP_BLOCK_TYPE_GMC)
1351                         continue;
1352                 r = adev->ip_blocks[i].funcs->hw_init((void *)adev);
1353                 if (r) {
1354                         DRM_ERROR("hw_init of IP block <%s> failed %d\n", adev->ip_blocks[i].funcs->name, r);
1355                         return r;
1356                 }
1357                 adev->ip_block_status[i].hw = true;
1358         }
1359
1360         return 0;
1361 }
1362
1363 static int amdgpu_late_init(struct amdgpu_device *adev)
1364 {
1365         int i = 0, r;
1366
1367         for (i = 0; i < adev->num_ip_blocks; i++) {
1368                 if (!adev->ip_block_status[i].valid)
1369                         continue;
1370                 if (adev->ip_blocks[i].type == AMD_IP_BLOCK_TYPE_UVD ||
1371                         adev->ip_blocks[i].type == AMD_IP_BLOCK_TYPE_VCE)
1372                         continue;
1373                 /* enable clockgating to save power */
1374                 r = adev->ip_blocks[i].funcs->set_clockgating_state((void *)adev,
1375                                                                     AMD_CG_STATE_GATE);
1376                 if (r) {
1377                         DRM_ERROR("set_clockgating_state(gate) of IP block <%s> failed %d\n", adev->ip_blocks[i].funcs->name, r);
1378                         return r;
1379                 }
1380                 if (adev->ip_blocks[i].funcs->late_init) {
1381                         r = adev->ip_blocks[i].funcs->late_init((void *)adev);
1382                         if (r) {
1383                                 DRM_ERROR("late_init of IP block <%s> failed %d\n", adev->ip_blocks[i].funcs->name, r);
1384                                 return r;
1385                         }
1386                 }
1387         }
1388
1389         return 0;
1390 }
1391
1392 static int amdgpu_fini(struct amdgpu_device *adev)
1393 {
1394         int i, r;
1395
1396         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
1397                 if (!adev->ip_block_status[i].hw)
1398                         continue;
1399                 if (adev->ip_blocks[i].type == AMD_IP_BLOCK_TYPE_GMC) {
1400                         amdgpu_wb_fini(adev);
1401                         amdgpu_vram_scratch_fini(adev);
1402                 }
1403                 /* ungate blocks before hw fini so that we can shutdown the blocks safely */
1404                 r = adev->ip_blocks[i].funcs->set_clockgating_state((void *)adev,
1405                                                                     AMD_CG_STATE_UNGATE);
1406                 if (r) {
1407                         DRM_ERROR("set_clockgating_state(ungate) of IP block <%s> failed %d\n", adev->ip_blocks[i].funcs->name, r);
1408                         return r;
1409                 }
1410                 r = adev->ip_blocks[i].funcs->hw_fini((void *)adev);
1411                 /* XXX handle errors */
1412                 if (r) {
1413                         DRM_DEBUG("hw_fini of IP block <%s> failed %d\n", adev->ip_blocks[i].funcs->name, r);
1414                 }
1415                 adev->ip_block_status[i].hw = false;
1416         }
1417
1418         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
1419                 if (!adev->ip_block_status[i].sw)
1420                         continue;
1421                 r = adev->ip_blocks[i].funcs->sw_fini((void *)adev);
1422                 /* XXX handle errors */
1423                 if (r) {
1424                         DRM_DEBUG("sw_fini of IP block <%s> failed %d\n", adev->ip_blocks[i].funcs->name, r);
1425                 }
1426                 adev->ip_block_status[i].sw = false;
1427                 adev->ip_block_status[i].valid = false;
1428         }
1429
1430         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
1431                 if (adev->ip_blocks[i].funcs->late_fini)
1432                         adev->ip_blocks[i].funcs->late_fini((void *)adev);
1433         }
1434
1435         return 0;
1436 }
1437
1438 static int amdgpu_suspend(struct amdgpu_device *adev)
1439 {
1440         int i, r;
1441
1442         /* ungate SMC block first */
1443         r = amdgpu_set_clockgating_state(adev, AMD_IP_BLOCK_TYPE_SMC,
1444                                          AMD_CG_STATE_UNGATE);
1445         if (r) {
1446                 DRM_ERROR("set_clockgating_state(ungate) SMC failed %d\n",r);
1447         }
1448
1449         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
1450                 if (!adev->ip_block_status[i].valid)
1451                         continue;
1452                 /* ungate blocks so that suspend can properly shut them down */
1453                 if (i != AMD_IP_BLOCK_TYPE_SMC) {
1454                         r = adev->ip_blocks[i].funcs->set_clockgating_state((void *)adev,
1455                                                                             AMD_CG_STATE_UNGATE);
1456                         if (r) {
1457                                 DRM_ERROR("set_clockgating_state(ungate) of IP block <%s> failed %d\n", adev->ip_blocks[i].funcs->name, r);
1458                         }
1459                 }
1460                 /* XXX handle errors */
1461                 r = adev->ip_blocks[i].funcs->suspend(adev);
1462                 /* XXX handle errors */
1463                 if (r) {
1464                         DRM_ERROR("suspend of IP block <%s> failed %d\n", adev->ip_blocks[i].funcs->name, r);
1465                 }
1466         }
1467
1468         return 0;
1469 }
1470
1471 static int amdgpu_resume(struct amdgpu_device *adev)
1472 {
1473         int i, r;
1474
1475         for (i = 0; i < adev->num_ip_blocks; i++) {
1476                 if (!adev->ip_block_status[i].valid)
1477                         continue;
1478                 r = adev->ip_blocks[i].funcs->resume(adev);
1479                 if (r) {
1480                         DRM_ERROR("resume of IP block <%s> failed %d\n", adev->ip_blocks[i].funcs->name, r);
1481                         return r;
1482                 }
1483         }
1484
1485         return 0;
1486 }
1487
1488 static bool amdgpu_device_is_virtual(void)
1489 {
1490 #ifdef CONFIG_X86
1491         return boot_cpu_has(X86_FEATURE_HYPERVISOR);
1492 #else
1493         return false;
1494 #endif
1495 }
1496
1497 /**
1498  * amdgpu_device_init - initialize the driver
1499  *
1500  * @adev: amdgpu_device pointer
1501  * @pdev: drm dev pointer
1502  * @pdev: pci dev pointer
1503  * @flags: driver flags
1504  *
1505  * Initializes the driver info and hw (all asics).
1506  * Returns 0 for success or an error on failure.
1507  * Called at driver startup.
1508  */
1509 int amdgpu_device_init(struct amdgpu_device *adev,
1510                        struct drm_device *ddev,
1511                        struct pci_dev *pdev,
1512                        uint32_t flags)
1513 {
1514         int r, i;
1515         bool runtime = false;
1516         u32 max_MBps;
1517
1518         adev->shutdown = false;
1519         adev->dev = &pdev->dev;
1520         adev->ddev = ddev;
1521         adev->pdev = pdev;
1522         adev->flags = flags;
1523         adev->asic_type = flags & AMD_ASIC_MASK;
1524         adev->is_atom_bios = false;
1525         adev->usec_timeout = AMDGPU_MAX_USEC_TIMEOUT;
1526         adev->mc.gtt_size = 512 * 1024 * 1024;
1527         adev->accel_working = false;
1528         adev->num_rings = 0;
1529         adev->mman.buffer_funcs = NULL;
1530         adev->mman.buffer_funcs_ring = NULL;
1531         adev->vm_manager.vm_pte_funcs = NULL;
1532         adev->vm_manager.vm_pte_num_rings = 0;
1533         adev->gart.gart_funcs = NULL;
1534         adev->fence_context = fence_context_alloc(AMDGPU_MAX_RINGS);
1535
1536         adev->smc_rreg = &amdgpu_invalid_rreg;
1537         adev->smc_wreg = &amdgpu_invalid_wreg;
1538         adev->pcie_rreg = &amdgpu_invalid_rreg;
1539         adev->pcie_wreg = &amdgpu_invalid_wreg;
1540         adev->pciep_rreg = &amdgpu_invalid_rreg;
1541         adev->pciep_wreg = &amdgpu_invalid_wreg;
1542         adev->uvd_ctx_rreg = &amdgpu_invalid_rreg;
1543         adev->uvd_ctx_wreg = &amdgpu_invalid_wreg;
1544         adev->didt_rreg = &amdgpu_invalid_rreg;
1545         adev->didt_wreg = &amdgpu_invalid_wreg;
1546         adev->gc_cac_rreg = &amdgpu_invalid_rreg;
1547         adev->gc_cac_wreg = &amdgpu_invalid_wreg;
1548         adev->audio_endpt_rreg = &amdgpu_block_invalid_rreg;
1549         adev->audio_endpt_wreg = &amdgpu_block_invalid_wreg;
1550
1551
1552         DRM_INFO("initializing kernel modesetting (%s 0x%04X:0x%04X 0x%04X:0x%04X 0x%02X).\n",
1553                  amdgpu_asic_name[adev->asic_type], pdev->vendor, pdev->device,
1554                  pdev->subsystem_vendor, pdev->subsystem_device, pdev->revision);
1555
1556         /* mutex initialization are all done here so we
1557          * can recall function without having locking issues */
1558         mutex_init(&adev->vm_manager.lock);
1559         atomic_set(&adev->irq.ih.lock, 0);
1560         mutex_init(&adev->pm.mutex);
1561         mutex_init(&adev->gfx.gpu_clock_mutex);
1562         mutex_init(&adev->srbm_mutex);
1563         mutex_init(&adev->grbm_idx_mutex);
1564         mutex_init(&adev->mn_lock);
1565         hash_init(adev->mn_hash);
1566
1567         amdgpu_check_arguments(adev);
1568
1569         /* Registers mapping */
1570         /* TODO: block userspace mapping of io register */
1571         spin_lock_init(&adev->mmio_idx_lock);
1572         spin_lock_init(&adev->smc_idx_lock);
1573         spin_lock_init(&adev->pcie_idx_lock);
1574         spin_lock_init(&adev->uvd_ctx_idx_lock);
1575         spin_lock_init(&adev->didt_idx_lock);
1576         spin_lock_init(&adev->gc_cac_idx_lock);
1577         spin_lock_init(&adev->audio_endpt_idx_lock);
1578         spin_lock_init(&adev->mm_stats.lock);
1579
1580         INIT_LIST_HEAD(&adev->shadow_list);
1581         mutex_init(&adev->shadow_list_lock);
1582
1583         INIT_LIST_HEAD(&adev->gtt_list);
1584         spin_lock_init(&adev->gtt_list_lock);
1585
1586         if (adev->asic_type >= CHIP_BONAIRE) {
1587                 adev->rmmio_base = pci_resource_start(adev->pdev, 5);
1588                 adev->rmmio_size = pci_resource_len(adev->pdev, 5);
1589         } else {
1590                 adev->rmmio_base = pci_resource_start(adev->pdev, 2);
1591                 adev->rmmio_size = pci_resource_len(adev->pdev, 2);
1592         }
1593
1594         adev->rmmio = ioremap(adev->rmmio_base, adev->rmmio_size);
1595         if (adev->rmmio == NULL) {
1596                 return -ENOMEM;
1597         }
1598         DRM_INFO("register mmio base: 0x%08X\n", (uint32_t)adev->rmmio_base);
1599         DRM_INFO("register mmio size: %u\n", (unsigned)adev->rmmio_size);
1600
1601         if (adev->asic_type >= CHIP_BONAIRE)
1602                 /* doorbell bar mapping */
1603                 amdgpu_doorbell_init(adev);
1604
1605         /* io port mapping */
1606         for (i = 0; i < DEVICE_COUNT_RESOURCE; i++) {
1607                 if (pci_resource_flags(adev->pdev, i) & IORESOURCE_IO) {
1608                         adev->rio_mem_size = pci_resource_len(adev->pdev, i);
1609                         adev->rio_mem = pci_iomap(adev->pdev, i, adev->rio_mem_size);
1610                         break;
1611                 }
1612         }
1613         if (adev->rio_mem == NULL)
1614                 DRM_ERROR("Unable to find PCI I/O BAR\n");
1615
1616         /* early init functions */
1617         r = amdgpu_early_init(adev);
1618         if (r)
1619                 return r;
1620
1621         /* if we have > 1 VGA cards, then disable the amdgpu VGA resources */
1622         /* this will fail for cards that aren't VGA class devices, just
1623          * ignore it */
1624         vga_client_register(adev->pdev, adev, NULL, amdgpu_vga_set_decode);
1625
1626         if (amdgpu_runtime_pm == 1)
1627                 runtime = true;
1628         if (amdgpu_device_is_px(ddev))
1629                 runtime = true;
1630         vga_switcheroo_register_client(adev->pdev, &amdgpu_switcheroo_ops, runtime);
1631         if (runtime)
1632                 vga_switcheroo_init_domain_pm_ops(adev->dev, &adev->vga_pm_domain);
1633
1634         /* Read BIOS */
1635         if (!amdgpu_get_bios(adev)) {
1636                 r = -EINVAL;
1637                 goto failed;
1638         }
1639         /* Must be an ATOMBIOS */
1640         if (!adev->is_atom_bios) {
1641                 dev_err(adev->dev, "Expecting atombios for GPU\n");
1642                 r = -EINVAL;
1643                 goto failed;
1644         }
1645         r = amdgpu_atombios_init(adev);
1646         if (r) {
1647                 dev_err(adev->dev, "amdgpu_atombios_init failed\n");
1648                 goto failed;
1649         }
1650
1651         /* See if the asic supports SR-IOV */
1652         adev->virtualization.supports_sr_iov =
1653                 amdgpu_atombios_has_gpu_virtualization_table(adev);
1654
1655         /* Check if we are executing in a virtualized environment */
1656         adev->virtualization.is_virtual = amdgpu_device_is_virtual();
1657         adev->virtualization.caps = amdgpu_asic_get_virtual_caps(adev);
1658
1659         /* Post card if necessary */
1660         if (!amdgpu_card_posted(adev) ||
1661             (adev->virtualization.is_virtual &&
1662              !(adev->virtualization.caps & AMDGPU_VIRT_CAPS_SRIOV_EN))) {
1663                 if (!adev->bios) {
1664                         dev_err(adev->dev, "Card not posted and no BIOS - ignoring\n");
1665                         r = -EINVAL;
1666                         goto failed;
1667                 }
1668                 DRM_INFO("GPU not posted. posting now...\n");
1669                 amdgpu_atom_asic_init(adev->mode_info.atom_context);
1670         }
1671
1672         /* Initialize clocks */
1673         r = amdgpu_atombios_get_clock_info(adev);
1674         if (r) {
1675                 dev_err(adev->dev, "amdgpu_atombios_get_clock_info failed\n");
1676                 goto failed;
1677         }
1678         /* init i2c buses */
1679         amdgpu_atombios_i2c_init(adev);
1680
1681         /* Fence driver */
1682         r = amdgpu_fence_driver_init(adev);
1683         if (r) {
1684                 dev_err(adev->dev, "amdgpu_fence_driver_init failed\n");
1685                 goto failed;
1686         }
1687
1688         /* init the mode config */
1689         drm_mode_config_init(adev->ddev);
1690
1691         r = amdgpu_init(adev);
1692         if (r) {
1693                 dev_err(adev->dev, "amdgpu_init failed\n");
1694                 amdgpu_fini(adev);
1695                 goto failed;
1696         }
1697
1698         adev->accel_working = true;
1699
1700         /* Initialize the buffer migration limit. */
1701         if (amdgpu_moverate >= 0)
1702                 max_MBps = amdgpu_moverate;
1703         else
1704                 max_MBps = 8; /* Allow 8 MB/s. */
1705         /* Get a log2 for easy divisions. */
1706         adev->mm_stats.log2_max_MBps = ilog2(max(1u, max_MBps));
1707
1708         amdgpu_fbdev_init(adev);
1709
1710         r = amdgpu_ib_pool_init(adev);
1711         if (r) {
1712                 dev_err(adev->dev, "IB initialization failed (%d).\n", r);
1713                 goto failed;
1714         }
1715
1716         r = amdgpu_ib_ring_tests(adev);
1717         if (r)
1718                 DRM_ERROR("ib ring test failed (%d).\n", r);
1719
1720         r = amdgpu_gem_debugfs_init(adev);
1721         if (r) {
1722                 DRM_ERROR("registering gem debugfs failed (%d).\n", r);
1723         }
1724
1725         r = amdgpu_debugfs_regs_init(adev);
1726         if (r) {
1727                 DRM_ERROR("registering register debugfs failed (%d).\n", r);
1728         }
1729
1730         r = amdgpu_debugfs_firmware_init(adev);
1731         if (r) {
1732                 DRM_ERROR("registering firmware debugfs failed (%d).\n", r);
1733                 return r;
1734         }
1735
1736         if ((amdgpu_testing & 1)) {
1737                 if (adev->accel_working)
1738                         amdgpu_test_moves(adev);
1739                 else
1740                         DRM_INFO("amdgpu: acceleration disabled, skipping move tests\n");
1741         }
1742         if ((amdgpu_testing & 2)) {
1743                 if (adev->accel_working)
1744                         amdgpu_test_syncing(adev);
1745                 else
1746                         DRM_INFO("amdgpu: acceleration disabled, skipping sync tests\n");
1747         }
1748         if (amdgpu_benchmarking) {
1749                 if (adev->accel_working)
1750                         amdgpu_benchmark(adev, amdgpu_benchmarking);
1751                 else
1752                         DRM_INFO("amdgpu: acceleration disabled, skipping benchmarks\n");
1753         }
1754
1755         /* enable clockgating, etc. after ib tests, etc. since some blocks require
1756          * explicit gating rather than handling it automatically.
1757          */
1758         r = amdgpu_late_init(adev);
1759         if (r) {
1760                 dev_err(adev->dev, "amdgpu_late_init failed\n");
1761                 goto failed;
1762         }
1763
1764         return 0;
1765
1766 failed:
1767         if (runtime)
1768                 vga_switcheroo_fini_domain_pm_ops(adev->dev);
1769         return r;
1770 }
1771
1772 static void amdgpu_debugfs_remove_files(struct amdgpu_device *adev);
1773
1774 /**
1775  * amdgpu_device_fini - tear down the driver
1776  *
1777  * @adev: amdgpu_device pointer
1778  *
1779  * Tear down the driver info (all asics).
1780  * Called at driver shutdown.
1781  */
1782 void amdgpu_device_fini(struct amdgpu_device *adev)
1783 {
1784         int r;
1785
1786         DRM_INFO("amdgpu: finishing device.\n");
1787         adev->shutdown = true;
1788         /* evict vram memory */
1789         amdgpu_bo_evict_vram(adev);
1790         amdgpu_ib_pool_fini(adev);
1791         amdgpu_fence_driver_fini(adev);
1792         drm_crtc_force_disable_all(adev->ddev);
1793         amdgpu_fbdev_fini(adev);
1794         r = amdgpu_fini(adev);
1795         kfree(adev->ip_block_status);
1796         adev->ip_block_status = NULL;
1797         adev->accel_working = false;
1798         /* free i2c buses */
1799         amdgpu_i2c_fini(adev);
1800         amdgpu_atombios_fini(adev);
1801         kfree(adev->bios);
1802         adev->bios = NULL;
1803         vga_switcheroo_unregister_client(adev->pdev);
1804         if (adev->flags & AMD_IS_PX)
1805                 vga_switcheroo_fini_domain_pm_ops(adev->dev);
1806         vga_client_register(adev->pdev, NULL, NULL, NULL);
1807         if (adev->rio_mem)
1808                 pci_iounmap(adev->pdev, adev->rio_mem);
1809         adev->rio_mem = NULL;
1810         iounmap(adev->rmmio);
1811         adev->rmmio = NULL;
1812         if (adev->asic_type >= CHIP_BONAIRE)
1813                 amdgpu_doorbell_fini(adev);
1814         amdgpu_debugfs_regs_cleanup(adev);
1815         amdgpu_debugfs_remove_files(adev);
1816 }
1817
1818
1819 /*
1820  * Suspend & resume.
1821  */
1822 /**
1823  * amdgpu_device_suspend - initiate device suspend
1824  *
1825  * @pdev: drm dev pointer
1826  * @state: suspend state
1827  *
1828  * Puts the hw in the suspend state (all asics).
1829  * Returns 0 for success or an error on failure.
1830  * Called at driver suspend.
1831  */
1832 int amdgpu_device_suspend(struct drm_device *dev, bool suspend, bool fbcon)
1833 {
1834         struct amdgpu_device *adev;
1835         struct drm_crtc *crtc;
1836         struct drm_connector *connector;
1837         int r;
1838
1839         if (dev == NULL || dev->dev_private == NULL) {
1840                 return -ENODEV;
1841         }
1842
1843         adev = dev->dev_private;
1844
1845         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF ||
1846             dev->switch_power_state == DRM_SWITCH_POWER_DYNAMIC_OFF)
1847                 return 0;
1848
1849         drm_kms_helper_poll_disable(dev);
1850
1851         /* turn off display hw */
1852         drm_modeset_lock_all(dev);
1853         list_for_each_entry(connector, &dev->mode_config.connector_list, head) {
1854                 drm_helper_connector_dpms(connector, DRM_MODE_DPMS_OFF);
1855         }
1856         drm_modeset_unlock_all(dev);
1857
1858         /* unpin the front buffers and cursors */
1859         list_for_each_entry(crtc, &dev->mode_config.crtc_list, head) {
1860                 struct amdgpu_crtc *amdgpu_crtc = to_amdgpu_crtc(crtc);
1861                 struct amdgpu_framebuffer *rfb = to_amdgpu_framebuffer(crtc->primary->fb);
1862                 struct amdgpu_bo *robj;
1863
1864                 if (amdgpu_crtc->cursor_bo) {
1865                         struct amdgpu_bo *aobj = gem_to_amdgpu_bo(amdgpu_crtc->cursor_bo);
1866                         r = amdgpu_bo_reserve(aobj, false);
1867                         if (r == 0) {
1868                                 amdgpu_bo_unpin(aobj);
1869                                 amdgpu_bo_unreserve(aobj);
1870                         }
1871                 }
1872
1873                 if (rfb == NULL || rfb->obj == NULL) {
1874                         continue;
1875                 }
1876                 robj = gem_to_amdgpu_bo(rfb->obj);
1877                 /* don't unpin kernel fb objects */
1878                 if (!amdgpu_fbdev_robj_is_fb(adev, robj)) {
1879                         r = amdgpu_bo_reserve(robj, false);
1880                         if (r == 0) {
1881                                 amdgpu_bo_unpin(robj);
1882                                 amdgpu_bo_unreserve(robj);
1883                         }
1884                 }
1885         }
1886         /* evict vram memory */
1887         amdgpu_bo_evict_vram(adev);
1888
1889         amdgpu_fence_driver_suspend(adev);
1890
1891         r = amdgpu_suspend(adev);
1892
1893         /* evict remaining vram memory */
1894         amdgpu_bo_evict_vram(adev);
1895
1896         pci_save_state(dev->pdev);
1897         if (suspend) {
1898                 /* Shut down the device */
1899                 pci_disable_device(dev->pdev);
1900                 pci_set_power_state(dev->pdev, PCI_D3hot);
1901         } else {
1902                 r = amdgpu_asic_reset(adev);
1903                 if (r)
1904                         DRM_ERROR("amdgpu asic reset failed\n");
1905         }
1906
1907         if (fbcon) {
1908                 console_lock();
1909                 amdgpu_fbdev_set_suspend(adev, 1);
1910                 console_unlock();
1911         }
1912         return 0;
1913 }
1914
1915 /**
1916  * amdgpu_device_resume - initiate device resume
1917  *
1918  * @pdev: drm dev pointer
1919  *
1920  * Bring the hw back to operating state (all asics).
1921  * Returns 0 for success or an error on failure.
1922  * Called at driver resume.
1923  */
1924 int amdgpu_device_resume(struct drm_device *dev, bool resume, bool fbcon)
1925 {
1926         struct drm_connector *connector;
1927         struct amdgpu_device *adev = dev->dev_private;
1928         struct drm_crtc *crtc;
1929         int r;
1930
1931         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF ||
1932             dev->switch_power_state == DRM_SWITCH_POWER_DYNAMIC_OFF)
1933                 return 0;
1934
1935         if (fbcon)
1936                 console_lock();
1937
1938         if (resume) {
1939                 pci_set_power_state(dev->pdev, PCI_D0);
1940                 pci_restore_state(dev->pdev);
1941                 r = pci_enable_device(dev->pdev);
1942                 if (r) {
1943                         if (fbcon)
1944                                 console_unlock();
1945                         return r;
1946                 }
1947         }
1948
1949         /* post card */
1950         if (!amdgpu_card_posted(adev) || !resume) {
1951                 r = amdgpu_atom_asic_init(adev->mode_info.atom_context);
1952                 if (r)
1953                         DRM_ERROR("amdgpu asic init failed\n");
1954         }
1955
1956         r = amdgpu_resume(adev);
1957         if (r)
1958                 DRM_ERROR("amdgpu_resume failed (%d).\n", r);
1959
1960         amdgpu_fence_driver_resume(adev);
1961
1962         if (resume) {
1963                 r = amdgpu_ib_ring_tests(adev);
1964                 if (r)
1965                         DRM_ERROR("ib ring test failed (%d).\n", r);
1966         }
1967
1968         r = amdgpu_late_init(adev);
1969         if (r)
1970                 return r;
1971
1972         /* pin cursors */
1973         list_for_each_entry(crtc, &dev->mode_config.crtc_list, head) {
1974                 struct amdgpu_crtc *amdgpu_crtc = to_amdgpu_crtc(crtc);
1975
1976                 if (amdgpu_crtc->cursor_bo) {
1977                         struct amdgpu_bo *aobj = gem_to_amdgpu_bo(amdgpu_crtc->cursor_bo);
1978                         r = amdgpu_bo_reserve(aobj, false);
1979                         if (r == 0) {
1980                                 r = amdgpu_bo_pin(aobj,
1981                                                   AMDGPU_GEM_DOMAIN_VRAM,
1982                                                   &amdgpu_crtc->cursor_addr);
1983                                 if (r != 0)
1984                                         DRM_ERROR("Failed to pin cursor BO (%d)\n", r);
1985                                 amdgpu_bo_unreserve(aobj);
1986                         }
1987                 }
1988         }
1989
1990         /* blat the mode back in */
1991         if (fbcon) {
1992                 drm_helper_resume_force_mode(dev);
1993                 /* turn on display hw */
1994                 drm_modeset_lock_all(dev);
1995                 list_for_each_entry(connector, &dev->mode_config.connector_list, head) {
1996                         drm_helper_connector_dpms(connector, DRM_MODE_DPMS_ON);
1997                 }
1998                 drm_modeset_unlock_all(dev);
1999         }
2000
2001         drm_kms_helper_poll_enable(dev);
2002
2003         /*
2004          * Most of the connector probing functions try to acquire runtime pm
2005          * refs to ensure that the GPU is powered on when connector polling is
2006          * performed. Since we're calling this from a runtime PM callback,
2007          * trying to acquire rpm refs will cause us to deadlock.
2008          *
2009          * Since we're guaranteed to be holding the rpm lock, it's safe to
2010          * temporarily disable the rpm helpers so this doesn't deadlock us.
2011          */
2012 #ifdef CONFIG_PM
2013         dev->dev->power.disable_depth++;
2014 #endif
2015         drm_helper_hpd_irq_event(dev);
2016 #ifdef CONFIG_PM
2017         dev->dev->power.disable_depth--;
2018 #endif
2019
2020         if (fbcon) {
2021                 amdgpu_fbdev_set_suspend(adev, 0);
2022                 console_unlock();
2023         }
2024
2025         return 0;
2026 }
2027
2028 static bool amdgpu_check_soft_reset(struct amdgpu_device *adev)
2029 {
2030         int i;
2031         bool asic_hang = false;
2032
2033         for (i = 0; i < adev->num_ip_blocks; i++) {
2034                 if (!adev->ip_block_status[i].valid)
2035                         continue;
2036                 if (adev->ip_blocks[i].funcs->check_soft_reset)
2037                         adev->ip_blocks[i].funcs->check_soft_reset(adev);
2038                 if (adev->ip_block_status[i].hang) {
2039                         DRM_INFO("IP block:%d is hang!\n", i);
2040                         asic_hang = true;
2041                 }
2042         }
2043         return asic_hang;
2044 }
2045
2046 int amdgpu_pre_soft_reset(struct amdgpu_device *adev)
2047 {
2048         int i, r = 0;
2049
2050         for (i = 0; i < adev->num_ip_blocks; i++) {
2051                 if (!adev->ip_block_status[i].valid)
2052                         continue;
2053                 if (adev->ip_block_status[i].hang &&
2054                     adev->ip_blocks[i].funcs->pre_soft_reset) {
2055                         r = adev->ip_blocks[i].funcs->pre_soft_reset(adev);
2056                         if (r)
2057                                 return r;
2058                 }
2059         }
2060
2061         return 0;
2062 }
2063
2064 static bool amdgpu_need_full_reset(struct amdgpu_device *adev)
2065 {
2066         if (adev->ip_block_status[AMD_IP_BLOCK_TYPE_GMC].hang ||
2067             adev->ip_block_status[AMD_IP_BLOCK_TYPE_SMC].hang ||
2068             adev->ip_block_status[AMD_IP_BLOCK_TYPE_ACP].hang ||
2069             adev->ip_block_status[AMD_IP_BLOCK_TYPE_DCE].hang) {
2070                 DRM_INFO("Some block need full reset!\n");
2071                 return true;
2072         }
2073         return false;
2074 }
2075
2076 static int amdgpu_soft_reset(struct amdgpu_device *adev)
2077 {
2078         int i, r = 0;
2079
2080         for (i = 0; i < adev->num_ip_blocks; i++) {
2081                 if (!adev->ip_block_status[i].valid)
2082                         continue;
2083                 if (adev->ip_block_status[i].hang &&
2084                     adev->ip_blocks[i].funcs->soft_reset) {
2085                         r = adev->ip_blocks[i].funcs->soft_reset(adev);
2086                         if (r)
2087                                 return r;
2088                 }
2089         }
2090
2091         return 0;
2092 }
2093
2094 static int amdgpu_post_soft_reset(struct amdgpu_device *adev)
2095 {
2096         int i, r = 0;
2097
2098         for (i = 0; i < adev->num_ip_blocks; i++) {
2099                 if (!adev->ip_block_status[i].valid)
2100                         continue;
2101                 if (adev->ip_block_status[i].hang &&
2102                     adev->ip_blocks[i].funcs->post_soft_reset)
2103                         r = adev->ip_blocks[i].funcs->post_soft_reset(adev);
2104                 if (r)
2105                         return r;
2106         }
2107
2108         return 0;
2109 }
2110
2111 bool amdgpu_need_backup(struct amdgpu_device *adev)
2112 {
2113         if (adev->flags & AMD_IS_APU)
2114                 return false;
2115
2116         return amdgpu_lockup_timeout > 0 ? true : false;
2117 }
2118
2119 static int amdgpu_recover_vram_from_shadow(struct amdgpu_device *adev,
2120                                            struct amdgpu_ring *ring,
2121                                            struct amdgpu_bo *bo,
2122                                            struct fence **fence)
2123 {
2124         uint32_t domain;
2125         int r;
2126
2127        if (!bo->shadow)
2128                return 0;
2129
2130        r = amdgpu_bo_reserve(bo, false);
2131        if (r)
2132                return r;
2133        domain = amdgpu_mem_type_to_domain(bo->tbo.mem.mem_type);
2134        /* if bo has been evicted, then no need to recover */
2135        if (domain == AMDGPU_GEM_DOMAIN_VRAM) {
2136                r = amdgpu_bo_restore_from_shadow(adev, ring, bo,
2137                                                  NULL, fence, true);
2138                if (r) {
2139                        DRM_ERROR("recover page table failed!\n");
2140                        goto err;
2141                }
2142        }
2143 err:
2144        amdgpu_bo_unreserve(bo);
2145        return r;
2146 }
2147
2148 /**
2149  * amdgpu_gpu_reset - reset the asic
2150  *
2151  * @adev: amdgpu device pointer
2152  *
2153  * Attempt the reset the GPU if it has hung (all asics).
2154  * Returns 0 for success or an error on failure.
2155  */
2156 int amdgpu_gpu_reset(struct amdgpu_device *adev)
2157 {
2158         int i, r;
2159         int resched;
2160         bool need_full_reset;
2161
2162         if (!amdgpu_check_soft_reset(adev)) {
2163                 DRM_INFO("No hardware hang detected. Did some blocks stall?\n");
2164                 return 0;
2165         }
2166
2167         atomic_inc(&adev->gpu_reset_counter);
2168
2169         /* block TTM */
2170         resched = ttm_bo_lock_delayed_workqueue(&adev->mman.bdev);
2171
2172         /* block scheduler */
2173         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
2174                 struct amdgpu_ring *ring = adev->rings[i];
2175
2176                 if (!ring)
2177                         continue;
2178                 kthread_park(ring->sched.thread);
2179                 amd_sched_hw_job_reset(&ring->sched);
2180         }
2181         /* after all hw jobs are reset, hw fence is meaningless, so force_completion */
2182         amdgpu_fence_driver_force_completion(adev);
2183
2184         need_full_reset = amdgpu_need_full_reset(adev);
2185
2186         if (!need_full_reset) {
2187                 amdgpu_pre_soft_reset(adev);
2188                 r = amdgpu_soft_reset(adev);
2189                 amdgpu_post_soft_reset(adev);
2190                 if (r || amdgpu_check_soft_reset(adev)) {
2191                         DRM_INFO("soft reset failed, will fallback to full reset!\n");
2192                         need_full_reset = true;
2193                 }
2194         }
2195
2196         if (need_full_reset) {
2197                 /* save scratch */
2198                 amdgpu_atombios_scratch_regs_save(adev);
2199                 r = amdgpu_suspend(adev);
2200
2201 retry:
2202                 /* Disable fb access */
2203                 if (adev->mode_info.num_crtc) {
2204                         struct amdgpu_mode_mc_save save;
2205                         amdgpu_display_stop_mc_access(adev, &save);
2206                         amdgpu_wait_for_idle(adev, AMD_IP_BLOCK_TYPE_GMC);
2207                 }
2208
2209                 r = amdgpu_asic_reset(adev);
2210                 /* post card */
2211                 amdgpu_atom_asic_init(adev->mode_info.atom_context);
2212
2213                 if (!r) {
2214                         dev_info(adev->dev, "GPU reset succeeded, trying to resume\n");
2215                         r = amdgpu_resume(adev);
2216                 }
2217                 /* restore scratch */
2218                 amdgpu_atombios_scratch_regs_restore(adev);
2219         }
2220         if (!r) {
2221                 amdgpu_irq_gpu_reset_resume_helper(adev);
2222                 if (need_full_reset && amdgpu_need_backup(adev)) {
2223                         r = amdgpu_ttm_recover_gart(adev);
2224                         if (r)
2225                                 DRM_ERROR("gart recovery failed!!!\n");
2226                 }
2227                 r = amdgpu_ib_ring_tests(adev);
2228                 if (r) {
2229                         dev_err(adev->dev, "ib ring test failed (%d).\n", r);
2230                         r = amdgpu_suspend(adev);
2231                         need_full_reset = true;
2232                         goto retry;
2233                 }
2234                 /**
2235                  * recovery vm page tables, since we cannot depend on VRAM is
2236                  * consistent after gpu full reset.
2237                  */
2238                 if (need_full_reset && amdgpu_need_backup(adev)) {
2239                         struct amdgpu_ring *ring = adev->mman.buffer_funcs_ring;
2240                         struct amdgpu_bo *bo, *tmp;
2241                         struct fence *fence = NULL, *next = NULL;
2242
2243                         DRM_INFO("recover vram bo from shadow\n");
2244                         mutex_lock(&adev->shadow_list_lock);
2245                         list_for_each_entry_safe(bo, tmp, &adev->shadow_list, shadow_list) {
2246                                 amdgpu_recover_vram_from_shadow(adev, ring, bo, &next);
2247                                 if (fence) {
2248                                         r = fence_wait(fence, false);
2249                                         if (r) {
2250                                                 WARN(r, "recovery from shadow isn't comleted\n");
2251                                                 break;
2252                                         }
2253                                 }
2254
2255                                 fence_put(fence);
2256                                 fence = next;
2257                         }
2258                         mutex_unlock(&adev->shadow_list_lock);
2259                         if (fence) {
2260                                 r = fence_wait(fence, false);
2261                                 if (r)
2262                                         WARN(r, "recovery from shadow isn't comleted\n");
2263                         }
2264                         fence_put(fence);
2265                 }
2266                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
2267                         struct amdgpu_ring *ring = adev->rings[i];
2268                         if (!ring)
2269                                 continue;
2270
2271                         amd_sched_job_recovery(&ring->sched);
2272                         kthread_unpark(ring->sched.thread);
2273                 }
2274         } else {
2275                 dev_err(adev->dev, "asic resume failed (%d).\n", r);
2276                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
2277                         if (adev->rings[i]) {
2278                                 kthread_unpark(adev->rings[i]->sched.thread);
2279                         }
2280                 }
2281         }
2282
2283         drm_helper_resume_force_mode(adev->ddev);
2284
2285         ttm_bo_unlock_delayed_workqueue(&adev->mman.bdev, resched);
2286         if (r) {
2287                 /* bad news, how to tell it to userspace ? */
2288                 dev_info(adev->dev, "GPU reset failed\n");
2289         }
2290
2291         return r;
2292 }
2293
2294 void amdgpu_get_pcie_info(struct amdgpu_device *adev)
2295 {
2296         u32 mask;
2297         int ret;
2298
2299         if (amdgpu_pcie_gen_cap)
2300                 adev->pm.pcie_gen_mask = amdgpu_pcie_gen_cap;
2301
2302         if (amdgpu_pcie_lane_cap)
2303                 adev->pm.pcie_mlw_mask = amdgpu_pcie_lane_cap;
2304
2305         /* covers APUs as well */
2306         if (pci_is_root_bus(adev->pdev->bus)) {
2307                 if (adev->pm.pcie_gen_mask == 0)
2308                         adev->pm.pcie_gen_mask = AMDGPU_DEFAULT_PCIE_GEN_MASK;
2309                 if (adev->pm.pcie_mlw_mask == 0)
2310                         adev->pm.pcie_mlw_mask = AMDGPU_DEFAULT_PCIE_MLW_MASK;
2311                 return;
2312         }
2313
2314         if (adev->pm.pcie_gen_mask == 0) {
2315                 ret = drm_pcie_get_speed_cap_mask(adev->ddev, &mask);
2316                 if (!ret) {
2317                         adev->pm.pcie_gen_mask = (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
2318                                                   CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
2319                                                   CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3);
2320
2321                         if (mask & DRM_PCIE_SPEED_25)
2322                                 adev->pm.pcie_gen_mask |= CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1;
2323                         if (mask & DRM_PCIE_SPEED_50)
2324                                 adev->pm.pcie_gen_mask |= CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2;
2325                         if (mask & DRM_PCIE_SPEED_80)
2326                                 adev->pm.pcie_gen_mask |= CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3;
2327                 } else {
2328                         adev->pm.pcie_gen_mask = AMDGPU_DEFAULT_PCIE_GEN_MASK;
2329                 }
2330         }
2331         if (adev->pm.pcie_mlw_mask == 0) {
2332                 ret = drm_pcie_get_max_link_width(adev->ddev, &mask);
2333                 if (!ret) {
2334                         switch (mask) {
2335                         case 32:
2336                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X32 |
2337                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X16 |
2338                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
2339                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
2340                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
2341                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
2342                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
2343                                 break;
2344                         case 16:
2345                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X16 |
2346                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
2347                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
2348                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
2349                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
2350                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
2351                                 break;
2352                         case 12:
2353                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
2354                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
2355                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
2356                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
2357                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
2358                                 break;
2359                         case 8:
2360                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
2361                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
2362                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
2363                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
2364                                 break;
2365                         case 4:
2366                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
2367                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
2368                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
2369                                 break;
2370                         case 2:
2371                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
2372                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
2373                                 break;
2374                         case 1:
2375                                 adev->pm.pcie_mlw_mask = CAIL_PCIE_LINK_WIDTH_SUPPORT_X1;
2376                                 break;
2377                         default:
2378                                 break;
2379                         }
2380                 } else {
2381                         adev->pm.pcie_mlw_mask = AMDGPU_DEFAULT_PCIE_MLW_MASK;
2382                 }
2383         }
2384 }
2385
2386 /*
2387  * Debugfs
2388  */
2389 int amdgpu_debugfs_add_files(struct amdgpu_device *adev,
2390                              const struct drm_info_list *files,
2391                              unsigned nfiles)
2392 {
2393         unsigned i;
2394
2395         for (i = 0; i < adev->debugfs_count; i++) {
2396                 if (adev->debugfs[i].files == files) {
2397                         /* Already registered */
2398                         return 0;
2399                 }
2400         }
2401
2402         i = adev->debugfs_count + 1;
2403         if (i > AMDGPU_DEBUGFS_MAX_COMPONENTS) {
2404                 DRM_ERROR("Reached maximum number of debugfs components.\n");
2405                 DRM_ERROR("Report so we increase "
2406                           "AMDGPU_DEBUGFS_MAX_COMPONENTS.\n");
2407                 return -EINVAL;
2408         }
2409         adev->debugfs[adev->debugfs_count].files = files;
2410         adev->debugfs[adev->debugfs_count].num_files = nfiles;
2411         adev->debugfs_count = i;
2412 #if defined(CONFIG_DEBUG_FS)
2413         drm_debugfs_create_files(files, nfiles,
2414                                  adev->ddev->control->debugfs_root,
2415                                  adev->ddev->control);
2416         drm_debugfs_create_files(files, nfiles,
2417                                  adev->ddev->primary->debugfs_root,
2418                                  adev->ddev->primary);
2419 #endif
2420         return 0;
2421 }
2422
2423 static void amdgpu_debugfs_remove_files(struct amdgpu_device *adev)
2424 {
2425 #if defined(CONFIG_DEBUG_FS)
2426         unsigned i;
2427
2428         for (i = 0; i < adev->debugfs_count; i++) {
2429                 drm_debugfs_remove_files(adev->debugfs[i].files,
2430                                          adev->debugfs[i].num_files,
2431                                          adev->ddev->control);
2432                 drm_debugfs_remove_files(adev->debugfs[i].files,
2433                                          adev->debugfs[i].num_files,
2434                                          adev->ddev->primary);
2435         }
2436 #endif
2437 }
2438
2439 #if defined(CONFIG_DEBUG_FS)
2440
2441 static ssize_t amdgpu_debugfs_regs_read(struct file *f, char __user *buf,
2442                                         size_t size, loff_t *pos)
2443 {
2444         struct amdgpu_device *adev = f->f_inode->i_private;
2445         ssize_t result = 0;
2446         int r;
2447         bool pm_pg_lock, use_bank;
2448         unsigned instance_bank, sh_bank, se_bank;
2449
2450         if (size & 0x3 || *pos & 0x3)
2451                 return -EINVAL;
2452
2453         /* are we reading registers for which a PG lock is necessary? */
2454         pm_pg_lock = (*pos >> 23) & 1;
2455
2456         if (*pos & (1ULL << 62)) {
2457                 se_bank = (*pos >> 24) & 0x3FF;
2458                 sh_bank = (*pos >> 34) & 0x3FF;
2459                 instance_bank = (*pos >> 44) & 0x3FF;
2460                 use_bank = 1;
2461         } else {
2462                 use_bank = 0;
2463         }
2464
2465         *pos &= 0x3FFFF;
2466
2467         if (use_bank) {
2468                 if (sh_bank >= adev->gfx.config.max_sh_per_se ||
2469                     se_bank >= adev->gfx.config.max_shader_engines)
2470                         return -EINVAL;
2471                 mutex_lock(&adev->grbm_idx_mutex);
2472                 amdgpu_gfx_select_se_sh(adev, se_bank,
2473                                         sh_bank, instance_bank);
2474         }
2475
2476         if (pm_pg_lock)
2477                 mutex_lock(&adev->pm.mutex);
2478
2479         while (size) {
2480                 uint32_t value;
2481
2482                 if (*pos > adev->rmmio_size)
2483                         goto end;
2484
2485                 value = RREG32(*pos >> 2);
2486                 r = put_user(value, (uint32_t *)buf);
2487                 if (r) {
2488                         result = r;
2489                         goto end;
2490                 }
2491
2492                 result += 4;
2493                 buf += 4;
2494                 *pos += 4;
2495                 size -= 4;
2496         }
2497
2498 end:
2499         if (use_bank) {
2500                 amdgpu_gfx_select_se_sh(adev, 0xffffffff, 0xffffffff, 0xffffffff);
2501                 mutex_unlock(&adev->grbm_idx_mutex);
2502         }
2503
2504         if (pm_pg_lock)
2505                 mutex_unlock(&adev->pm.mutex);
2506
2507         return result;
2508 }
2509
2510 static ssize_t amdgpu_debugfs_regs_write(struct file *f, const char __user *buf,
2511                                          size_t size, loff_t *pos)
2512 {
2513         struct amdgpu_device *adev = f->f_inode->i_private;
2514         ssize_t result = 0;
2515         int r;
2516
2517         if (size & 0x3 || *pos & 0x3)
2518                 return -EINVAL;
2519
2520         while (size) {
2521                 uint32_t value;
2522
2523                 if (*pos > adev->rmmio_size)
2524                         return result;
2525
2526                 r = get_user(value, (uint32_t *)buf);
2527                 if (r)
2528                         return r;
2529
2530                 WREG32(*pos >> 2, value);
2531
2532                 result += 4;
2533                 buf += 4;
2534                 *pos += 4;
2535                 size -= 4;
2536         }
2537
2538         return result;
2539 }
2540
2541 static ssize_t amdgpu_debugfs_regs_pcie_read(struct file *f, char __user *buf,
2542                                         size_t size, loff_t *pos)
2543 {
2544         struct amdgpu_device *adev = f->f_inode->i_private;
2545         ssize_t result = 0;
2546         int r;
2547
2548         if (size & 0x3 || *pos & 0x3)
2549                 return -EINVAL;
2550
2551         while (size) {
2552                 uint32_t value;
2553
2554                 value = RREG32_PCIE(*pos >> 2);
2555                 r = put_user(value, (uint32_t *)buf);
2556                 if (r)
2557                         return r;
2558
2559                 result += 4;
2560                 buf += 4;
2561                 *pos += 4;
2562                 size -= 4;
2563         }
2564
2565         return result;
2566 }
2567
2568 static ssize_t amdgpu_debugfs_regs_pcie_write(struct file *f, const char __user *buf,
2569                                          size_t size, loff_t *pos)
2570 {
2571         struct amdgpu_device *adev = f->f_inode->i_private;
2572         ssize_t result = 0;
2573         int r;
2574
2575         if (size & 0x3 || *pos & 0x3)
2576                 return -EINVAL;
2577
2578         while (size) {
2579                 uint32_t value;
2580
2581                 r = get_user(value, (uint32_t *)buf);
2582                 if (r)
2583                         return r;
2584
2585                 WREG32_PCIE(*pos >> 2, value);
2586
2587                 result += 4;
2588                 buf += 4;
2589                 *pos += 4;
2590                 size -= 4;
2591         }
2592
2593         return result;
2594 }
2595
2596 static ssize_t amdgpu_debugfs_regs_didt_read(struct file *f, char __user *buf,
2597                                         size_t size, loff_t *pos)
2598 {
2599         struct amdgpu_device *adev = f->f_inode->i_private;
2600         ssize_t result = 0;
2601         int r;
2602
2603         if (size & 0x3 || *pos & 0x3)
2604                 return -EINVAL;
2605
2606         while (size) {
2607                 uint32_t value;
2608
2609                 value = RREG32_DIDT(*pos >> 2);
2610                 r = put_user(value, (uint32_t *)buf);
2611                 if (r)
2612                         return r;
2613
2614                 result += 4;
2615                 buf += 4;
2616                 *pos += 4;
2617                 size -= 4;
2618         }
2619
2620         return result;
2621 }
2622
2623 static ssize_t amdgpu_debugfs_regs_didt_write(struct file *f, const char __user *buf,
2624                                          size_t size, loff_t *pos)
2625 {
2626         struct amdgpu_device *adev = f->f_inode->i_private;
2627         ssize_t result = 0;
2628         int r;
2629
2630         if (size & 0x3 || *pos & 0x3)
2631                 return -EINVAL;
2632
2633         while (size) {
2634                 uint32_t value;
2635
2636                 r = get_user(value, (uint32_t *)buf);
2637                 if (r)
2638                         return r;
2639
2640                 WREG32_DIDT(*pos >> 2, value);
2641
2642                 result += 4;
2643                 buf += 4;
2644                 *pos += 4;
2645                 size -= 4;
2646         }
2647
2648         return result;
2649 }
2650
2651 static ssize_t amdgpu_debugfs_regs_smc_read(struct file *f, char __user *buf,
2652                                         size_t size, loff_t *pos)
2653 {
2654         struct amdgpu_device *adev = f->f_inode->i_private;
2655         ssize_t result = 0;
2656         int r;
2657
2658         if (size & 0x3 || *pos & 0x3)
2659                 return -EINVAL;
2660
2661         while (size) {
2662                 uint32_t value;
2663
2664                 value = RREG32_SMC(*pos);
2665                 r = put_user(value, (uint32_t *)buf);
2666                 if (r)
2667                         return r;
2668
2669                 result += 4;
2670                 buf += 4;
2671                 *pos += 4;
2672                 size -= 4;
2673         }
2674
2675         return result;
2676 }
2677
2678 static ssize_t amdgpu_debugfs_regs_smc_write(struct file *f, const char __user *buf,
2679                                          size_t size, loff_t *pos)
2680 {
2681         struct amdgpu_device *adev = f->f_inode->i_private;
2682         ssize_t result = 0;
2683         int r;
2684
2685         if (size & 0x3 || *pos & 0x3)
2686                 return -EINVAL;
2687
2688         while (size) {
2689                 uint32_t value;
2690
2691                 r = get_user(value, (uint32_t *)buf);
2692                 if (r)
2693                         return r;
2694
2695                 WREG32_SMC(*pos, value);
2696
2697                 result += 4;
2698                 buf += 4;
2699                 *pos += 4;
2700                 size -= 4;
2701         }
2702
2703         return result;
2704 }
2705
2706 static ssize_t amdgpu_debugfs_gca_config_read(struct file *f, char __user *buf,
2707                                         size_t size, loff_t *pos)
2708 {
2709         struct amdgpu_device *adev = f->f_inode->i_private;
2710         ssize_t result = 0;
2711         int r;
2712         uint32_t *config, no_regs = 0;
2713
2714         if (size & 0x3 || *pos & 0x3)
2715                 return -EINVAL;
2716
2717         config = kmalloc(256 * sizeof(*config), GFP_KERNEL);
2718         if (!config)
2719                 return -ENOMEM;
2720
2721         /* version, increment each time something is added */
2722         config[no_regs++] = 2;
2723         config[no_regs++] = adev->gfx.config.max_shader_engines;
2724         config[no_regs++] = adev->gfx.config.max_tile_pipes;
2725         config[no_regs++] = adev->gfx.config.max_cu_per_sh;
2726         config[no_regs++] = adev->gfx.config.max_sh_per_se;
2727         config[no_regs++] = adev->gfx.config.max_backends_per_se;
2728         config[no_regs++] = adev->gfx.config.max_texture_channel_caches;
2729         config[no_regs++] = adev->gfx.config.max_gprs;
2730         config[no_regs++] = adev->gfx.config.max_gs_threads;
2731         config[no_regs++] = adev->gfx.config.max_hw_contexts;
2732         config[no_regs++] = adev->gfx.config.sc_prim_fifo_size_frontend;
2733         config[no_regs++] = adev->gfx.config.sc_prim_fifo_size_backend;
2734         config[no_regs++] = adev->gfx.config.sc_hiz_tile_fifo_size;
2735         config[no_regs++] = adev->gfx.config.sc_earlyz_tile_fifo_size;
2736         config[no_regs++] = adev->gfx.config.num_tile_pipes;
2737         config[no_regs++] = adev->gfx.config.backend_enable_mask;
2738         config[no_regs++] = adev->gfx.config.mem_max_burst_length_bytes;
2739         config[no_regs++] = adev->gfx.config.mem_row_size_in_kb;
2740         config[no_regs++] = adev->gfx.config.shader_engine_tile_size;
2741         config[no_regs++] = adev->gfx.config.num_gpus;
2742         config[no_regs++] = adev->gfx.config.multi_gpu_tile_size;
2743         config[no_regs++] = adev->gfx.config.mc_arb_ramcfg;
2744         config[no_regs++] = adev->gfx.config.gb_addr_config;
2745         config[no_regs++] = adev->gfx.config.num_rbs;
2746
2747         /* rev==1 */
2748         config[no_regs++] = adev->rev_id;
2749         config[no_regs++] = adev->pg_flags;
2750         config[no_regs++] = adev->cg_flags;
2751
2752         /* rev==2 */
2753         config[no_regs++] = adev->family;
2754         config[no_regs++] = adev->external_rev_id;
2755
2756         while (size && (*pos < no_regs * 4)) {
2757                 uint32_t value;
2758
2759                 value = config[*pos >> 2];
2760                 r = put_user(value, (uint32_t *)buf);
2761                 if (r) {
2762                         kfree(config);
2763                         return r;
2764                 }
2765
2766                 result += 4;
2767                 buf += 4;
2768                 *pos += 4;
2769                 size -= 4;
2770         }
2771
2772         kfree(config);
2773         return result;
2774 }
2775
2776
2777 static const struct file_operations amdgpu_debugfs_regs_fops = {
2778         .owner = THIS_MODULE,
2779         .read = amdgpu_debugfs_regs_read,
2780         .write = amdgpu_debugfs_regs_write,
2781         .llseek = default_llseek
2782 };
2783 static const struct file_operations amdgpu_debugfs_regs_didt_fops = {
2784         .owner = THIS_MODULE,
2785         .read = amdgpu_debugfs_regs_didt_read,
2786         .write = amdgpu_debugfs_regs_didt_write,
2787         .llseek = default_llseek
2788 };
2789 static const struct file_operations amdgpu_debugfs_regs_pcie_fops = {
2790         .owner = THIS_MODULE,
2791         .read = amdgpu_debugfs_regs_pcie_read,
2792         .write = amdgpu_debugfs_regs_pcie_write,
2793         .llseek = default_llseek
2794 };
2795 static const struct file_operations amdgpu_debugfs_regs_smc_fops = {
2796         .owner = THIS_MODULE,
2797         .read = amdgpu_debugfs_regs_smc_read,
2798         .write = amdgpu_debugfs_regs_smc_write,
2799         .llseek = default_llseek
2800 };
2801
2802 static const struct file_operations amdgpu_debugfs_gca_config_fops = {
2803         .owner = THIS_MODULE,
2804         .read = amdgpu_debugfs_gca_config_read,
2805         .llseek = default_llseek
2806 };
2807
2808 static const struct file_operations *debugfs_regs[] = {
2809         &amdgpu_debugfs_regs_fops,
2810         &amdgpu_debugfs_regs_didt_fops,
2811         &amdgpu_debugfs_regs_pcie_fops,
2812         &amdgpu_debugfs_regs_smc_fops,
2813         &amdgpu_debugfs_gca_config_fops,
2814 };
2815
2816 static const char *debugfs_regs_names[] = {
2817         "amdgpu_regs",
2818         "amdgpu_regs_didt",
2819         "amdgpu_regs_pcie",
2820         "amdgpu_regs_smc",
2821         "amdgpu_gca_config",
2822 };
2823
2824 static int amdgpu_debugfs_regs_init(struct amdgpu_device *adev)
2825 {
2826         struct drm_minor *minor = adev->ddev->primary;
2827         struct dentry *ent, *root = minor->debugfs_root;
2828         unsigned i, j;
2829
2830         for (i = 0; i < ARRAY_SIZE(debugfs_regs); i++) {
2831                 ent = debugfs_create_file(debugfs_regs_names[i],
2832                                           S_IFREG | S_IRUGO, root,
2833                                           adev, debugfs_regs[i]);
2834                 if (IS_ERR(ent)) {
2835                         for (j = 0; j < i; j++) {
2836                                 debugfs_remove(adev->debugfs_regs[i]);
2837                                 adev->debugfs_regs[i] = NULL;
2838                         }
2839                         return PTR_ERR(ent);
2840                 }
2841
2842                 if (!i)
2843                         i_size_write(ent->d_inode, adev->rmmio_size);
2844                 adev->debugfs_regs[i] = ent;
2845         }
2846
2847         return 0;
2848 }
2849
2850 static void amdgpu_debugfs_regs_cleanup(struct amdgpu_device *adev)
2851 {
2852         unsigned i;
2853
2854         for (i = 0; i < ARRAY_SIZE(debugfs_regs); i++) {
2855                 if (adev->debugfs_regs[i]) {
2856                         debugfs_remove(adev->debugfs_regs[i]);
2857                         adev->debugfs_regs[i] = NULL;
2858                 }
2859         }
2860 }
2861
2862 int amdgpu_debugfs_init(struct drm_minor *minor)
2863 {
2864         return 0;
2865 }
2866
2867 void amdgpu_debugfs_cleanup(struct drm_minor *minor)
2868 {
2869 }
2870 #else
2871 static int amdgpu_debugfs_regs_init(struct amdgpu_device *adev)
2872 {
2873         return 0;
2874 }
2875 static void amdgpu_debugfs_regs_cleanup(struct amdgpu_device *adev) { }
2876 #endif