Home | History | Annotate | Line # | Download | only in amdgpu
      1  1.1  riastrad /*	$NetBSD: amdgpu_sdma.c,v 1.2 2021/12/18 23:44:58 riastradh Exp $	*/
      2  1.1  riastrad 
      3  1.1  riastrad /*
      4  1.1  riastrad  * Copyright 2018 Advanced Micro Devices, Inc.
      5  1.1  riastrad  *
      6  1.1  riastrad  * Permission is hereby granted, free of charge, to any person obtaining a
      7  1.1  riastrad  * copy of this software and associated documentation files (the "Software"),
      8  1.1  riastrad  * to deal in the Software without restriction, including without limitation
      9  1.1  riastrad  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
     10  1.1  riastrad  * and/or sell copies of the Software, and to permit persons to whom the
     11  1.1  riastrad  * Software is furnished to do so, subject to the following conditions:
     12  1.1  riastrad  *
     13  1.1  riastrad  * The above copyright notice and this permission notice shall be included in
     14  1.1  riastrad  * all copies or substantial portions of the Software.
     15  1.1  riastrad  *
     16  1.1  riastrad  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
     17  1.1  riastrad  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
     18  1.1  riastrad  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
     19  1.1  riastrad  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
     20  1.1  riastrad  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
     21  1.1  riastrad  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
     22  1.1  riastrad  * OTHER DEALINGS IN THE SOFTWARE.
     23  1.1  riastrad  *
     24  1.1  riastrad  */
     25  1.1  riastrad 
     26  1.1  riastrad #include <sys/cdefs.h>
     27  1.1  riastrad __KERNEL_RCSID(0, "$NetBSD: amdgpu_sdma.c,v 1.2 2021/12/18 23:44:58 riastradh Exp $");
     28  1.1  riastrad 
     29  1.1  riastrad #include "amdgpu.h"
     30  1.1  riastrad #include "amdgpu_sdma.h"
     31  1.1  riastrad #include "amdgpu_ras.h"
     32  1.1  riastrad 
     33  1.1  riastrad #define AMDGPU_CSA_SDMA_SIZE 64
     34  1.1  riastrad /* SDMA CSA reside in the 3rd page of CSA */
     35  1.1  riastrad #define AMDGPU_CSA_SDMA_OFFSET (4096 * 2)
     36  1.1  riastrad 
     37  1.1  riastrad /*
     38  1.1  riastrad  * GPU SDMA IP block helpers function.
     39  1.1  riastrad  */
     40  1.1  riastrad 
     41  1.1  riastrad struct amdgpu_sdma_instance *amdgpu_sdma_get_instance_from_ring(struct amdgpu_ring *ring)
     42  1.1  riastrad {
     43  1.1  riastrad 	struct amdgpu_device *adev = ring->adev;
     44  1.1  riastrad 	int i;
     45  1.1  riastrad 
     46  1.1  riastrad 	for (i = 0; i < adev->sdma.num_instances; i++)
     47  1.1  riastrad 		if (ring == &adev->sdma.instance[i].ring ||
     48  1.1  riastrad 		    ring == &adev->sdma.instance[i].page)
     49  1.1  riastrad 			return &adev->sdma.instance[i];
     50  1.1  riastrad 
     51  1.1  riastrad 	return NULL;
     52  1.1  riastrad }
     53  1.1  riastrad 
     54  1.1  riastrad int amdgpu_sdma_get_index_from_ring(struct amdgpu_ring *ring, uint32_t *index)
     55  1.1  riastrad {
     56  1.1  riastrad 	struct amdgpu_device *adev = ring->adev;
     57  1.1  riastrad 	int i;
     58  1.1  riastrad 
     59  1.1  riastrad 	for (i = 0; i < adev->sdma.num_instances; i++) {
     60  1.1  riastrad 		if (ring == &adev->sdma.instance[i].ring ||
     61  1.1  riastrad 			ring == &adev->sdma.instance[i].page) {
     62  1.1  riastrad 			*index = i;
     63  1.1  riastrad 			return 0;
     64  1.1  riastrad 		}
     65  1.1  riastrad 	}
     66  1.1  riastrad 
     67  1.1  riastrad 	return -EINVAL;
     68  1.1  riastrad }
     69  1.1  riastrad 
     70  1.1  riastrad uint64_t amdgpu_sdma_get_csa_mc_addr(struct amdgpu_ring *ring,
     71  1.1  riastrad 				     unsigned vmid)
     72  1.1  riastrad {
     73  1.1  riastrad 	struct amdgpu_device *adev = ring->adev;
     74  1.1  riastrad 	uint64_t csa_mc_addr;
     75  1.1  riastrad 	uint32_t index = 0;
     76  1.1  riastrad 	int r;
     77  1.1  riastrad 
     78  1.1  riastrad 	if (vmid == 0 || !amdgpu_mcbp)
     79  1.1  riastrad 		return 0;
     80  1.1  riastrad 
     81  1.1  riastrad 	r = amdgpu_sdma_get_index_from_ring(ring, &index);
     82  1.1  riastrad 
     83  1.1  riastrad 	if (r || index > 31)
     84  1.1  riastrad 		csa_mc_addr = 0;
     85  1.1  riastrad 	else
     86  1.1  riastrad 		csa_mc_addr = amdgpu_csa_vaddr(adev) +
     87  1.1  riastrad 			AMDGPU_CSA_SDMA_OFFSET +
     88  1.1  riastrad 			index * AMDGPU_CSA_SDMA_SIZE;
     89  1.1  riastrad 
     90  1.1  riastrad 	return csa_mc_addr;
     91  1.1  riastrad }
     92  1.1  riastrad 
     93  1.1  riastrad int amdgpu_sdma_ras_late_init(struct amdgpu_device *adev,
     94  1.1  riastrad 			      void *ras_ih_info)
     95  1.1  riastrad {
     96  1.1  riastrad 	int r, i;
     97  1.1  riastrad 	struct ras_ih_if *ih_info = (struct ras_ih_if *)ras_ih_info;
     98  1.1  riastrad 	struct ras_fs_if fs_info = {
     99  1.1  riastrad 		.sysfs_name = "sdma_err_count",
    100  1.1  riastrad 		.debugfs_name = "sdma_err_inject",
    101  1.1  riastrad 	};
    102  1.1  riastrad 
    103  1.1  riastrad 	if (!ih_info)
    104  1.1  riastrad 		return -EINVAL;
    105  1.1  riastrad 
    106  1.1  riastrad 	if (!adev->sdma.ras_if) {
    107  1.1  riastrad 		adev->sdma.ras_if = kmalloc(sizeof(struct ras_common_if), GFP_KERNEL);
    108  1.1  riastrad 		if (!adev->sdma.ras_if)
    109  1.1  riastrad 			return -ENOMEM;
    110  1.1  riastrad 		adev->sdma.ras_if->block = AMDGPU_RAS_BLOCK__SDMA;
    111  1.1  riastrad 		adev->sdma.ras_if->type = AMDGPU_RAS_ERROR__MULTI_UNCORRECTABLE;
    112  1.1  riastrad 		adev->sdma.ras_if->sub_block_index = 0;
    113  1.1  riastrad 		strcpy(adev->sdma.ras_if->name, "sdma");
    114  1.1  riastrad 	}
    115  1.1  riastrad 	fs_info.head = ih_info->head = *adev->sdma.ras_if;
    116  1.1  riastrad 
    117  1.1  riastrad 	r = amdgpu_ras_late_init(adev, adev->sdma.ras_if,
    118  1.1  riastrad 				 &fs_info, ih_info);
    119  1.1  riastrad 	if (r)
    120  1.1  riastrad 		goto free;
    121  1.1  riastrad 
    122  1.1  riastrad 	if (amdgpu_ras_is_supported(adev, adev->sdma.ras_if->block)) {
    123  1.1  riastrad 		for (i = 0; i < adev->sdma.num_instances; i++) {
    124  1.1  riastrad 			r = amdgpu_irq_get(adev, &adev->sdma.ecc_irq,
    125  1.1  riastrad 				AMDGPU_SDMA_IRQ_INSTANCE0 + i);
    126  1.1  riastrad 			if (r)
    127  1.1  riastrad 				goto late_fini;
    128  1.1  riastrad 		}
    129  1.1  riastrad 	} else {
    130  1.1  riastrad 		r = 0;
    131  1.1  riastrad 		goto free;
    132  1.1  riastrad 	}
    133  1.1  riastrad 
    134  1.1  riastrad         return 0;
    135  1.1  riastrad 
    136  1.1  riastrad late_fini:
    137  1.1  riastrad 	amdgpu_ras_late_fini(adev, adev->sdma.ras_if, ih_info);
    138  1.1  riastrad free:
    139  1.1  riastrad 	kfree(adev->sdma.ras_if);
    140  1.1  riastrad 	adev->sdma.ras_if = NULL;
    141  1.1  riastrad 	return r;
    142  1.1  riastrad }
    143  1.1  riastrad 
    144  1.1  riastrad void amdgpu_sdma_ras_fini(struct amdgpu_device *adev)
    145  1.1  riastrad {
    146  1.1  riastrad 	if (amdgpu_ras_is_supported(adev, AMDGPU_RAS_BLOCK__SDMA) &&
    147  1.1  riastrad 			adev->sdma.ras_if) {
    148  1.1  riastrad 		struct ras_common_if *ras_if = adev->sdma.ras_if;
    149  1.1  riastrad 		struct ras_ih_if ih_info = {
    150  1.1  riastrad 			.head = *ras_if,
    151  1.1  riastrad 			/* the cb member will not be used by
    152  1.1  riastrad 			 * amdgpu_ras_interrupt_remove_handler, init it only
    153  1.1  riastrad 			 * to cheat the check in ras_late_fini
    154  1.1  riastrad 			 */
    155  1.1  riastrad 			.cb = amdgpu_sdma_process_ras_data_cb,
    156  1.1  riastrad 		};
    157  1.1  riastrad 
    158  1.1  riastrad 		amdgpu_ras_late_fini(adev, ras_if, &ih_info);
    159  1.1  riastrad 		kfree(ras_if);
    160  1.1  riastrad 	}
    161  1.1  riastrad }
    162  1.1  riastrad 
    163  1.1  riastrad int amdgpu_sdma_process_ras_data_cb(struct amdgpu_device *adev,
    164  1.1  riastrad 		void *err_data,
    165  1.1  riastrad 		struct amdgpu_iv_entry *entry)
    166  1.1  riastrad {
    167  1.1  riastrad 	kgd2kfd_set_sram_ecc_flag(adev->kfd.dev);
    168  1.1  riastrad 	amdgpu_ras_reset_gpu(adev);
    169  1.1  riastrad 
    170  1.1  riastrad 	return AMDGPU_RAS_SUCCESS;
    171  1.1  riastrad }
    172  1.1  riastrad 
    173  1.1  riastrad int amdgpu_sdma_process_ecc_irq(struct amdgpu_device *adev,
    174  1.1  riastrad 				      struct amdgpu_irq_src *source,
    175  1.1  riastrad 				      struct amdgpu_iv_entry *entry)
    176  1.1  riastrad {
    177  1.1  riastrad 	struct ras_common_if *ras_if = adev->sdma.ras_if;
    178  1.1  riastrad 	struct ras_dispatch_if ih_data = {
    179  1.1  riastrad 		.entry = entry,
    180  1.1  riastrad 	};
    181  1.1  riastrad 
    182  1.1  riastrad 	if (!ras_if)
    183  1.1  riastrad 		return 0;
    184  1.1  riastrad 
    185  1.1  riastrad 	ih_data.head = *ras_if;
    186  1.1  riastrad 
    187  1.1  riastrad 	amdgpu_ras_interrupt_dispatch(adev, &ih_data);
    188  1.1  riastrad 	return 0;
    189  1.1  riastrad }
    190