Home | History | Annotate | Line # | Download | only in pci
nvme_pci.c revision 1.23
      1 /*	$NetBSD: nvme_pci.c,v 1.23 2018/12/01 13:31:48 jdolecek Exp $	*/
      2 /*	$OpenBSD: nvme_pci.c,v 1.3 2016/04/14 11:18:32 dlg Exp $ */
      3 
      4 /*
      5  * Copyright (c) 2014 David Gwynne <dlg (at) openbsd.org>
      6  *
      7  * Permission to use, copy, modify, and distribute this software for any
      8  * purpose with or without fee is hereby granted, provided that the above
      9  * copyright notice and this permission notice appear in all copies.
     10  *
     11  * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
     12  * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
     13  * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
     14  * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
     15  * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
     16  * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
     17  * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
     18  */
     19 
     20 /*-
     21  * Copyright (C) 2016 NONAKA Kimihiro <nonaka (at) netbsd.org>
     22  * All rights reserved.
     23  *
     24  * Redistribution and use in source and binary forms, with or without
     25  * modification, are permitted provided that the following conditions
     26  * are met:
     27  * 1. Redistributions of source code must retain the above copyright
     28  *    notice, this list of conditions and the following disclaimer.
     29  * 2. Redistributions in binary form must reproduce the above copyright
     30  *    notice, this list of conditions and the following disclaimer in the
     31  *    documentation and/or other materials provided with the distribution.
     32  *
     33  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     34  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     35  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     36  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     37  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
     38  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     39  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     40  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     41  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
     42  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     43  */
     44 
     45 #include <sys/cdefs.h>
     46 __KERNEL_RCSID(0, "$NetBSD: nvme_pci.c,v 1.23 2018/12/01 13:31:48 jdolecek Exp $");
     47 
     48 #include <sys/param.h>
     49 #include <sys/systm.h>
     50 #include <sys/kernel.h>
     51 #include <sys/device.h>
     52 #include <sys/bitops.h>
     53 #include <sys/bus.h>
     54 #include <sys/cpu.h>
     55 #include <sys/interrupt.h>
     56 #include <sys/kmem.h>
     57 #include <sys/pmf.h>
     58 #include <sys/module.h>
     59 
     60 #include <dev/pci/pcireg.h>
     61 #include <dev/pci/pcivar.h>
     62 #include <dev/pci/pcidevs.h>
     63 
     64 #include <dev/ic/nvmereg.h>
     65 #include <dev/ic/nvmevar.h>
     66 
     67 int nvme_pci_force_intx = 0;
     68 int nvme_pci_mpsafe = 1;
     69 int nvme_pci_mq = 1;		/* INTx: ioq=1, MSI/MSI-X: ioq=ncpu */
     70 
     71 #define NVME_PCI_BAR		0x10
     72 
     73 struct nvme_pci_softc {
     74 	struct nvme_softc	psc_nvme;
     75 
     76 	pci_chipset_tag_t	psc_pc;
     77 	pci_intr_handle_t	*psc_intrs;
     78 	int			psc_nintrs;
     79 };
     80 
     81 static int	nvme_pci_match(device_t, cfdata_t, void *);
     82 static void	nvme_pci_attach(device_t, device_t, void *);
     83 static int	nvme_pci_detach(device_t, int);
     84 static int	nvme_pci_rescan(device_t, const char *, const int *);
     85 
     86 CFATTACH_DECL3_NEW(nvme_pci, sizeof(struct nvme_pci_softc),
     87     nvme_pci_match, nvme_pci_attach, nvme_pci_detach, NULL, nvme_pci_rescan,
     88     nvme_childdet, DVF_DETACH_SHUTDOWN);
     89 
     90 static int	nvme_pci_intr_establish(struct nvme_softc *,
     91 		    uint16_t, struct nvme_queue *);
     92 static int	nvme_pci_intr_disestablish(struct nvme_softc *, uint16_t);
     93 static int	nvme_pci_setup_intr(struct pci_attach_args *,
     94 		    struct nvme_pci_softc *);
     95 
     96 static const struct nvme_pci_quirk {
     97 	pci_vendor_id_t		vendor;
     98 	pci_product_id_t	product;
     99 	uint32_t		quirks;
    100 } nvme_pci_quirks[] = {
    101 	{ PCI_VENDOR_HGST, PCI_PRODUCT_HGST_SN100,
    102 	    NVME_QUIRK_DELAY_B4_CHK_RDY },
    103 	{ PCI_VENDOR_HGST, PCI_PRODUCT_HGST_SN200,
    104 	    NVME_QUIRK_DELAY_B4_CHK_RDY },
    105 	{ PCI_VENDOR_BEIJING_MEMBLAZE, PCI_PRODUCT_BEIJING_MEMBLAZE_PBLAZE4,
    106 	    NVME_QUIRK_DELAY_B4_CHK_RDY },
    107 	{ PCI_VENDOR_SAMSUNGELEC3, PCI_PRODUCT_SAMSUNGELEC3_172X,
    108 	    NVME_QUIRK_DELAY_B4_CHK_RDY },
    109 	{ PCI_VENDOR_SAMSUNGELEC3, PCI_PRODUCT_SAMSUNGELEC3_172XAB,
    110 	    NVME_QUIRK_DELAY_B4_CHK_RDY },
    111 };
    112 
    113 static const struct nvme_pci_quirk *
    114 nvme_pci_lookup_quirk(struct pci_attach_args *pa)
    115 {
    116 	const struct nvme_pci_quirk *q;
    117 	int i;
    118 
    119 	for (i = 0; i < __arraycount(nvme_pci_quirks); i++) {
    120 		q = &nvme_pci_quirks[i];
    121 
    122 		if (PCI_VENDOR(pa->pa_id) == q->vendor &&
    123 		    PCI_PRODUCT(pa->pa_id) == q->product)
    124 			return q;
    125 	}
    126 	return NULL;
    127 }
    128 
    129 static int
    130 nvme_pci_match(device_t parent, cfdata_t match, void *aux)
    131 {
    132 	struct pci_attach_args *pa = aux;
    133 
    134 	if (PCI_CLASS(pa->pa_class) == PCI_CLASS_MASS_STORAGE &&
    135 	    PCI_SUBCLASS(pa->pa_class) == PCI_SUBCLASS_MASS_STORAGE_NVM &&
    136 	    PCI_INTERFACE(pa->pa_class) == PCI_INTERFACE_NVM_NVME)
    137 		return 1;
    138 
    139 	return 0;
    140 }
    141 
    142 static void
    143 nvme_pci_attach(device_t parent, device_t self, void *aux)
    144 {
    145 	struct nvme_pci_softc *psc = device_private(self);
    146 	struct nvme_softc *sc = &psc->psc_nvme;
    147 	struct pci_attach_args *pa = aux;
    148 	const struct nvme_pci_quirk *quirk;
    149 	pcireg_t memtype, reg;
    150 	bus_addr_t memaddr;
    151 	int flags, error;
    152 	int msixoff;
    153 
    154 	sc->sc_dev = self;
    155 	psc->psc_pc = pa->pa_pc;
    156 	if (pci_dma64_available(pa))
    157 		sc->sc_dmat = pa->pa_dmat64;
    158 	else
    159 		sc->sc_dmat = pa->pa_dmat;
    160 
    161 	pci_aprint_devinfo(pa, NULL);
    162 
    163 	reg = pci_conf_read(pa->pa_pc, pa->pa_tag, PCI_COMMAND_STATUS_REG);
    164 	if ((reg & PCI_COMMAND_MASTER_ENABLE) == 0) {
    165 		reg |= PCI_COMMAND_MASTER_ENABLE;
    166         	pci_conf_write(pa->pa_pc, pa->pa_tag, PCI_COMMAND_STATUS_REG, reg);
    167 	}
    168 
    169 	/* Map registers */
    170 	memtype = pci_mapreg_type(pa->pa_pc, pa->pa_tag, NVME_PCI_BAR);
    171 	if (PCI_MAPREG_TYPE(memtype) != PCI_MAPREG_TYPE_MEM) {
    172 		aprint_error_dev(self, "invalid type (type=0x%x)\n", memtype);
    173 		return;
    174 	}
    175 	sc->sc_iot = pa->pa_memt;
    176 	error = pci_mapreg_info(pa->pa_pc, pa->pa_tag, PCI_MAPREG_START,
    177 	    memtype, &memaddr, &sc->sc_ios, &flags);
    178 	if (error) {
    179 		aprint_error_dev(self, "can't get map info\n");
    180 		return;
    181 	}
    182 
    183 	if (pci_get_capability(pa->pa_pc, pa->pa_tag, PCI_CAP_MSIX, &msixoff,
    184 	    NULL)) {
    185 		pcireg_t msixtbl;
    186 		uint32_t table_offset;
    187 		int bir;
    188 
    189 		msixtbl = pci_conf_read(pa->pa_pc, pa->pa_tag,
    190 		    msixoff + PCI_MSIX_TBLOFFSET);
    191 		table_offset = msixtbl & PCI_MSIX_TBLOFFSET_MASK;
    192 		bir = msixtbl & PCI_MSIX_PBABIR_MASK;
    193 		if (bir == 0) {
    194 			sc->sc_ios = table_offset;
    195 		}
    196 	}
    197 
    198 	error = bus_space_map(sc->sc_iot, memaddr, sc->sc_ios, flags,
    199 	    &sc->sc_ioh);
    200 	if (error != 0) {
    201 		aprint_error_dev(self, "can't map mem space (error=%d)\n",
    202 		    error);
    203 		return;
    204 	}
    205 
    206 	/* Establish interrupts */
    207 	if (nvme_pci_setup_intr(pa, psc) != 0) {
    208 		aprint_error_dev(self, "unable to allocate interrupt\n");
    209 		goto unmap;
    210 	}
    211 	sc->sc_intr_establish = nvme_pci_intr_establish;
    212 	sc->sc_intr_disestablish = nvme_pci_intr_disestablish;
    213 
    214 	sc->sc_ih = kmem_zalloc(sizeof(*sc->sc_ih) * psc->psc_nintrs, KM_SLEEP);
    215 	sc->sc_softih = kmem_zalloc(
    216 	    sizeof(*sc->sc_softih) * psc->psc_nintrs, KM_SLEEP);
    217 
    218 	quirk = nvme_pci_lookup_quirk(pa);
    219 	if (quirk != NULL)
    220 		sc->sc_quirks = quirk->quirks;
    221 
    222 	if (nvme_attach(sc) != 0) {
    223 		/* error printed by nvme_attach() */
    224 		goto softintr_free;
    225 	}
    226 
    227 	if (!pmf_device_register(self, NULL, NULL))
    228 		aprint_error_dev(self, "couldn't establish power handler\n");
    229 
    230 	SET(sc->sc_flags, NVME_F_ATTACHED);
    231 	return;
    232 
    233 softintr_free:
    234 	kmem_free(sc->sc_softih, sizeof(*sc->sc_softih) * psc->psc_nintrs);
    235 	kmem_free(sc->sc_ih, sizeof(*sc->sc_ih) * psc->psc_nintrs);
    236 	sc->sc_nq = 0;
    237 	pci_intr_release(pa->pa_pc, psc->psc_intrs, psc->psc_nintrs);
    238 	psc->psc_nintrs = 0;
    239 unmap:
    240 	bus_space_unmap(sc->sc_iot, sc->sc_ioh, sc->sc_ios);
    241 	sc->sc_ios = 0;
    242 }
    243 
    244 static int
    245 nvme_pci_rescan(device_t self, const char *attr, const int *flags)
    246 {
    247 
    248 	return nvme_rescan(self, attr, flags);
    249 }
    250 
    251 static int
    252 nvme_pci_detach(device_t self, int flags)
    253 {
    254 	struct nvme_pci_softc *psc = device_private(self);
    255 	struct nvme_softc *sc = &psc->psc_nvme;
    256 	int error;
    257 
    258 	if (!ISSET(sc->sc_flags, NVME_F_ATTACHED))
    259 		return 0;
    260 
    261 	error = nvme_detach(sc, flags);
    262 	if (error)
    263 		return error;
    264 
    265 	kmem_free(sc->sc_softih, sizeof(*sc->sc_softih) * psc->psc_nintrs);
    266 	sc->sc_softih = NULL;
    267 
    268 	kmem_free(sc->sc_ih, sizeof(*sc->sc_ih) * psc->psc_nintrs);
    269 	pci_intr_release(psc->psc_pc, psc->psc_intrs, psc->psc_nintrs);
    270 	bus_space_unmap(sc->sc_iot, sc->sc_ioh, sc->sc_ios);
    271 	return 0;
    272 }
    273 
    274 static int
    275 nvme_pci_intr_establish(struct nvme_softc *sc, uint16_t qid,
    276     struct nvme_queue *q)
    277 {
    278 	struct nvme_pci_softc *psc = (struct nvme_pci_softc *)sc;
    279 	char intr_xname[INTRDEVNAMEBUF];
    280 	char intrbuf[PCI_INTRSTR_LEN];
    281 	const char *intrstr = NULL;
    282 	int (*ih_func)(void *);
    283 	void (*ih_func_soft)(void *);
    284 	void *ih_arg;
    285 	int error;
    286 
    287 	KASSERT(sc->sc_use_mq || qid == NVME_ADMIN_Q);
    288 	KASSERT(sc->sc_ih[qid] == NULL);
    289 
    290 	if (nvme_pci_mpsafe) {
    291 		pci_intr_setattr(psc->psc_pc, &psc->psc_intrs[qid],
    292 		    PCI_INTR_MPSAFE, true);
    293 	}
    294 
    295 	if (!sc->sc_use_mq) {
    296 		snprintf(intr_xname, sizeof(intr_xname), "%s",
    297 		    device_xname(sc->sc_dev));
    298 		ih_arg = sc;
    299 		ih_func = nvme_intr;
    300 		ih_func_soft = nvme_softintr_intx;
    301 	} else {
    302 		if (qid == NVME_ADMIN_Q) {
    303 			snprintf(intr_xname, sizeof(intr_xname), "%s adminq",
    304 			    device_xname(sc->sc_dev));
    305 		} else {
    306 			snprintf(intr_xname, sizeof(intr_xname), "%s ioq%d",
    307 			    device_xname(sc->sc_dev), qid);
    308 		}
    309 		ih_arg = q;
    310 		ih_func = nvme_intr_msi;
    311 		ih_func_soft = nvme_softintr_msi;
    312 	}
    313 
    314 	/* establish hardware interrupt */
    315 	sc->sc_ih[qid] = pci_intr_establish_xname(psc->psc_pc,
    316 	    psc->psc_intrs[qid], IPL_BIO, ih_func, ih_arg, intr_xname);
    317 	if (sc->sc_ih[qid] == NULL) {
    318 		aprint_error_dev(sc->sc_dev,
    319 		    "unable to establish %s interrupt\n", intr_xname);
    320 		return 1;
    321 	}
    322 
    323 	/* establish also the software interrupt */
    324 	sc->sc_softih[qid] = softint_establish(
    325 	    SOFTINT_BIO|(nvme_pci_mpsafe ? SOFTINT_MPSAFE : 0),
    326 	    ih_func_soft, q);
    327 	if (sc->sc_softih[qid] == NULL) {
    328 		pci_intr_disestablish(psc->psc_pc, sc->sc_ih[qid]);
    329 		sc->sc_ih[qid] = NULL;
    330 
    331 		aprint_error_dev(sc->sc_dev,
    332 		    "unable to establish %s soft interrupt\n",
    333 		    intr_xname);
    334 		return 1;
    335 	}
    336 
    337 	intrstr = pci_intr_string(psc->psc_pc, psc->psc_intrs[qid], intrbuf,
    338 	    sizeof(intrbuf));
    339 	if (!sc->sc_use_mq) {
    340 		aprint_normal_dev(sc->sc_dev, "interrupting at %s\n", intrstr);
    341 	} else if (qid == NVME_ADMIN_Q) {
    342 		aprint_normal_dev(sc->sc_dev,
    343 		    "for admin queue interrupting at %s\n", intrstr);
    344 	} else if (!nvme_pci_mpsafe) {
    345 		aprint_normal_dev(sc->sc_dev,
    346 		    "for io queue %d interrupting at %s\n", qid, intrstr);
    347 	} else {
    348 		kcpuset_t *affinity;
    349 		cpuid_t affinity_to;
    350 
    351 		kcpuset_create(&affinity, true);
    352 		affinity_to = (qid - 1) % ncpu;
    353 		kcpuset_set(affinity, affinity_to);
    354 		error = interrupt_distribute(sc->sc_ih[qid], affinity, NULL);
    355 		kcpuset_destroy(affinity);
    356 		aprint_normal_dev(sc->sc_dev,
    357 		    "for io queue %d interrupting at %s", qid, intrstr);
    358 		if (error == 0)
    359 			aprint_normal(" affinity to cpu%lu", affinity_to);
    360 		aprint_normal("\n");
    361 	}
    362 	return 0;
    363 }
    364 
    365 static int
    366 nvme_pci_intr_disestablish(struct nvme_softc *sc, uint16_t qid)
    367 {
    368 	struct nvme_pci_softc *psc = (struct nvme_pci_softc *)sc;
    369 
    370 	KASSERT(sc->sc_use_mq || qid == NVME_ADMIN_Q);
    371 	KASSERT(sc->sc_ih[qid] != NULL);
    372 
    373 	if (sc->sc_softih) {
    374 		softint_disestablish(sc->sc_softih[qid]);
    375 		sc->sc_softih[qid] = NULL;
    376 	}
    377 
    378 	pci_intr_disestablish(psc->psc_pc, sc->sc_ih[qid]);
    379 	sc->sc_ih[qid] = NULL;
    380 
    381 	return 0;
    382 }
    383 
    384 static int
    385 nvme_pci_setup_intr(struct pci_attach_args *pa, struct nvme_pci_softc *psc)
    386 {
    387 	struct nvme_softc *sc = &psc->psc_nvme;
    388 	int error;
    389 	int counts[PCI_INTR_TYPE_SIZE];
    390 	pci_intr_handle_t *ihps;
    391 	int intr_type;
    392 
    393 	memset(counts, 0, sizeof(counts));
    394 
    395 	if (nvme_pci_force_intx)
    396 		goto force_intx;
    397 
    398 	/* MSI-X */
    399 	counts[PCI_INTR_TYPE_MSIX] = uimin(pci_msix_count(pa->pa_pc, pa->pa_tag),
    400 	    ncpu + 1);
    401 	if (counts[PCI_INTR_TYPE_MSIX] < 1) {
    402 		counts[PCI_INTR_TYPE_MSIX] = 0;
    403 	} else if (!nvme_pci_mq || !nvme_pci_mpsafe) {
    404 		if (counts[PCI_INTR_TYPE_MSI] > 2)
    405 			counts[PCI_INTR_TYPE_MSIX] = 2;	/* adminq + 1 ioq */
    406 	}
    407 
    408 	/* MSI */
    409 	counts[PCI_INTR_TYPE_MSI] = pci_msi_count(pa->pa_pc, pa->pa_tag);
    410 	if (counts[PCI_INTR_TYPE_MSI] > 0) {
    411 		while (counts[PCI_INTR_TYPE_MSI] > ncpu + 1) {
    412 			if (counts[PCI_INTR_TYPE_MSI] / 2 <= ncpu + 1)
    413 				break;
    414 			counts[PCI_INTR_TYPE_MSI] /= 2;
    415 		}
    416 	}
    417 	if (counts[PCI_INTR_TYPE_MSI] < 1) {
    418 		counts[PCI_INTR_TYPE_MSI] = 0;
    419 	} else if (!nvme_pci_mq || !nvme_pci_mpsafe) {
    420 		if (counts[PCI_INTR_TYPE_MSI] > 2)
    421 			counts[PCI_INTR_TYPE_MSI] = 2;	/* adminq + 1 ioq */
    422 	}
    423 
    424 force_intx:
    425 	/* INTx */
    426 	counts[PCI_INTR_TYPE_INTX] = 1;
    427 
    428 	error = pci_intr_alloc(pa, &ihps, counts, PCI_INTR_TYPE_MSIX);
    429 	if (error)
    430 		return error;
    431 
    432 	intr_type = pci_intr_type(pa->pa_pc, ihps[0]);
    433 
    434 	psc->psc_intrs = ihps;
    435 	psc->psc_nintrs = counts[intr_type];
    436 	if (intr_type == PCI_INTR_TYPE_MSI) {
    437 		if (counts[intr_type] > ncpu + 1)
    438 			counts[intr_type] = ncpu + 1;
    439 	}
    440 	sc->sc_use_mq = counts[intr_type] > 1;
    441 	sc->sc_nq = sc->sc_use_mq ? counts[intr_type] - 1 : 1;
    442 
    443 	return 0;
    444 }
    445 
    446 MODULE(MODULE_CLASS_DRIVER, nvme, "pci,dk_subr");
    447 
    448 #ifdef _MODULE
    449 #include "ioconf.c"
    450 #endif
    451 
    452 static int
    453 nvme_modcmd(modcmd_t cmd, void *opaque)
    454 {
    455 #ifdef _MODULE
    456 	devmajor_t cmajor, bmajor;
    457 	extern const struct cdevsw nvme_cdevsw;
    458 #endif
    459 	int error = 0;
    460 
    461 #ifdef _MODULE
    462 	switch (cmd) {
    463 	case MODULE_CMD_INIT:
    464 		error = config_init_component(cfdriver_ioconf_nvme_pci,
    465 		    cfattach_ioconf_nvme_pci, cfdata_ioconf_nvme_pci);
    466 		if (error)
    467 			break;
    468 
    469 		bmajor = cmajor = NODEVMAJOR;
    470 		error = devsw_attach(nvme_cd.cd_name, NULL, &bmajor,
    471 		    &nvme_cdevsw, &cmajor);
    472 		if (error) {
    473 			aprint_error("%s: unable to register devsw\n",
    474 			    nvme_cd.cd_name);
    475 			/* do not abort, just /dev/nvme* will not work */
    476 		}
    477 		break;
    478 	case MODULE_CMD_FINI:
    479 		devsw_detach(NULL, &nvme_cdevsw);
    480 
    481 		error = config_fini_component(cfdriver_ioconf_nvme_pci,
    482 		    cfattach_ioconf_nvme_pci, cfdata_ioconf_nvme_pci);
    483 		break;
    484 	default:
    485 		break;
    486 	}
    487 #endif
    488 	return error;
    489 }
    490