nvme.c revision 1.38 1 1.38 nonaka /* $NetBSD: nvme.c,v 1.38 2018/04/18 10:05:59 nonaka Exp $ */
2 1.1 nonaka /* $OpenBSD: nvme.c,v 1.49 2016/04/18 05:59:50 dlg Exp $ */
3 1.1 nonaka
4 1.1 nonaka /*
5 1.1 nonaka * Copyright (c) 2014 David Gwynne <dlg (at) openbsd.org>
6 1.1 nonaka *
7 1.1 nonaka * Permission to use, copy, modify, and distribute this software for any
8 1.1 nonaka * purpose with or without fee is hereby granted, provided that the above
9 1.1 nonaka * copyright notice and this permission notice appear in all copies.
10 1.1 nonaka *
11 1.1 nonaka * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
12 1.1 nonaka * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
13 1.1 nonaka * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
14 1.1 nonaka * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
15 1.1 nonaka * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
16 1.1 nonaka * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
17 1.1 nonaka * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
18 1.1 nonaka */
19 1.1 nonaka
20 1.1 nonaka #include <sys/cdefs.h>
21 1.38 nonaka __KERNEL_RCSID(0, "$NetBSD: nvme.c,v 1.38 2018/04/18 10:05:59 nonaka Exp $");
22 1.1 nonaka
23 1.1 nonaka #include <sys/param.h>
24 1.1 nonaka #include <sys/systm.h>
25 1.1 nonaka #include <sys/kernel.h>
26 1.1 nonaka #include <sys/atomic.h>
27 1.1 nonaka #include <sys/bus.h>
28 1.1 nonaka #include <sys/buf.h>
29 1.3 nonaka #include <sys/conf.h>
30 1.1 nonaka #include <sys/device.h>
31 1.1 nonaka #include <sys/kmem.h>
32 1.1 nonaka #include <sys/once.h>
33 1.3 nonaka #include <sys/proc.h>
34 1.1 nonaka #include <sys/queue.h>
35 1.1 nonaka #include <sys/mutex.h>
36 1.1 nonaka
37 1.3 nonaka #include <uvm/uvm_extern.h>
38 1.3 nonaka
39 1.1 nonaka #include <dev/ic/nvmereg.h>
40 1.1 nonaka #include <dev/ic/nvmevar.h>
41 1.3 nonaka #include <dev/ic/nvmeio.h>
42 1.1 nonaka
43 1.31 riastrad #include "ioconf.h"
44 1.31 riastrad
45 1.38 nonaka #define B4_CHK_RDY_DELAY_MS 2300 /* workaround controller bug */
46 1.38 nonaka
47 1.22 jdolecek int nvme_adminq_size = 32;
48 1.9 jdolecek int nvme_ioq_size = 1024;
49 1.1 nonaka
50 1.1 nonaka static int nvme_print(void *, const char *);
51 1.1 nonaka
52 1.1 nonaka static int nvme_ready(struct nvme_softc *, uint32_t);
53 1.1 nonaka static int nvme_enable(struct nvme_softc *, u_int);
54 1.1 nonaka static int nvme_disable(struct nvme_softc *);
55 1.1 nonaka static int nvme_shutdown(struct nvme_softc *);
56 1.1 nonaka
57 1.1 nonaka #ifdef NVME_DEBUG
58 1.1 nonaka static void nvme_dumpregs(struct nvme_softc *);
59 1.1 nonaka #endif
60 1.1 nonaka static int nvme_identify(struct nvme_softc *, u_int);
61 1.1 nonaka static void nvme_fill_identify(struct nvme_queue *, struct nvme_ccb *,
62 1.1 nonaka void *);
63 1.1 nonaka
64 1.20 jdolecek static int nvme_ccbs_alloc(struct nvme_queue *, uint16_t);
65 1.1 nonaka static void nvme_ccbs_free(struct nvme_queue *);
66 1.1 nonaka
67 1.1 nonaka static struct nvme_ccb *
68 1.34 jdolecek nvme_ccb_get(struct nvme_queue *, bool);
69 1.1 nonaka static void nvme_ccb_put(struct nvme_queue *, struct nvme_ccb *);
70 1.1 nonaka
71 1.1 nonaka static int nvme_poll(struct nvme_softc *, struct nvme_queue *,
72 1.1 nonaka struct nvme_ccb *, void (*)(struct nvme_queue *,
73 1.7 jdolecek struct nvme_ccb *, void *), int);
74 1.1 nonaka static void nvme_poll_fill(struct nvme_queue *, struct nvme_ccb *, void *);
75 1.1 nonaka static void nvme_poll_done(struct nvme_queue *, struct nvme_ccb *,
76 1.1 nonaka struct nvme_cqe *);
77 1.1 nonaka static void nvme_sqe_fill(struct nvme_queue *, struct nvme_ccb *, void *);
78 1.1 nonaka static void nvme_empty_done(struct nvme_queue *, struct nvme_ccb *,
79 1.1 nonaka struct nvme_cqe *);
80 1.1 nonaka
81 1.1 nonaka static struct nvme_queue *
82 1.1 nonaka nvme_q_alloc(struct nvme_softc *, uint16_t, u_int, u_int);
83 1.1 nonaka static int nvme_q_create(struct nvme_softc *, struct nvme_queue *);
84 1.1 nonaka static int nvme_q_delete(struct nvme_softc *, struct nvme_queue *);
85 1.1 nonaka static void nvme_q_submit(struct nvme_softc *, struct nvme_queue *,
86 1.1 nonaka struct nvme_ccb *, void (*)(struct nvme_queue *,
87 1.1 nonaka struct nvme_ccb *, void *));
88 1.1 nonaka static int nvme_q_complete(struct nvme_softc *, struct nvme_queue *q);
89 1.1 nonaka static void nvme_q_free(struct nvme_softc *, struct nvme_queue *);
90 1.34 jdolecek static void nvme_q_wait_complete(struct nvme_softc *, struct nvme_queue *,
91 1.34 jdolecek bool (*)(void *), void *);
92 1.1 nonaka
93 1.19 jdolecek static struct nvme_dmamem *
94 1.19 jdolecek nvme_dmamem_alloc(struct nvme_softc *, size_t);
95 1.1 nonaka static void nvme_dmamem_free(struct nvme_softc *, struct nvme_dmamem *);
96 1.19 jdolecek static void nvme_dmamem_sync(struct nvme_softc *, struct nvme_dmamem *,
97 1.19 jdolecek int);
98 1.1 nonaka
99 1.1 nonaka static void nvme_ns_io_fill(struct nvme_queue *, struct nvme_ccb *,
100 1.1 nonaka void *);
101 1.1 nonaka static void nvme_ns_io_done(struct nvme_queue *, struct nvme_ccb *,
102 1.1 nonaka struct nvme_cqe *);
103 1.1 nonaka static void nvme_ns_sync_fill(struct nvme_queue *, struct nvme_ccb *,
104 1.1 nonaka void *);
105 1.1 nonaka static void nvme_ns_sync_done(struct nvme_queue *, struct nvme_ccb *,
106 1.1 nonaka struct nvme_cqe *);
107 1.25 jdolecek static void nvme_getcache_fill(struct nvme_queue *, struct nvme_ccb *,
108 1.25 jdolecek void *);
109 1.25 jdolecek static void nvme_getcache_done(struct nvme_queue *, struct nvme_ccb *,
110 1.25 jdolecek struct nvme_cqe *);
111 1.1 nonaka
112 1.3 nonaka static void nvme_pt_fill(struct nvme_queue *, struct nvme_ccb *,
113 1.3 nonaka void *);
114 1.3 nonaka static void nvme_pt_done(struct nvme_queue *, struct nvme_ccb *,
115 1.3 nonaka struct nvme_cqe *);
116 1.3 nonaka static int nvme_command_passthrough(struct nvme_softc *,
117 1.3 nonaka struct nvme_pt_command *, uint16_t, struct lwp *, bool);
118 1.3 nonaka
119 1.23 nonaka static int nvme_get_number_of_queues(struct nvme_softc *, u_int *);
120 1.23 nonaka
121 1.7 jdolecek #define NVME_TIMO_QOP 5 /* queue create and delete timeout */
122 1.7 jdolecek #define NVME_TIMO_IDENT 10 /* probe identify timeout */
123 1.7 jdolecek #define NVME_TIMO_PT -1 /* passthrough cmd timeout */
124 1.13 jdolecek #define NVME_TIMO_SY 60 /* sync cache timeout */
125 1.7 jdolecek
126 1.1 nonaka #define nvme_read4(_s, _r) \
127 1.1 nonaka bus_space_read_4((_s)->sc_iot, (_s)->sc_ioh, (_r))
128 1.1 nonaka #define nvme_write4(_s, _r, _v) \
129 1.1 nonaka bus_space_write_4((_s)->sc_iot, (_s)->sc_ioh, (_r), (_v))
130 1.28 nonaka /*
131 1.28 nonaka * Some controllers, at least Apple NVMe, always require split
132 1.28 nonaka * transfers, so don't use bus_space_{read,write}_8() on LP64.
133 1.28 nonaka */
134 1.1 nonaka static inline uint64_t
135 1.1 nonaka nvme_read8(struct nvme_softc *sc, bus_size_t r)
136 1.1 nonaka {
137 1.1 nonaka uint64_t v;
138 1.1 nonaka uint32_t *a = (uint32_t *)&v;
139 1.1 nonaka
140 1.1 nonaka #if _BYTE_ORDER == _LITTLE_ENDIAN
141 1.1 nonaka a[0] = nvme_read4(sc, r);
142 1.1 nonaka a[1] = nvme_read4(sc, r + 4);
143 1.1 nonaka #else /* _BYTE_ORDER == _LITTLE_ENDIAN */
144 1.1 nonaka a[1] = nvme_read4(sc, r);
145 1.1 nonaka a[0] = nvme_read4(sc, r + 4);
146 1.1 nonaka #endif
147 1.1 nonaka
148 1.1 nonaka return v;
149 1.1 nonaka }
150 1.1 nonaka
151 1.1 nonaka static inline void
152 1.1 nonaka nvme_write8(struct nvme_softc *sc, bus_size_t r, uint64_t v)
153 1.1 nonaka {
154 1.1 nonaka uint32_t *a = (uint32_t *)&v;
155 1.1 nonaka
156 1.1 nonaka #if _BYTE_ORDER == _LITTLE_ENDIAN
157 1.1 nonaka nvme_write4(sc, r, a[0]);
158 1.1 nonaka nvme_write4(sc, r + 4, a[1]);
159 1.1 nonaka #else /* _BYTE_ORDER == _LITTLE_ENDIAN */
160 1.1 nonaka nvme_write4(sc, r, a[1]);
161 1.1 nonaka nvme_write4(sc, r + 4, a[0]);
162 1.1 nonaka #endif
163 1.1 nonaka }
164 1.1 nonaka #define nvme_barrier(_s, _r, _l, _f) \
165 1.1 nonaka bus_space_barrier((_s)->sc_iot, (_s)->sc_ioh, (_r), (_l), (_f))
166 1.1 nonaka
#ifdef NVME_DEBUG
/*
 * Debug aid: print the CAP, VS, CC, CSTS, AQA, ASQ and ACQ registers,
 * together with the fields decoded from CAP, CC, CSTS and AQA.
 *
 * CAP is read once and the same snapshot is used for both the raw value
 * and the decoded fields, so the two cannot disagree.
 */
static __used void
nvme_dumpregs(struct nvme_softc *sc)
{
	uint64_t r8;
	uint32_t r4;

#define	DEVNAME(_sc)	device_xname((_sc)->sc_dev)
	r8 = nvme_read8(sc, NVME_CAP);
	printf("%s: cap 0x%016"PRIx64"\n", DEVNAME(sc), r8);
	/* 1U keeps the shifted value unsigned to match the %u conversion. */
	printf("%s: mpsmax %u (%u)\n", DEVNAME(sc),
	    (u_int)NVME_CAP_MPSMAX(r8), (1U << NVME_CAP_MPSMAX(r8)));
	printf("%s: mpsmin %u (%u)\n", DEVNAME(sc),
	    (u_int)NVME_CAP_MPSMIN(r8), (1U << NVME_CAP_MPSMIN(r8)));
	printf("%s: css %"PRIu64"\n", DEVNAME(sc), NVME_CAP_CSS(r8));
	printf("%s: nssrs %"PRIu64"\n", DEVNAME(sc), NVME_CAP_NSSRS(r8));
	printf("%s: dstrd %"PRIu64"\n", DEVNAME(sc), NVME_CAP_DSTRD(r8));
	printf("%s: to %"PRIu64" msec\n", DEVNAME(sc), NVME_CAP_TO(r8));
	printf("%s: ams %"PRIu64"\n", DEVNAME(sc), NVME_CAP_AMS(r8));
	printf("%s: cqr %"PRIu64"\n", DEVNAME(sc), NVME_CAP_CQR(r8));
	printf("%s: mqes %"PRIu64"\n", DEVNAME(sc), NVME_CAP_MQES(r8));

	printf("%s: vs 0x%04x\n", DEVNAME(sc), nvme_read4(sc, NVME_VS));

	r4 = nvme_read4(sc, NVME_CC);
	printf("%s: cc 0x%04x\n", DEVNAME(sc), r4);
	printf("%s: iocqes %u (%u)\n", DEVNAME(sc), NVME_CC_IOCQES_R(r4),
	    (1U << NVME_CC_IOCQES_R(r4)));
	printf("%s: iosqes %u (%u)\n", DEVNAME(sc), NVME_CC_IOSQES_R(r4),
	    (1U << NVME_CC_IOSQES_R(r4)));
	printf("%s: shn %u\n", DEVNAME(sc), NVME_CC_SHN_R(r4));
	printf("%s: ams %u\n", DEVNAME(sc), NVME_CC_AMS_R(r4));
	printf("%s: mps %u (%u)\n", DEVNAME(sc), NVME_CC_MPS_R(r4),
	    (1U << NVME_CC_MPS_R(r4)));
	printf("%s: css %u\n", DEVNAME(sc), NVME_CC_CSS_R(r4));
	printf("%s: en %u\n", DEVNAME(sc), ISSET(r4, NVME_CC_EN) ? 1 : 0);

	r4 = nvme_read4(sc, NVME_CSTS);
	printf("%s: csts 0x%08x\n", DEVNAME(sc), r4);
	printf("%s: rdy %u\n", DEVNAME(sc), r4 & NVME_CSTS_RDY);
	printf("%s: cfs %u\n", DEVNAME(sc), r4 & NVME_CSTS_CFS);
	printf("%s: shst %x\n", DEVNAME(sc), r4 & NVME_CSTS_SHST_MASK);

	r4 = nvme_read4(sc, NVME_AQA);
	printf("%s: aqa 0x%08x\n", DEVNAME(sc), r4);
	printf("%s: acqs %u\n", DEVNAME(sc), NVME_AQA_ACQS_R(r4));
	printf("%s: asqs %u\n", DEVNAME(sc), NVME_AQA_ASQS_R(r4));

	printf("%s: asq 0x%016"PRIx64"\n", DEVNAME(sc), nvme_read8(sc, NVME_ASQ));
	printf("%s: acq 0x%016"PRIx64"\n", DEVNAME(sc), nvme_read8(sc, NVME_ACQ));
#undef	DEVNAME
}
#endif	/* NVME_DEBUG */
220 1.1 nonaka
221 1.1 nonaka static int
222 1.1 nonaka nvme_ready(struct nvme_softc *sc, uint32_t rdy)
223 1.1 nonaka {
224 1.1 nonaka u_int i = 0;
225 1.1 nonaka
226 1.1 nonaka while ((nvme_read4(sc, NVME_CSTS) & NVME_CSTS_RDY) != rdy) {
227 1.1 nonaka if (i++ > sc->sc_rdy_to)
228 1.8 jdolecek return ENXIO;
229 1.1 nonaka
230 1.1 nonaka delay(1000);
231 1.1 nonaka nvme_barrier(sc, NVME_CSTS, 4, BUS_SPACE_BARRIER_READ);
232 1.1 nonaka }
233 1.1 nonaka
234 1.1 nonaka return 0;
235 1.1 nonaka }
236 1.1 nonaka
237 1.1 nonaka static int
238 1.1 nonaka nvme_enable(struct nvme_softc *sc, u_int mps)
239 1.1 nonaka {
240 1.8 jdolecek uint32_t cc, csts;
241 1.38 nonaka int error;
242 1.1 nonaka
243 1.1 nonaka cc = nvme_read4(sc, NVME_CC);
244 1.8 jdolecek csts = nvme_read4(sc, NVME_CSTS);
245 1.38 nonaka
246 1.38 nonaka /*
247 1.38 nonaka * See note in nvme_disable. Short circuit if we're already enabled.
248 1.38 nonaka */
249 1.7 jdolecek if (ISSET(cc, NVME_CC_EN)) {
250 1.8 jdolecek if (ISSET(csts, NVME_CSTS_RDY))
251 1.38 nonaka return 0;
252 1.8 jdolecek
253 1.8 jdolecek goto waitready;
254 1.38 nonaka } else {
255 1.38 nonaka /* EN == 0 already wait for RDY == 0 or fail */
256 1.38 nonaka error = nvme_ready(sc, 0);
257 1.38 nonaka if (error)
258 1.38 nonaka return error;
259 1.7 jdolecek }
260 1.1 nonaka
261 1.1 nonaka nvme_write8(sc, NVME_ASQ, NVME_DMA_DVA(sc->sc_admin_q->q_sq_dmamem));
262 1.1 nonaka nvme_barrier(sc, 0, sc->sc_ios, BUS_SPACE_BARRIER_WRITE);
263 1.8 jdolecek delay(5000);
264 1.1 nonaka nvme_write8(sc, NVME_ACQ, NVME_DMA_DVA(sc->sc_admin_q->q_cq_dmamem));
265 1.1 nonaka nvme_barrier(sc, 0, sc->sc_ios, BUS_SPACE_BARRIER_WRITE);
266 1.8 jdolecek delay(5000);
267 1.8 jdolecek
268 1.8 jdolecek nvme_write4(sc, NVME_AQA, NVME_AQA_ACQS(sc->sc_admin_q->q_entries) |
269 1.8 jdolecek NVME_AQA_ASQS(sc->sc_admin_q->q_entries));
270 1.8 jdolecek nvme_barrier(sc, 0, sc->sc_ios, BUS_SPACE_BARRIER_WRITE);
271 1.8 jdolecek delay(5000);
272 1.1 nonaka
273 1.1 nonaka CLR(cc, NVME_CC_IOCQES_MASK | NVME_CC_IOSQES_MASK | NVME_CC_SHN_MASK |
274 1.1 nonaka NVME_CC_AMS_MASK | NVME_CC_MPS_MASK | NVME_CC_CSS_MASK);
275 1.1 nonaka SET(cc, NVME_CC_IOSQES(ffs(64) - 1) | NVME_CC_IOCQES(ffs(16) - 1));
276 1.1 nonaka SET(cc, NVME_CC_SHN(NVME_CC_SHN_NONE));
277 1.1 nonaka SET(cc, NVME_CC_CSS(NVME_CC_CSS_NVM));
278 1.1 nonaka SET(cc, NVME_CC_AMS(NVME_CC_AMS_RR));
279 1.1 nonaka SET(cc, NVME_CC_MPS(mps));
280 1.1 nonaka SET(cc, NVME_CC_EN);
281 1.1 nonaka
282 1.1 nonaka nvme_write4(sc, NVME_CC, cc);
283 1.1 nonaka nvme_barrier(sc, 0, sc->sc_ios,
284 1.1 nonaka BUS_SPACE_BARRIER_READ | BUS_SPACE_BARRIER_WRITE);
285 1.1 nonaka
286 1.8 jdolecek waitready:
287 1.1 nonaka return nvme_ready(sc, NVME_CSTS_RDY);
288 1.1 nonaka }
289 1.1 nonaka
290 1.1 nonaka static int
291 1.1 nonaka nvme_disable(struct nvme_softc *sc)
292 1.1 nonaka {
293 1.1 nonaka uint32_t cc, csts;
294 1.38 nonaka int error;
295 1.1 nonaka
296 1.1 nonaka cc = nvme_read4(sc, NVME_CC);
297 1.8 jdolecek csts = nvme_read4(sc, NVME_CSTS);
298 1.8 jdolecek
299 1.38 nonaka /*
300 1.38 nonaka * Per 3.1.5 in NVME 1.3 spec, transitioning CC.EN from 0 to 1
301 1.38 nonaka * when CSTS.RDY is 1 or transitioning CC.EN from 1 to 0 when
302 1.38 nonaka * CSTS.RDY is 0 "has undefined results" So make sure that CSTS.RDY
303 1.38 nonaka * isn't the desired value. Short circuit if we're already disabled.
304 1.38 nonaka */
305 1.38 nonaka if (ISSET(cc, NVME_CC_EN)) {
306 1.38 nonaka if (!ISSET(csts, NVME_CSTS_RDY)) {
307 1.38 nonaka /* EN == 1, wait for RDY == 1 or fail */
308 1.38 nonaka error = nvme_ready(sc, NVME_CSTS_RDY);
309 1.38 nonaka if (error)
310 1.38 nonaka return error;
311 1.38 nonaka }
312 1.38 nonaka } else {
313 1.38 nonaka /* EN == 0 already wait for RDY == 0 */
314 1.38 nonaka if (!ISSET(csts, NVME_CSTS_RDY))
315 1.38 nonaka return 0;
316 1.38 nonaka
317 1.38 nonaka goto waitready;
318 1.38 nonaka }
319 1.1 nonaka
320 1.1 nonaka CLR(cc, NVME_CC_EN);
321 1.1 nonaka nvme_write4(sc, NVME_CC, cc);
322 1.8 jdolecek nvme_barrier(sc, 0, sc->sc_ios, BUS_SPACE_BARRIER_READ);
323 1.1 nonaka
324 1.38 nonaka /*
325 1.38 nonaka * Some drives have issues with accessing the mmio after we disable,
326 1.38 nonaka * so delay for a bit after we write the bit to cope with these issues.
327 1.38 nonaka */
328 1.38 nonaka if (ISSET(sc->sc_quirks, NVME_QUIRK_DELAY_B4_CHK_RDY))
329 1.38 nonaka delay(B4_CHK_RDY_DELAY_MS);
330 1.38 nonaka
331 1.38 nonaka waitready:
332 1.1 nonaka return nvme_ready(sc, 0);
333 1.1 nonaka }
334 1.1 nonaka
335 1.1 nonaka int
336 1.1 nonaka nvme_attach(struct nvme_softc *sc)
337 1.1 nonaka {
338 1.1 nonaka uint64_t cap;
339 1.1 nonaka uint32_t reg;
340 1.1 nonaka u_int dstrd;
341 1.1 nonaka u_int mps = PAGE_SHIFT;
342 1.23 nonaka u_int ioq_allocated;
343 1.20 jdolecek uint16_t adminq_entries = nvme_adminq_size;
344 1.20 jdolecek uint16_t ioq_entries = nvme_ioq_size;
345 1.1 nonaka int i;
346 1.1 nonaka
347 1.1 nonaka reg = nvme_read4(sc, NVME_VS);
348 1.1 nonaka if (reg == 0xffffffff) {
349 1.1 nonaka aprint_error_dev(sc->sc_dev, "invalid mapping\n");
350 1.1 nonaka return 1;
351 1.1 nonaka }
352 1.1 nonaka
353 1.27 nonaka if (NVME_VS_TER(reg) == 0)
354 1.27 nonaka aprint_normal_dev(sc->sc_dev, "NVMe %d.%d\n", NVME_VS_MJR(reg),
355 1.27 nonaka NVME_VS_MNR(reg));
356 1.27 nonaka else
357 1.27 nonaka aprint_normal_dev(sc->sc_dev, "NVMe %d.%d.%d\n", NVME_VS_MJR(reg),
358 1.27 nonaka NVME_VS_MNR(reg), NVME_VS_TER(reg));
359 1.1 nonaka
360 1.1 nonaka cap = nvme_read8(sc, NVME_CAP);
361 1.1 nonaka dstrd = NVME_CAP_DSTRD(cap);
362 1.1 nonaka if (NVME_CAP_MPSMIN(cap) > PAGE_SHIFT) {
363 1.1 nonaka aprint_error_dev(sc->sc_dev, "NVMe minimum page size %u "
364 1.1 nonaka "is greater than CPU page size %u\n",
365 1.1 nonaka 1 << NVME_CAP_MPSMIN(cap), 1 << PAGE_SHIFT);
366 1.1 nonaka return 1;
367 1.1 nonaka }
368 1.1 nonaka if (NVME_CAP_MPSMAX(cap) < mps)
369 1.1 nonaka mps = NVME_CAP_MPSMAX(cap);
370 1.15 nonaka if (ioq_entries > NVME_CAP_MQES(cap))
371 1.15 nonaka ioq_entries = NVME_CAP_MQES(cap);
372 1.1 nonaka
373 1.8 jdolecek /* set initial values to be used for admin queue during probe */
374 1.1 nonaka sc->sc_rdy_to = NVME_CAP_TO(cap);
375 1.1 nonaka sc->sc_mps = 1 << mps;
376 1.1 nonaka sc->sc_mdts = MAXPHYS;
377 1.1 nonaka sc->sc_max_sgl = 2;
378 1.1 nonaka
379 1.1 nonaka if (nvme_disable(sc) != 0) {
380 1.1 nonaka aprint_error_dev(sc->sc_dev, "unable to disable controller\n");
381 1.1 nonaka return 1;
382 1.1 nonaka }
383 1.1 nonaka
384 1.1 nonaka sc->sc_admin_q = nvme_q_alloc(sc, NVME_ADMIN_Q, adminq_entries, dstrd);
385 1.1 nonaka if (sc->sc_admin_q == NULL) {
386 1.1 nonaka aprint_error_dev(sc->sc_dev,
387 1.1 nonaka "unable to allocate admin queue\n");
388 1.1 nonaka return 1;
389 1.1 nonaka }
390 1.1 nonaka if (sc->sc_intr_establish(sc, NVME_ADMIN_Q, sc->sc_admin_q))
391 1.1 nonaka goto free_admin_q;
392 1.1 nonaka
393 1.1 nonaka if (nvme_enable(sc, mps) != 0) {
394 1.1 nonaka aprint_error_dev(sc->sc_dev, "unable to enable controller\n");
395 1.1 nonaka goto disestablish_admin_q;
396 1.1 nonaka }
397 1.1 nonaka
398 1.1 nonaka if (nvme_identify(sc, NVME_CAP_MPSMIN(cap)) != 0) {
399 1.1 nonaka aprint_error_dev(sc->sc_dev, "unable to identify controller\n");
400 1.1 nonaka goto disable;
401 1.1 nonaka }
402 1.1 nonaka
403 1.1 nonaka /* we know how big things are now */
404 1.1 nonaka sc->sc_max_sgl = sc->sc_mdts / sc->sc_mps;
405 1.1 nonaka
406 1.1 nonaka /* reallocate ccbs of admin queue with new max sgl. */
407 1.1 nonaka nvme_ccbs_free(sc->sc_admin_q);
408 1.1 nonaka nvme_ccbs_alloc(sc->sc_admin_q, sc->sc_admin_q->q_entries);
409 1.1 nonaka
410 1.23 nonaka if (sc->sc_use_mq) {
411 1.23 nonaka /* Limit the number of queues to the number allocated in HW */
412 1.23 nonaka if (nvme_get_number_of_queues(sc, &ioq_allocated) != 0) {
413 1.23 nonaka aprint_error_dev(sc->sc_dev,
414 1.23 nonaka "unable to get number of queues\n");
415 1.23 nonaka goto disable;
416 1.23 nonaka }
417 1.23 nonaka if (sc->sc_nq > ioq_allocated)
418 1.23 nonaka sc->sc_nq = ioq_allocated;
419 1.23 nonaka }
420 1.23 nonaka
421 1.1 nonaka sc->sc_q = kmem_zalloc(sizeof(*sc->sc_q) * sc->sc_nq, KM_SLEEP);
422 1.1 nonaka for (i = 0; i < sc->sc_nq; i++) {
423 1.1 nonaka sc->sc_q[i] = nvme_q_alloc(sc, i + 1, ioq_entries, dstrd);
424 1.1 nonaka if (sc->sc_q[i] == NULL) {
425 1.1 nonaka aprint_error_dev(sc->sc_dev,
426 1.1 nonaka "unable to allocate io queue\n");
427 1.1 nonaka goto free_q;
428 1.1 nonaka }
429 1.1 nonaka if (nvme_q_create(sc, sc->sc_q[i]) != 0) {
430 1.1 nonaka aprint_error_dev(sc->sc_dev,
431 1.1 nonaka "unable to create io queue\n");
432 1.1 nonaka nvme_q_free(sc, sc->sc_q[i]);
433 1.1 nonaka goto free_q;
434 1.1 nonaka }
435 1.1 nonaka }
436 1.1 nonaka
437 1.1 nonaka if (!sc->sc_use_mq)
438 1.1 nonaka nvme_write4(sc, NVME_INTMC, 1);
439 1.1 nonaka
440 1.9 jdolecek /* probe subdevices */
441 1.1 nonaka sc->sc_namespaces = kmem_zalloc(sizeof(*sc->sc_namespaces) * sc->sc_nn,
442 1.1 nonaka KM_SLEEP);
443 1.14 pgoyette nvme_rescan(sc->sc_dev, "nvme", &i);
444 1.1 nonaka
445 1.1 nonaka return 0;
446 1.1 nonaka
447 1.1 nonaka free_q:
448 1.1 nonaka while (--i >= 0) {
449 1.1 nonaka nvme_q_delete(sc, sc->sc_q[i]);
450 1.1 nonaka nvme_q_free(sc, sc->sc_q[i]);
451 1.1 nonaka }
452 1.1 nonaka disable:
453 1.1 nonaka nvme_disable(sc);
454 1.1 nonaka disestablish_admin_q:
455 1.1 nonaka sc->sc_intr_disestablish(sc, NVME_ADMIN_Q);
456 1.1 nonaka free_admin_q:
457 1.1 nonaka nvme_q_free(sc, sc->sc_admin_q);
458 1.1 nonaka
459 1.1 nonaka return 1;
460 1.1 nonaka }
461 1.1 nonaka
462 1.14 pgoyette int
463 1.14 pgoyette nvme_rescan(device_t self, const char *attr, const int *flags)
464 1.14 pgoyette {
465 1.14 pgoyette struct nvme_softc *sc = device_private(self);
466 1.14 pgoyette struct nvme_attach_args naa;
467 1.15 nonaka uint64_t cap;
468 1.15 nonaka int ioq_entries = nvme_ioq_size;
469 1.15 nonaka int i;
470 1.15 nonaka
471 1.15 nonaka cap = nvme_read8(sc, NVME_CAP);
472 1.15 nonaka if (ioq_entries > NVME_CAP_MQES(cap))
473 1.15 nonaka ioq_entries = NVME_CAP_MQES(cap);
474 1.14 pgoyette
475 1.14 pgoyette for (i = 0; i < sc->sc_nn; i++) {
476 1.14 pgoyette if (sc->sc_namespaces[i].dev)
477 1.14 pgoyette continue;
478 1.14 pgoyette memset(&naa, 0, sizeof(naa));
479 1.14 pgoyette naa.naa_nsid = i + 1;
480 1.21 jdolecek naa.naa_qentries = (ioq_entries - 1) * sc->sc_nq;
481 1.21 jdolecek naa.naa_maxphys = sc->sc_mdts;
482 1.14 pgoyette sc->sc_namespaces[i].dev = config_found(sc->sc_dev, &naa,
483 1.14 pgoyette nvme_print);
484 1.14 pgoyette }
485 1.14 pgoyette return 0;
486 1.14 pgoyette }
487 1.14 pgoyette
488 1.1 nonaka static int
489 1.1 nonaka nvme_print(void *aux, const char *pnp)
490 1.1 nonaka {
491 1.1 nonaka struct nvme_attach_args *naa = aux;
492 1.1 nonaka
493 1.1 nonaka if (pnp)
494 1.1 nonaka aprint_normal("at %s", pnp);
495 1.1 nonaka
496 1.1 nonaka if (naa->naa_nsid > 0)
497 1.1 nonaka aprint_normal(" nsid %d", naa->naa_nsid);
498 1.1 nonaka
499 1.1 nonaka return UNCONF;
500 1.1 nonaka }
501 1.1 nonaka
502 1.1 nonaka int
503 1.1 nonaka nvme_detach(struct nvme_softc *sc, int flags)
504 1.1 nonaka {
505 1.1 nonaka int i, error;
506 1.1 nonaka
507 1.1 nonaka error = config_detach_children(sc->sc_dev, flags);
508 1.1 nonaka if (error)
509 1.1 nonaka return error;
510 1.1 nonaka
511 1.1 nonaka error = nvme_shutdown(sc);
512 1.1 nonaka if (error)
513 1.1 nonaka return error;
514 1.1 nonaka
515 1.9 jdolecek /* from now on we are committed to detach, following will never fail */
516 1.1 nonaka for (i = 0; i < sc->sc_nq; i++)
517 1.1 nonaka nvme_q_free(sc, sc->sc_q[i]);
518 1.1 nonaka kmem_free(sc->sc_q, sizeof(*sc->sc_q) * sc->sc_nq);
519 1.1 nonaka nvme_q_free(sc, sc->sc_admin_q);
520 1.1 nonaka
521 1.1 nonaka return 0;
522 1.1 nonaka }
523 1.1 nonaka
524 1.1 nonaka static int
525 1.1 nonaka nvme_shutdown(struct nvme_softc *sc)
526 1.1 nonaka {
527 1.1 nonaka uint32_t cc, csts;
528 1.1 nonaka bool disabled = false;
529 1.1 nonaka int i;
530 1.1 nonaka
531 1.1 nonaka if (!sc->sc_use_mq)
532 1.1 nonaka nvme_write4(sc, NVME_INTMS, 1);
533 1.1 nonaka
534 1.1 nonaka for (i = 0; i < sc->sc_nq; i++) {
535 1.1 nonaka if (nvme_q_delete(sc, sc->sc_q[i]) != 0) {
536 1.1 nonaka aprint_error_dev(sc->sc_dev,
537 1.1 nonaka "unable to delete io queue %d, disabling\n", i + 1);
538 1.1 nonaka disabled = true;
539 1.1 nonaka }
540 1.1 nonaka }
541 1.1 nonaka sc->sc_intr_disestablish(sc, NVME_ADMIN_Q);
542 1.1 nonaka if (disabled)
543 1.1 nonaka goto disable;
544 1.1 nonaka
545 1.1 nonaka cc = nvme_read4(sc, NVME_CC);
546 1.1 nonaka CLR(cc, NVME_CC_SHN_MASK);
547 1.1 nonaka SET(cc, NVME_CC_SHN(NVME_CC_SHN_NORMAL));
548 1.1 nonaka nvme_write4(sc, NVME_CC, cc);
549 1.1 nonaka
550 1.1 nonaka for (i = 0; i < 4000; i++) {
551 1.1 nonaka nvme_barrier(sc, 0, sc->sc_ios,
552 1.1 nonaka BUS_SPACE_BARRIER_READ | BUS_SPACE_BARRIER_WRITE);
553 1.1 nonaka csts = nvme_read4(sc, NVME_CSTS);
554 1.1 nonaka if ((csts & NVME_CSTS_SHST_MASK) == NVME_CSTS_SHST_DONE)
555 1.1 nonaka return 0;
556 1.1 nonaka
557 1.1 nonaka delay(1000);
558 1.1 nonaka }
559 1.1 nonaka
560 1.1 nonaka aprint_error_dev(sc->sc_dev, "unable to shudown, disabling\n");
561 1.1 nonaka
562 1.1 nonaka disable:
563 1.1 nonaka nvme_disable(sc);
564 1.1 nonaka return 0;
565 1.1 nonaka }
566 1.1 nonaka
567 1.1 nonaka void
568 1.1 nonaka nvme_childdet(device_t self, device_t child)
569 1.1 nonaka {
570 1.1 nonaka struct nvme_softc *sc = device_private(self);
571 1.1 nonaka int i;
572 1.1 nonaka
573 1.1 nonaka for (i = 0; i < sc->sc_nn; i++) {
574 1.1 nonaka if (sc->sc_namespaces[i].dev == child) {
575 1.1 nonaka /* Already freed ns->ident. */
576 1.1 nonaka sc->sc_namespaces[i].dev = NULL;
577 1.1 nonaka break;
578 1.1 nonaka }
579 1.1 nonaka }
580 1.1 nonaka }
581 1.1 nonaka
582 1.1 nonaka int
583 1.1 nonaka nvme_ns_identify(struct nvme_softc *sc, uint16_t nsid)
584 1.1 nonaka {
585 1.1 nonaka struct nvme_sqe sqe;
586 1.1 nonaka struct nvm_identify_namespace *identify;
587 1.19 jdolecek struct nvme_dmamem *mem;
588 1.1 nonaka struct nvme_ccb *ccb;
589 1.1 nonaka struct nvme_namespace *ns;
590 1.19 jdolecek int rv;
591 1.1 nonaka
592 1.1 nonaka KASSERT(nsid > 0);
593 1.1 nonaka
594 1.34 jdolecek ccb = nvme_ccb_get(sc->sc_admin_q, false);
595 1.11 jdolecek KASSERT(ccb != NULL); /* it's a bug if we don't have spare ccb here */
596 1.1 nonaka
597 1.19 jdolecek mem = nvme_dmamem_alloc(sc, sizeof(*identify));
598 1.32 christos if (mem == NULL) {
599 1.32 christos nvme_ccb_put(sc->sc_admin_q, ccb);
600 1.19 jdolecek return ENOMEM;
601 1.32 christos }
602 1.1 nonaka
603 1.1 nonaka memset(&sqe, 0, sizeof(sqe));
604 1.1 nonaka sqe.opcode = NVM_ADMIN_IDENTIFY;
605 1.1 nonaka htolem32(&sqe.nsid, nsid);
606 1.1 nonaka htolem64(&sqe.entry.prp[0], NVME_DMA_DVA(mem));
607 1.1 nonaka htolem32(&sqe.cdw10, 0);
608 1.1 nonaka
609 1.1 nonaka ccb->ccb_done = nvme_empty_done;
610 1.1 nonaka ccb->ccb_cookie = &sqe;
611 1.1 nonaka
612 1.1 nonaka nvme_dmamem_sync(sc, mem, BUS_DMASYNC_PREREAD);
613 1.19 jdolecek rv = nvme_poll(sc, sc->sc_admin_q, ccb, nvme_sqe_fill, NVME_TIMO_IDENT);
614 1.1 nonaka nvme_dmamem_sync(sc, mem, BUS_DMASYNC_POSTREAD);
615 1.1 nonaka
616 1.1 nonaka nvme_ccb_put(sc->sc_admin_q, ccb);
617 1.1 nonaka
618 1.19 jdolecek if (rv != 0) {
619 1.19 jdolecek rv = EIO;
620 1.1 nonaka goto done;
621 1.1 nonaka }
622 1.1 nonaka
623 1.1 nonaka /* commit */
624 1.1 nonaka
625 1.1 nonaka identify = kmem_zalloc(sizeof(*identify), KM_SLEEP);
626 1.19 jdolecek *identify = *((volatile struct nvm_identify_namespace *)NVME_DMA_KVA(mem));
627 1.19 jdolecek //memcpy(identify, NVME_DMA_KVA(mem), sizeof(*identify));
628 1.1 nonaka
629 1.1 nonaka ns = nvme_ns_get(sc, nsid);
630 1.1 nonaka KASSERT(ns);
631 1.32 christos KASSERT(ns->ident == NULL);
632 1.1 nonaka ns->ident = identify;
633 1.1 nonaka
634 1.1 nonaka done:
635 1.19 jdolecek nvme_dmamem_free(sc, mem);
636 1.1 nonaka
637 1.19 jdolecek return rv;
638 1.1 nonaka }
639 1.1 nonaka
640 1.1 nonaka int
641 1.11 jdolecek nvme_ns_dobio(struct nvme_softc *sc, uint16_t nsid, void *cookie,
642 1.11 jdolecek struct buf *bp, void *data, size_t datasize,
643 1.11 jdolecek int secsize, daddr_t blkno, int flags, nvme_nnc_done nnc_done)
644 1.1 nonaka {
645 1.1 nonaka struct nvme_queue *q = nvme_get_q(sc);
646 1.1 nonaka struct nvme_ccb *ccb;
647 1.1 nonaka bus_dmamap_t dmap;
648 1.1 nonaka int i, error;
649 1.1 nonaka
650 1.34 jdolecek ccb = nvme_ccb_get(q, false);
651 1.1 nonaka if (ccb == NULL)
652 1.1 nonaka return EAGAIN;
653 1.1 nonaka
654 1.1 nonaka ccb->ccb_done = nvme_ns_io_done;
655 1.11 jdolecek ccb->ccb_cookie = cookie;
656 1.11 jdolecek
657 1.11 jdolecek /* namespace context */
658 1.11 jdolecek ccb->nnc_nsid = nsid;
659 1.11 jdolecek ccb->nnc_flags = flags;
660 1.11 jdolecek ccb->nnc_buf = bp;
661 1.11 jdolecek ccb->nnc_datasize = datasize;
662 1.11 jdolecek ccb->nnc_secsize = secsize;
663 1.11 jdolecek ccb->nnc_blkno = blkno;
664 1.11 jdolecek ccb->nnc_done = nnc_done;
665 1.1 nonaka
666 1.1 nonaka dmap = ccb->ccb_dmamap;
667 1.11 jdolecek error = bus_dmamap_load(sc->sc_dmat, dmap, data,
668 1.11 jdolecek datasize, NULL,
669 1.11 jdolecek (ISSET(flags, NVME_NS_CTX_F_POLL) ?
670 1.1 nonaka BUS_DMA_NOWAIT : BUS_DMA_WAITOK) |
671 1.11 jdolecek (ISSET(flags, NVME_NS_CTX_F_READ) ?
672 1.1 nonaka BUS_DMA_READ : BUS_DMA_WRITE));
673 1.1 nonaka if (error) {
674 1.1 nonaka nvme_ccb_put(q, ccb);
675 1.1 nonaka return error;
676 1.1 nonaka }
677 1.1 nonaka
678 1.1 nonaka bus_dmamap_sync(sc->sc_dmat, dmap, 0, dmap->dm_mapsize,
679 1.11 jdolecek ISSET(flags, NVME_NS_CTX_F_READ) ?
680 1.1 nonaka BUS_DMASYNC_PREREAD : BUS_DMASYNC_PREWRITE);
681 1.1 nonaka
682 1.1 nonaka if (dmap->dm_nsegs > 2) {
683 1.1 nonaka for (i = 1; i < dmap->dm_nsegs; i++) {
684 1.1 nonaka htolem64(&ccb->ccb_prpl[i - 1],
685 1.1 nonaka dmap->dm_segs[i].ds_addr);
686 1.1 nonaka }
687 1.1 nonaka bus_dmamap_sync(sc->sc_dmat,
688 1.1 nonaka NVME_DMA_MAP(q->q_ccb_prpls),
689 1.1 nonaka ccb->ccb_prpl_off,
690 1.16 nonaka sizeof(*ccb->ccb_prpl) * (dmap->dm_nsegs - 1),
691 1.1 nonaka BUS_DMASYNC_PREWRITE);
692 1.1 nonaka }
693 1.1 nonaka
694 1.11 jdolecek if (ISSET(flags, NVME_NS_CTX_F_POLL)) {
695 1.7 jdolecek if (nvme_poll(sc, q, ccb, nvme_ns_io_fill, NVME_TIMO_PT) != 0)
696 1.1 nonaka return EIO;
697 1.1 nonaka return 0;
698 1.1 nonaka }
699 1.1 nonaka
700 1.1 nonaka nvme_q_submit(sc, q, ccb, nvme_ns_io_fill);
701 1.1 nonaka return 0;
702 1.1 nonaka }
703 1.1 nonaka
704 1.1 nonaka static void
705 1.1 nonaka nvme_ns_io_fill(struct nvme_queue *q, struct nvme_ccb *ccb, void *slot)
706 1.1 nonaka {
707 1.1 nonaka struct nvme_sqe_io *sqe = slot;
708 1.1 nonaka bus_dmamap_t dmap = ccb->ccb_dmamap;
709 1.1 nonaka
710 1.11 jdolecek sqe->opcode = ISSET(ccb->nnc_flags, NVME_NS_CTX_F_READ) ?
711 1.1 nonaka NVM_CMD_READ : NVM_CMD_WRITE;
712 1.11 jdolecek htolem32(&sqe->nsid, ccb->nnc_nsid);
713 1.1 nonaka
714 1.1 nonaka htolem64(&sqe->entry.prp[0], dmap->dm_segs[0].ds_addr);
715 1.1 nonaka switch (dmap->dm_nsegs) {
716 1.1 nonaka case 1:
717 1.1 nonaka break;
718 1.1 nonaka case 2:
719 1.1 nonaka htolem64(&sqe->entry.prp[1], dmap->dm_segs[1].ds_addr);
720 1.1 nonaka break;
721 1.1 nonaka default:
722 1.1 nonaka /* the prp list is already set up and synced */
723 1.1 nonaka htolem64(&sqe->entry.prp[1], ccb->ccb_prpl_dva);
724 1.1 nonaka break;
725 1.1 nonaka }
726 1.1 nonaka
727 1.11 jdolecek htolem64(&sqe->slba, ccb->nnc_blkno);
728 1.11 jdolecek
729 1.26 jdolecek if (ISSET(ccb->nnc_flags, NVME_NS_CTX_F_FUA))
730 1.26 jdolecek htolem16(&sqe->ioflags, NVM_SQE_IO_FUA);
731 1.26 jdolecek
732 1.11 jdolecek /* guaranteed by upper layers, but check just in case */
733 1.11 jdolecek KASSERT((ccb->nnc_datasize % ccb->nnc_secsize) == 0);
734 1.11 jdolecek htolem16(&sqe->nlb, (ccb->nnc_datasize / ccb->nnc_secsize) - 1);
735 1.1 nonaka }
736 1.1 nonaka
737 1.1 nonaka static void
738 1.1 nonaka nvme_ns_io_done(struct nvme_queue *q, struct nvme_ccb *ccb,
739 1.1 nonaka struct nvme_cqe *cqe)
740 1.1 nonaka {
741 1.1 nonaka struct nvme_softc *sc = q->q_sc;
742 1.1 nonaka bus_dmamap_t dmap = ccb->ccb_dmamap;
743 1.11 jdolecek void *nnc_cookie = ccb->ccb_cookie;
744 1.11 jdolecek nvme_nnc_done nnc_done = ccb->nnc_done;
745 1.11 jdolecek struct buf *bp = ccb->nnc_buf;
746 1.1 nonaka
747 1.1 nonaka if (dmap->dm_nsegs > 2) {
748 1.1 nonaka bus_dmamap_sync(sc->sc_dmat,
749 1.1 nonaka NVME_DMA_MAP(q->q_ccb_prpls),
750 1.1 nonaka ccb->ccb_prpl_off,
751 1.16 nonaka sizeof(*ccb->ccb_prpl) * (dmap->dm_nsegs - 1),
752 1.1 nonaka BUS_DMASYNC_POSTWRITE);
753 1.1 nonaka }
754 1.1 nonaka
755 1.1 nonaka bus_dmamap_sync(sc->sc_dmat, dmap, 0, dmap->dm_mapsize,
756 1.11 jdolecek ISSET(ccb->nnc_flags, NVME_NS_CTX_F_READ) ?
757 1.1 nonaka BUS_DMASYNC_POSTREAD : BUS_DMASYNC_POSTWRITE);
758 1.1 nonaka
759 1.1 nonaka bus_dmamap_unload(sc->sc_dmat, dmap);
760 1.1 nonaka nvme_ccb_put(q, ccb);
761 1.1 nonaka
762 1.25 jdolecek nnc_done(nnc_cookie, bp, lemtoh16(&cqe->flags), lemtoh32(&cqe->cdw0));
763 1.25 jdolecek }
764 1.25 jdolecek
765 1.25 jdolecek /*
766 1.25 jdolecek * If there is no volatile write cache, it makes no sense to issue
767 1.25 jdolecek * flush commands or query for the status.
768 1.25 jdolecek */
769 1.34 jdolecek static bool
770 1.25 jdolecek nvme_has_volatile_write_cache(struct nvme_softc *sc)
771 1.25 jdolecek {
772 1.25 jdolecek /* sc_identify is filled during attachment */
773 1.25 jdolecek return ((sc->sc_identify.vwc & NVME_ID_CTRLR_VWC_PRESENT) != 0);
774 1.1 nonaka }
775 1.1 nonaka
/*
 * Wait predicate for nvme_ns_sync(): the cookie points at the int result
 * slot, which stays zero until the completion handler stores an outcome.
 */
static bool
nvme_ns_sync_finished(void *cookie)
{
	const int *outcome = cookie;

	if (*outcome == 0)
		return false;

	return true;
}
783 1.34 jdolecek
784 1.1 nonaka int
785 1.34 jdolecek nvme_ns_sync(struct nvme_softc *sc, uint16_t nsid, int flags)
786 1.1 nonaka {
787 1.1 nonaka struct nvme_queue *q = nvme_get_q(sc);
788 1.1 nonaka struct nvme_ccb *ccb;
789 1.34 jdolecek int result = 0;
790 1.34 jdolecek
791 1.34 jdolecek if (!nvme_has_volatile_write_cache(sc)) {
792 1.34 jdolecek /* cache not present, no value in trying to flush it */
793 1.34 jdolecek return 0;
794 1.34 jdolecek }
795 1.1 nonaka
796 1.34 jdolecek ccb = nvme_ccb_get(q, true);
797 1.1 nonaka if (ccb == NULL)
798 1.1 nonaka return EAGAIN;
799 1.1 nonaka
800 1.1 nonaka ccb->ccb_done = nvme_ns_sync_done;
801 1.34 jdolecek ccb->ccb_cookie = &result;
802 1.1 nonaka
803 1.11 jdolecek /* namespace context */
804 1.11 jdolecek ccb->nnc_nsid = nsid;
805 1.11 jdolecek ccb->nnc_flags = flags;
806 1.34 jdolecek ccb->nnc_done = NULL;
807 1.11 jdolecek
808 1.11 jdolecek if (ISSET(flags, NVME_NS_CTX_F_POLL)) {
809 1.7 jdolecek if (nvme_poll(sc, q, ccb, nvme_ns_sync_fill, NVME_TIMO_SY) != 0)
810 1.1 nonaka return EIO;
811 1.1 nonaka return 0;
812 1.1 nonaka }
813 1.1 nonaka
814 1.1 nonaka nvme_q_submit(sc, q, ccb, nvme_ns_sync_fill);
815 1.34 jdolecek
816 1.34 jdolecek /* wait for completion */
817 1.34 jdolecek nvme_q_wait_complete(sc, q, nvme_ns_sync_finished, &result);
818 1.34 jdolecek KASSERT(result != 0);
819 1.34 jdolecek
820 1.34 jdolecek return (result > 0) ? 0 : EIO;
821 1.1 nonaka }
822 1.1 nonaka
823 1.1 nonaka static void
824 1.1 nonaka nvme_ns_sync_fill(struct nvme_queue *q, struct nvme_ccb *ccb, void *slot)
825 1.1 nonaka {
826 1.1 nonaka struct nvme_sqe *sqe = slot;
827 1.1 nonaka
828 1.1 nonaka sqe->opcode = NVM_CMD_FLUSH;
829 1.11 jdolecek htolem32(&sqe->nsid, ccb->nnc_nsid);
830 1.1 nonaka }
831 1.1 nonaka
832 1.1 nonaka static void
833 1.1 nonaka nvme_ns_sync_done(struct nvme_queue *q, struct nvme_ccb *ccb,
834 1.1 nonaka struct nvme_cqe *cqe)
835 1.1 nonaka {
836 1.34 jdolecek int *result = ccb->ccb_cookie;
837 1.34 jdolecek uint16_t status = NVME_CQE_SC(lemtoh16(&cqe->flags));
838 1.34 jdolecek
839 1.34 jdolecek if (status == NVME_CQE_SC_SUCCESS)
840 1.34 jdolecek *result = 1;
841 1.34 jdolecek else
842 1.34 jdolecek *result = -1;
843 1.1 nonaka
844 1.1 nonaka nvme_ccb_put(q, ccb);
845 1.34 jdolecek }
846 1.34 jdolecek
/*
 * Wait predicate for nvme_admin_getcache(): `xc' points at the int result
 * slot, which is zero until the completion handler has written to it.
 */
static bool
nvme_getcache_finished(void *xc)
{
	const int *slot = xc;

	if (*slot == 0)
		return false;

	return true;
}
854 1.25 jdolecek
855 1.25 jdolecek /*
856 1.25 jdolecek * Get status of volatile write cache. Always asynchronous.
857 1.25 jdolecek */
858 1.25 jdolecek int
859 1.34 jdolecek nvme_admin_getcache(struct nvme_softc *sc, int *addr)
860 1.25 jdolecek {
861 1.25 jdolecek struct nvme_ccb *ccb;
862 1.25 jdolecek struct nvme_queue *q = sc->sc_admin_q;
863 1.34 jdolecek int result = 0, error;
864 1.25 jdolecek
865 1.34 jdolecek if (!nvme_has_volatile_write_cache(sc)) {
866 1.34 jdolecek /* cache simply not present */
867 1.34 jdolecek *addr = 0;
868 1.34 jdolecek return 0;
869 1.34 jdolecek }
870 1.34 jdolecek
871 1.34 jdolecek ccb = nvme_ccb_get(q, true);
872 1.34 jdolecek KASSERT(ccb != NULL);
873 1.25 jdolecek
874 1.25 jdolecek ccb->ccb_done = nvme_getcache_done;
875 1.34 jdolecek ccb->ccb_cookie = &result;
876 1.25 jdolecek
877 1.25 jdolecek /* namespace context */
878 1.25 jdolecek ccb->nnc_flags = 0;
879 1.34 jdolecek ccb->nnc_done = NULL;
880 1.25 jdolecek
881 1.25 jdolecek nvme_q_submit(sc, q, ccb, nvme_getcache_fill);
882 1.34 jdolecek
883 1.34 jdolecek /* wait for completion */
884 1.34 jdolecek nvme_q_wait_complete(sc, q, nvme_getcache_finished, &result);
885 1.34 jdolecek KASSERT(result != 0);
886 1.34 jdolecek
887 1.34 jdolecek if (result > 0) {
888 1.34 jdolecek *addr = result;
889 1.34 jdolecek error = 0;
890 1.34 jdolecek } else
891 1.34 jdolecek error = EINVAL;
892 1.34 jdolecek
893 1.34 jdolecek return error;
894 1.25 jdolecek }
895 1.25 jdolecek
896 1.25 jdolecek static void
897 1.25 jdolecek nvme_getcache_fill(struct nvme_queue *q, struct nvme_ccb *ccb, void *slot)
898 1.25 jdolecek {
899 1.25 jdolecek struct nvme_sqe *sqe = slot;
900 1.25 jdolecek
901 1.25 jdolecek sqe->opcode = NVM_ADMIN_GET_FEATURES;
902 1.25 jdolecek sqe->cdw10 = NVM_FEATURE_VOLATILE_WRITE_CACHE;
903 1.25 jdolecek }
904 1.25 jdolecek
905 1.25 jdolecek static void
906 1.25 jdolecek nvme_getcache_done(struct nvme_queue *q, struct nvme_ccb *ccb,
907 1.25 jdolecek struct nvme_cqe *cqe)
908 1.25 jdolecek {
909 1.34 jdolecek int *addr = ccb->ccb_cookie;
910 1.34 jdolecek uint16_t status = NVME_CQE_SC(lemtoh16(&cqe->flags));
911 1.34 jdolecek uint32_t cdw0 = lemtoh32(&cqe->cdw0);
912 1.34 jdolecek int result;
913 1.34 jdolecek
914 1.34 jdolecek if (status == NVME_CQE_SC_SUCCESS) {
915 1.34 jdolecek result = 0;
916 1.34 jdolecek
917 1.34 jdolecek /*
918 1.34 jdolecek * DPO not supported, Dataset Management (DSM) field doesn't
919 1.34 jdolecek * specify the same semantics. FUA is always supported.
920 1.34 jdolecek */
921 1.34 jdolecek result = DKCACHE_FUA;
922 1.34 jdolecek
923 1.34 jdolecek if (cdw0 & NVME_CQE_CDW0_VWC_WCE)
924 1.34 jdolecek result |= DKCACHE_WRITE;
925 1.34 jdolecek
926 1.34 jdolecek /*
927 1.34 jdolecek * If volatile write cache is present, the flag shall also be
928 1.34 jdolecek * settable.
929 1.34 jdolecek */
930 1.34 jdolecek result |= DKCACHE_WCHANGE;
931 1.34 jdolecek } else {
932 1.34 jdolecek result = -1;
933 1.34 jdolecek }
934 1.34 jdolecek
935 1.34 jdolecek *addr = result;
936 1.25 jdolecek
937 1.25 jdolecek nvme_ccb_put(q, ccb);
938 1.1 nonaka }
939 1.1 nonaka
940 1.1 nonaka void
941 1.1 nonaka nvme_ns_free(struct nvme_softc *sc, uint16_t nsid)
942 1.1 nonaka {
943 1.1 nonaka struct nvme_namespace *ns;
944 1.1 nonaka struct nvm_identify_namespace *identify;
945 1.1 nonaka
946 1.1 nonaka ns = nvme_ns_get(sc, nsid);
947 1.1 nonaka KASSERT(ns);
948 1.1 nonaka
949 1.1 nonaka identify = ns->ident;
950 1.1 nonaka ns->ident = NULL;
951 1.1 nonaka if (identify != NULL)
952 1.1 nonaka kmem_free(identify, sizeof(*identify));
953 1.1 nonaka }
954 1.1 nonaka
/*
 * Per-request state for a passthrough command; a pointer to it is stored
 * in the ccb cookie while the command is in flight.
 */
struct nvme_pt_state {
	struct nvme_pt_command *pt;	/* request being executed */
	bool finished;			/* set by nvme_pt_done() */
};
959 1.35 jdolecek
960 1.1 nonaka static void
961 1.3 nonaka nvme_pt_fill(struct nvme_queue *q, struct nvme_ccb *ccb, void *slot)
962 1.3 nonaka {
963 1.3 nonaka struct nvme_softc *sc = q->q_sc;
964 1.3 nonaka struct nvme_sqe *sqe = slot;
965 1.35 jdolecek struct nvme_pt_state *state = ccb->ccb_cookie;
966 1.35 jdolecek struct nvme_pt_command *pt = state->pt;
967 1.3 nonaka bus_dmamap_t dmap = ccb->ccb_dmamap;
968 1.3 nonaka int i;
969 1.3 nonaka
970 1.3 nonaka sqe->opcode = pt->cmd.opcode;
971 1.3 nonaka htolem32(&sqe->nsid, pt->cmd.nsid);
972 1.3 nonaka
973 1.3 nonaka if (pt->buf != NULL && pt->len > 0) {
974 1.3 nonaka htolem64(&sqe->entry.prp[0], dmap->dm_segs[0].ds_addr);
975 1.3 nonaka switch (dmap->dm_nsegs) {
976 1.3 nonaka case 1:
977 1.3 nonaka break;
978 1.3 nonaka case 2:
979 1.3 nonaka htolem64(&sqe->entry.prp[1], dmap->dm_segs[1].ds_addr);
980 1.3 nonaka break;
981 1.3 nonaka default:
982 1.3 nonaka for (i = 1; i < dmap->dm_nsegs; i++) {
983 1.3 nonaka htolem64(&ccb->ccb_prpl[i - 1],
984 1.3 nonaka dmap->dm_segs[i].ds_addr);
985 1.3 nonaka }
986 1.3 nonaka bus_dmamap_sync(sc->sc_dmat,
987 1.3 nonaka NVME_DMA_MAP(q->q_ccb_prpls),
988 1.3 nonaka ccb->ccb_prpl_off,
989 1.16 nonaka sizeof(*ccb->ccb_prpl) * (dmap->dm_nsegs - 1),
990 1.3 nonaka BUS_DMASYNC_PREWRITE);
991 1.3 nonaka htolem64(&sqe->entry.prp[1], ccb->ccb_prpl_dva);
992 1.3 nonaka break;
993 1.3 nonaka }
994 1.3 nonaka }
995 1.3 nonaka
996 1.3 nonaka htolem32(&sqe->cdw10, pt->cmd.cdw10);
997 1.3 nonaka htolem32(&sqe->cdw11, pt->cmd.cdw11);
998 1.3 nonaka htolem32(&sqe->cdw12, pt->cmd.cdw12);
999 1.3 nonaka htolem32(&sqe->cdw13, pt->cmd.cdw13);
1000 1.3 nonaka htolem32(&sqe->cdw14, pt->cmd.cdw14);
1001 1.3 nonaka htolem32(&sqe->cdw15, pt->cmd.cdw15);
1002 1.3 nonaka }
1003 1.3 nonaka
1004 1.3 nonaka static void
1005 1.3 nonaka nvme_pt_done(struct nvme_queue *q, struct nvme_ccb *ccb, struct nvme_cqe *cqe)
1006 1.3 nonaka {
1007 1.3 nonaka struct nvme_softc *sc = q->q_sc;
1008 1.35 jdolecek struct nvme_pt_state *state = ccb->ccb_cookie;
1009 1.35 jdolecek struct nvme_pt_command *pt = state->pt;
1010 1.3 nonaka bus_dmamap_t dmap = ccb->ccb_dmamap;
1011 1.3 nonaka
1012 1.3 nonaka if (pt->buf != NULL && pt->len > 0) {
1013 1.3 nonaka if (dmap->dm_nsegs > 2) {
1014 1.3 nonaka bus_dmamap_sync(sc->sc_dmat,
1015 1.3 nonaka NVME_DMA_MAP(q->q_ccb_prpls),
1016 1.3 nonaka ccb->ccb_prpl_off,
1017 1.16 nonaka sizeof(*ccb->ccb_prpl) * (dmap->dm_nsegs - 1),
1018 1.3 nonaka BUS_DMASYNC_POSTWRITE);
1019 1.3 nonaka }
1020 1.3 nonaka
1021 1.3 nonaka bus_dmamap_sync(sc->sc_dmat, dmap, 0, dmap->dm_mapsize,
1022 1.3 nonaka pt->is_read ? BUS_DMASYNC_POSTREAD : BUS_DMASYNC_POSTWRITE);
1023 1.3 nonaka bus_dmamap_unload(sc->sc_dmat, dmap);
1024 1.3 nonaka }
1025 1.3 nonaka
1026 1.23 nonaka pt->cpl.cdw0 = lemtoh32(&cqe->cdw0);
1027 1.23 nonaka pt->cpl.flags = lemtoh16(&cqe->flags) & ~NVME_CQE_PHASE;
1028 1.35 jdolecek
1029 1.35 jdolecek state->finished = true;
1030 1.35 jdolecek
1031 1.35 jdolecek nvme_ccb_put(q, ccb);
1032 1.35 jdolecek }
1033 1.35 jdolecek
1034 1.35 jdolecek static bool
1035 1.35 jdolecek nvme_pt_finished(void *cookie)
1036 1.35 jdolecek {
1037 1.35 jdolecek struct nvme_pt_state *state = cookie;
1038 1.35 jdolecek
1039 1.35 jdolecek return state->finished;
1040 1.3 nonaka }
1041 1.3 nonaka
1042 1.3 nonaka static int
1043 1.3 nonaka nvme_command_passthrough(struct nvme_softc *sc, struct nvme_pt_command *pt,
1044 1.3 nonaka uint16_t nsid, struct lwp *l, bool is_adminq)
1045 1.3 nonaka {
1046 1.3 nonaka struct nvme_queue *q;
1047 1.3 nonaka struct nvme_ccb *ccb;
1048 1.3 nonaka void *buf = NULL;
1049 1.35 jdolecek struct nvme_pt_state state;
1050 1.3 nonaka int error;
1051 1.3 nonaka
1052 1.9 jdolecek /* limit command size to maximum data transfer size */
1053 1.3 nonaka if ((pt->buf == NULL && pt->len > 0) ||
1054 1.9 jdolecek (pt->buf != NULL && (pt->len == 0 || pt->len > sc->sc_mdts)))
1055 1.3 nonaka return EINVAL;
1056 1.3 nonaka
1057 1.3 nonaka q = is_adminq ? sc->sc_admin_q : nvme_get_q(sc);
1058 1.34 jdolecek ccb = nvme_ccb_get(q, true);
1059 1.34 jdolecek KASSERT(ccb != NULL);
1060 1.3 nonaka
1061 1.9 jdolecek if (pt->buf != NULL) {
1062 1.9 jdolecek KASSERT(pt->len > 0);
1063 1.3 nonaka buf = kmem_alloc(pt->len, KM_SLEEP);
1064 1.3 nonaka if (!pt->is_read) {
1065 1.3 nonaka error = copyin(pt->buf, buf, pt->len);
1066 1.3 nonaka if (error)
1067 1.3 nonaka goto kmem_free;
1068 1.3 nonaka }
1069 1.3 nonaka error = bus_dmamap_load(sc->sc_dmat, ccb->ccb_dmamap, buf,
1070 1.3 nonaka pt->len, NULL,
1071 1.3 nonaka BUS_DMA_WAITOK |
1072 1.3 nonaka (pt->is_read ? BUS_DMA_READ : BUS_DMA_WRITE));
1073 1.3 nonaka if (error)
1074 1.3 nonaka goto kmem_free;
1075 1.3 nonaka bus_dmamap_sync(sc->sc_dmat, ccb->ccb_dmamap,
1076 1.3 nonaka 0, ccb->ccb_dmamap->dm_mapsize,
1077 1.3 nonaka pt->is_read ? BUS_DMASYNC_PREREAD : BUS_DMASYNC_PREWRITE);
1078 1.3 nonaka }
1079 1.3 nonaka
1080 1.35 jdolecek memset(&state, 0, sizeof(state));
1081 1.35 jdolecek state.pt = pt;
1082 1.35 jdolecek state.finished = false;
1083 1.35 jdolecek
1084 1.3 nonaka ccb->ccb_done = nvme_pt_done;
1085 1.35 jdolecek ccb->ccb_cookie = &state;
1086 1.3 nonaka
1087 1.3 nonaka pt->cmd.nsid = nsid;
1088 1.35 jdolecek
1089 1.35 jdolecek nvme_q_submit(sc, q, ccb, nvme_pt_fill);
1090 1.35 jdolecek
1091 1.35 jdolecek /* wait for completion */
1092 1.35 jdolecek nvme_q_wait_complete(sc, q, nvme_pt_finished, &state);
1093 1.35 jdolecek KASSERT(state.finished);
1094 1.3 nonaka
1095 1.3 nonaka error = 0;
1096 1.35 jdolecek
1097 1.3 nonaka if (buf != NULL) {
1098 1.3 nonaka if (error == 0 && pt->is_read)
1099 1.3 nonaka error = copyout(buf, pt->buf, pt->len);
1100 1.3 nonaka kmem_free:
1101 1.3 nonaka kmem_free(buf, pt->len);
1102 1.3 nonaka }
1103 1.35 jdolecek
1104 1.3 nonaka return error;
1105 1.3 nonaka }
1106 1.3 nonaka
1107 1.3 nonaka static void
1108 1.1 nonaka nvme_q_submit(struct nvme_softc *sc, struct nvme_queue *q, struct nvme_ccb *ccb,
1109 1.1 nonaka void (*fill)(struct nvme_queue *, struct nvme_ccb *, void *))
1110 1.1 nonaka {
1111 1.1 nonaka struct nvme_sqe *sqe = NVME_DMA_KVA(q->q_sq_dmamem);
1112 1.1 nonaka uint32_t tail;
1113 1.1 nonaka
1114 1.1 nonaka mutex_enter(&q->q_sq_mtx);
1115 1.1 nonaka tail = q->q_sq_tail;
1116 1.1 nonaka if (++q->q_sq_tail >= q->q_entries)
1117 1.1 nonaka q->q_sq_tail = 0;
1118 1.1 nonaka
1119 1.1 nonaka sqe += tail;
1120 1.1 nonaka
1121 1.1 nonaka bus_dmamap_sync(sc->sc_dmat, NVME_DMA_MAP(q->q_sq_dmamem),
1122 1.1 nonaka sizeof(*sqe) * tail, sizeof(*sqe), BUS_DMASYNC_POSTWRITE);
1123 1.1 nonaka memset(sqe, 0, sizeof(*sqe));
1124 1.1 nonaka (*fill)(q, ccb, sqe);
1125 1.1 nonaka sqe->cid = ccb->ccb_id;
1126 1.1 nonaka bus_dmamap_sync(sc->sc_dmat, NVME_DMA_MAP(q->q_sq_dmamem),
1127 1.1 nonaka sizeof(*sqe) * tail, sizeof(*sqe), BUS_DMASYNC_PREWRITE);
1128 1.1 nonaka
1129 1.1 nonaka nvme_write4(sc, q->q_sqtdbl, q->q_sq_tail);
1130 1.1 nonaka mutex_exit(&q->q_sq_mtx);
1131 1.1 nonaka }
1132 1.1 nonaka
1133 1.1 nonaka struct nvme_poll_state {
1134 1.1 nonaka struct nvme_sqe s;
1135 1.1 nonaka struct nvme_cqe c;
1136 1.34 jdolecek void *cookie;
1137 1.34 jdolecek void (*done)(struct nvme_queue *, struct nvme_ccb *, struct nvme_cqe *);
1138 1.1 nonaka };
1139 1.1 nonaka
1140 1.1 nonaka static int
1141 1.1 nonaka nvme_poll(struct nvme_softc *sc, struct nvme_queue *q, struct nvme_ccb *ccb,
1142 1.7 jdolecek void (*fill)(struct nvme_queue *, struct nvme_ccb *, void *), int timo_sec)
1143 1.1 nonaka {
1144 1.1 nonaka struct nvme_poll_state state;
1145 1.1 nonaka uint16_t flags;
1146 1.7 jdolecek int step = 10;
1147 1.7 jdolecek int maxloop = timo_sec * 1000000 / step;
1148 1.7 jdolecek int error = 0;
1149 1.1 nonaka
1150 1.1 nonaka memset(&state, 0, sizeof(state));
1151 1.1 nonaka (*fill)(q, ccb, &state.s);
1152 1.1 nonaka
1153 1.34 jdolecek state.done = ccb->ccb_done;
1154 1.34 jdolecek state.cookie = ccb->ccb_cookie;
1155 1.1 nonaka
1156 1.1 nonaka ccb->ccb_done = nvme_poll_done;
1157 1.1 nonaka ccb->ccb_cookie = &state;
1158 1.1 nonaka
1159 1.1 nonaka nvme_q_submit(sc, q, ccb, nvme_poll_fill);
1160 1.1 nonaka while (!ISSET(state.c.flags, htole16(NVME_CQE_PHASE))) {
1161 1.1 nonaka if (nvme_q_complete(sc, q) == 0)
1162 1.7 jdolecek delay(step);
1163 1.1 nonaka
1164 1.7 jdolecek if (timo_sec >= 0 && --maxloop <= 0) {
1165 1.7 jdolecek error = ETIMEDOUT;
1166 1.7 jdolecek break;
1167 1.7 jdolecek }
1168 1.1 nonaka }
1169 1.1 nonaka
1170 1.7 jdolecek if (error == 0) {
1171 1.7 jdolecek flags = lemtoh16(&state.c.flags);
1172 1.7 jdolecek return flags & ~NVME_CQE_PHASE;
1173 1.7 jdolecek } else {
1174 1.34 jdolecek /*
1175 1.34 jdolecek * If it succeds later, it would hit ccb which will have been
1176 1.34 jdolecek * already reused for something else. Not good. Cross
1177 1.34 jdolecek * fingers and hope for best. XXX do controller reset?
1178 1.34 jdolecek */
1179 1.34 jdolecek aprint_error_dev(sc->sc_dev, "polled command timed out\n");
1180 1.34 jdolecek
1181 1.34 jdolecek /* Invoke the callback to clean state anyway */
1182 1.34 jdolecek struct nvme_cqe cqe;
1183 1.34 jdolecek memset(&cqe, 0, sizeof(cqe));
1184 1.34 jdolecek ccb->ccb_done(q, ccb, &cqe);
1185 1.34 jdolecek
1186 1.7 jdolecek return 1;
1187 1.7 jdolecek }
1188 1.1 nonaka }
1189 1.1 nonaka
1190 1.1 nonaka static void
1191 1.1 nonaka nvme_poll_fill(struct nvme_queue *q, struct nvme_ccb *ccb, void *slot)
1192 1.1 nonaka {
1193 1.1 nonaka struct nvme_sqe *sqe = slot;
1194 1.1 nonaka struct nvme_poll_state *state = ccb->ccb_cookie;
1195 1.1 nonaka
1196 1.1 nonaka *sqe = state->s;
1197 1.1 nonaka }
1198 1.1 nonaka
1199 1.1 nonaka static void
1200 1.1 nonaka nvme_poll_done(struct nvme_queue *q, struct nvme_ccb *ccb,
1201 1.1 nonaka struct nvme_cqe *cqe)
1202 1.1 nonaka {
1203 1.1 nonaka struct nvme_poll_state *state = ccb->ccb_cookie;
1204 1.1 nonaka
1205 1.1 nonaka SET(cqe->flags, htole16(NVME_CQE_PHASE));
1206 1.1 nonaka state->c = *cqe;
1207 1.34 jdolecek
1208 1.34 jdolecek ccb->ccb_cookie = state->cookie;
1209 1.34 jdolecek state->done(q, ccb, &state->c);
1210 1.1 nonaka }
1211 1.1 nonaka
1212 1.1 nonaka static void
1213 1.1 nonaka nvme_sqe_fill(struct nvme_queue *q, struct nvme_ccb *ccb, void *slot)
1214 1.1 nonaka {
1215 1.1 nonaka struct nvme_sqe *src = ccb->ccb_cookie;
1216 1.1 nonaka struct nvme_sqe *dst = slot;
1217 1.1 nonaka
1218 1.1 nonaka *dst = *src;
1219 1.1 nonaka }
1220 1.1 nonaka
/*
 * Completion handler that intentionally does nothing; used where the
 * submitter inspects the result and releases the ccb on its own.
 */
static void
nvme_empty_done(struct nvme_queue *q, struct nvme_ccb *ccb,
    struct nvme_cqe *cqe)
{
	/* nothing to do */
}
1226 1.1 nonaka
1227 1.1 nonaka static int
1228 1.1 nonaka nvme_q_complete(struct nvme_softc *sc, struct nvme_queue *q)
1229 1.1 nonaka {
1230 1.1 nonaka struct nvme_ccb *ccb;
1231 1.1 nonaka struct nvme_cqe *ring = NVME_DMA_KVA(q->q_cq_dmamem), *cqe;
1232 1.1 nonaka uint16_t flags;
1233 1.1 nonaka int rv = 0;
1234 1.1 nonaka
1235 1.9 jdolecek mutex_enter(&q->q_cq_mtx);
1236 1.1 nonaka
1237 1.1 nonaka nvme_dmamem_sync(sc, q->q_cq_dmamem, BUS_DMASYNC_POSTREAD);
1238 1.1 nonaka for (;;) {
1239 1.9 jdolecek cqe = &ring[q->q_cq_head];
1240 1.1 nonaka flags = lemtoh16(&cqe->flags);
1241 1.1 nonaka if ((flags & NVME_CQE_PHASE) != q->q_cq_phase)
1242 1.1 nonaka break;
1243 1.1 nonaka
1244 1.1 nonaka ccb = &q->q_ccbs[cqe->cid];
1245 1.1 nonaka
1246 1.9 jdolecek if (++q->q_cq_head >= q->q_entries) {
1247 1.9 jdolecek q->q_cq_head = 0;
1248 1.1 nonaka q->q_cq_phase ^= NVME_CQE_PHASE;
1249 1.1 nonaka }
1250 1.1 nonaka
1251 1.18 jdolecek #ifdef DEBUG
1252 1.18 jdolecek /*
1253 1.18 jdolecek * If we get spurious completion notification, something
1254 1.18 jdolecek * is seriously hosed up. Very likely DMA to some random
1255 1.18 jdolecek * memory place happened, so just bail out.
1256 1.18 jdolecek */
1257 1.18 jdolecek if ((intptr_t)ccb->ccb_cookie == NVME_CCB_FREE) {
1258 1.18 jdolecek panic("%s: invalid ccb detected",
1259 1.18 jdolecek device_xname(sc->sc_dev));
1260 1.18 jdolecek /* NOTREACHED */
1261 1.18 jdolecek }
1262 1.18 jdolecek #endif
1263 1.20 jdolecek
1264 1.20 jdolecek rv++;
1265 1.9 jdolecek
1266 1.9 jdolecek /*
1267 1.10 jdolecek * Unlock the mutex before calling the ccb_done callback
1268 1.9 jdolecek * and re-lock afterwards. The callback triggers lddone()
1269 1.9 jdolecek * which schedules another i/o, and also calls nvme_ccb_put().
1270 1.9 jdolecek * Unlock/relock avoids possibility of deadlock.
1271 1.9 jdolecek */
1272 1.9 jdolecek mutex_exit(&q->q_cq_mtx);
1273 1.9 jdolecek ccb->ccb_done(q, ccb, cqe);
1274 1.9 jdolecek mutex_enter(&q->q_cq_mtx);
1275 1.1 nonaka }
1276 1.1 nonaka nvme_dmamem_sync(sc, q->q_cq_dmamem, BUS_DMASYNC_PREREAD);
1277 1.1 nonaka
1278 1.1 nonaka if (rv)
1279 1.9 jdolecek nvme_write4(sc, q->q_cqhdbl, q->q_cq_head);
1280 1.9 jdolecek
1281 1.1 nonaka mutex_exit(&q->q_cq_mtx);
1282 1.1 nonaka
1283 1.1 nonaka return rv;
1284 1.1 nonaka }
1285 1.1 nonaka
1286 1.34 jdolecek static void
1287 1.34 jdolecek nvme_q_wait_complete(struct nvme_softc *sc,
1288 1.34 jdolecek struct nvme_queue *q, bool (*finished)(void *), void *cookie)
1289 1.34 jdolecek {
1290 1.34 jdolecek mutex_enter(&q->q_ccb_mtx);
1291 1.34 jdolecek if (finished(cookie))
1292 1.34 jdolecek goto out;
1293 1.34 jdolecek
1294 1.34 jdolecek for(;;) {
1295 1.34 jdolecek q->q_ccb_waiting = true;
1296 1.34 jdolecek cv_wait(&q->q_ccb_wait, &q->q_ccb_mtx);
1297 1.34 jdolecek
1298 1.34 jdolecek if (finished(cookie))
1299 1.34 jdolecek break;
1300 1.34 jdolecek }
1301 1.34 jdolecek
1302 1.34 jdolecek out:
1303 1.34 jdolecek mutex_exit(&q->q_ccb_mtx);
1304 1.34 jdolecek }
1305 1.34 jdolecek
1306 1.1 nonaka static int
1307 1.1 nonaka nvme_identify(struct nvme_softc *sc, u_int mps)
1308 1.1 nonaka {
1309 1.1 nonaka char sn[41], mn[81], fr[17];
1310 1.1 nonaka struct nvm_identify_controller *identify;
1311 1.19 jdolecek struct nvme_dmamem *mem;
1312 1.1 nonaka struct nvme_ccb *ccb;
1313 1.1 nonaka u_int mdts;
1314 1.19 jdolecek int rv = 1;
1315 1.1 nonaka
1316 1.34 jdolecek ccb = nvme_ccb_get(sc->sc_admin_q, false);
1317 1.11 jdolecek KASSERT(ccb != NULL); /* it's a bug if we don't have spare ccb here */
1318 1.1 nonaka
1319 1.19 jdolecek mem = nvme_dmamem_alloc(sc, sizeof(*identify));
1320 1.19 jdolecek if (mem == NULL)
1321 1.19 jdolecek return 1;
1322 1.1 nonaka
1323 1.1 nonaka ccb->ccb_done = nvme_empty_done;
1324 1.19 jdolecek ccb->ccb_cookie = mem;
1325 1.1 nonaka
1326 1.1 nonaka nvme_dmamem_sync(sc, mem, BUS_DMASYNC_PREREAD);
1327 1.19 jdolecek rv = nvme_poll(sc, sc->sc_admin_q, ccb, nvme_fill_identify,
1328 1.7 jdolecek NVME_TIMO_IDENT);
1329 1.1 nonaka nvme_dmamem_sync(sc, mem, BUS_DMASYNC_POSTREAD);
1330 1.1 nonaka
1331 1.1 nonaka nvme_ccb_put(sc->sc_admin_q, ccb);
1332 1.1 nonaka
1333 1.19 jdolecek if (rv != 0)
1334 1.1 nonaka goto done;
1335 1.1 nonaka
1336 1.1 nonaka identify = NVME_DMA_KVA(mem);
1337 1.1 nonaka
1338 1.2 christos strnvisx(sn, sizeof(sn), (const char *)identify->sn,
1339 1.2 christos sizeof(identify->sn), VIS_TRIM|VIS_SAFE|VIS_OCTAL);
1340 1.2 christos strnvisx(mn, sizeof(mn), (const char *)identify->mn,
1341 1.2 christos sizeof(identify->mn), VIS_TRIM|VIS_SAFE|VIS_OCTAL);
1342 1.2 christos strnvisx(fr, sizeof(fr), (const char *)identify->fr,
1343 1.2 christos sizeof(identify->fr), VIS_TRIM|VIS_SAFE|VIS_OCTAL);
1344 1.1 nonaka aprint_normal_dev(sc->sc_dev, "%s, firmware %s, serial %s\n", mn, fr,
1345 1.1 nonaka sn);
1346 1.1 nonaka
1347 1.1 nonaka if (identify->mdts > 0) {
1348 1.1 nonaka mdts = (1 << identify->mdts) * (1 << mps);
1349 1.1 nonaka if (mdts < sc->sc_mdts)
1350 1.1 nonaka sc->sc_mdts = mdts;
1351 1.1 nonaka }
1352 1.1 nonaka
1353 1.1 nonaka sc->sc_nn = lemtoh32(&identify->nn);
1354 1.1 nonaka
1355 1.1 nonaka memcpy(&sc->sc_identify, identify, sizeof(sc->sc_identify));
1356 1.1 nonaka
1357 1.1 nonaka done:
1358 1.19 jdolecek nvme_dmamem_free(sc, mem);
1359 1.1 nonaka
1360 1.19 jdolecek return rv;
1361 1.1 nonaka }
1362 1.1 nonaka
1363 1.1 nonaka static int
1364 1.1 nonaka nvme_q_create(struct nvme_softc *sc, struct nvme_queue *q)
1365 1.1 nonaka {
1366 1.1 nonaka struct nvme_sqe_q sqe;
1367 1.1 nonaka struct nvme_ccb *ccb;
1368 1.1 nonaka int rv;
1369 1.1 nonaka
1370 1.9 jdolecek if (sc->sc_use_mq && sc->sc_intr_establish(sc, q->q_id, q) != 0)
1371 1.1 nonaka return 1;
1372 1.1 nonaka
1373 1.34 jdolecek ccb = nvme_ccb_get(sc->sc_admin_q, false);
1374 1.1 nonaka KASSERT(ccb != NULL);
1375 1.1 nonaka
1376 1.1 nonaka ccb->ccb_done = nvme_empty_done;
1377 1.1 nonaka ccb->ccb_cookie = &sqe;
1378 1.1 nonaka
1379 1.1 nonaka memset(&sqe, 0, sizeof(sqe));
1380 1.1 nonaka sqe.opcode = NVM_ADMIN_ADD_IOCQ;
1381 1.1 nonaka htolem64(&sqe.prp1, NVME_DMA_DVA(q->q_cq_dmamem));
1382 1.1 nonaka htolem16(&sqe.qsize, q->q_entries - 1);
1383 1.1 nonaka htolem16(&sqe.qid, q->q_id);
1384 1.1 nonaka sqe.qflags = NVM_SQE_CQ_IEN | NVM_SQE_Q_PC;
1385 1.1 nonaka if (sc->sc_use_mq)
1386 1.1 nonaka htolem16(&sqe.cqid, q->q_id); /* qid == vector */
1387 1.1 nonaka
1388 1.7 jdolecek rv = nvme_poll(sc, sc->sc_admin_q, ccb, nvme_sqe_fill, NVME_TIMO_QOP);
1389 1.1 nonaka if (rv != 0)
1390 1.1 nonaka goto fail;
1391 1.1 nonaka
1392 1.1 nonaka ccb->ccb_done = nvme_empty_done;
1393 1.1 nonaka ccb->ccb_cookie = &sqe;
1394 1.1 nonaka
1395 1.1 nonaka memset(&sqe, 0, sizeof(sqe));
1396 1.1 nonaka sqe.opcode = NVM_ADMIN_ADD_IOSQ;
1397 1.1 nonaka htolem64(&sqe.prp1, NVME_DMA_DVA(q->q_sq_dmamem));
1398 1.1 nonaka htolem16(&sqe.qsize, q->q_entries - 1);
1399 1.1 nonaka htolem16(&sqe.qid, q->q_id);
1400 1.1 nonaka htolem16(&sqe.cqid, q->q_id);
1401 1.1 nonaka sqe.qflags = NVM_SQE_Q_PC;
1402 1.1 nonaka
1403 1.7 jdolecek rv = nvme_poll(sc, sc->sc_admin_q, ccb, nvme_sqe_fill, NVME_TIMO_QOP);
1404 1.1 nonaka if (rv != 0)
1405 1.1 nonaka goto fail;
1406 1.1 nonaka
1407 1.1 nonaka fail:
1408 1.1 nonaka nvme_ccb_put(sc->sc_admin_q, ccb);
1409 1.1 nonaka return rv;
1410 1.1 nonaka }
1411 1.1 nonaka
1412 1.1 nonaka static int
1413 1.1 nonaka nvme_q_delete(struct nvme_softc *sc, struct nvme_queue *q)
1414 1.1 nonaka {
1415 1.1 nonaka struct nvme_sqe_q sqe;
1416 1.1 nonaka struct nvme_ccb *ccb;
1417 1.1 nonaka int rv;
1418 1.1 nonaka
1419 1.34 jdolecek ccb = nvme_ccb_get(sc->sc_admin_q, false);
1420 1.1 nonaka KASSERT(ccb != NULL);
1421 1.1 nonaka
1422 1.1 nonaka ccb->ccb_done = nvme_empty_done;
1423 1.1 nonaka ccb->ccb_cookie = &sqe;
1424 1.1 nonaka
1425 1.1 nonaka memset(&sqe, 0, sizeof(sqe));
1426 1.1 nonaka sqe.opcode = NVM_ADMIN_DEL_IOSQ;
1427 1.1 nonaka htolem16(&sqe.qid, q->q_id);
1428 1.1 nonaka
1429 1.7 jdolecek rv = nvme_poll(sc, sc->sc_admin_q, ccb, nvme_sqe_fill, NVME_TIMO_QOP);
1430 1.1 nonaka if (rv != 0)
1431 1.1 nonaka goto fail;
1432 1.1 nonaka
1433 1.1 nonaka ccb->ccb_done = nvme_empty_done;
1434 1.1 nonaka ccb->ccb_cookie = &sqe;
1435 1.1 nonaka
1436 1.1 nonaka memset(&sqe, 0, sizeof(sqe));
1437 1.1 nonaka sqe.opcode = NVM_ADMIN_DEL_IOCQ;
1438 1.1 nonaka htolem16(&sqe.qid, q->q_id);
1439 1.1 nonaka
1440 1.7 jdolecek rv = nvme_poll(sc, sc->sc_admin_q, ccb, nvme_sqe_fill, NVME_TIMO_QOP);
1441 1.1 nonaka if (rv != 0)
1442 1.1 nonaka goto fail;
1443 1.1 nonaka
1444 1.1 nonaka fail:
1445 1.1 nonaka nvme_ccb_put(sc->sc_admin_q, ccb);
1446 1.1 nonaka
1447 1.1 nonaka if (rv == 0 && sc->sc_use_mq) {
1448 1.1 nonaka if (sc->sc_intr_disestablish(sc, q->q_id))
1449 1.1 nonaka rv = 1;
1450 1.1 nonaka }
1451 1.1 nonaka
1452 1.1 nonaka return rv;
1453 1.1 nonaka }
1454 1.1 nonaka
1455 1.1 nonaka static void
1456 1.1 nonaka nvme_fill_identify(struct nvme_queue *q, struct nvme_ccb *ccb, void *slot)
1457 1.1 nonaka {
1458 1.1 nonaka struct nvme_sqe *sqe = slot;
1459 1.1 nonaka struct nvme_dmamem *mem = ccb->ccb_cookie;
1460 1.1 nonaka
1461 1.1 nonaka sqe->opcode = NVM_ADMIN_IDENTIFY;
1462 1.19 jdolecek htolem64(&sqe->entry.prp[0], NVME_DMA_DVA(mem));
1463 1.1 nonaka htolem32(&sqe->cdw10, 1);
1464 1.1 nonaka }
1465 1.1 nonaka
1466 1.1 nonaka static int
1467 1.23 nonaka nvme_get_number_of_queues(struct nvme_softc *sc, u_int *nqap)
1468 1.23 nonaka {
1469 1.36 jdolecek struct nvme_pt_state state;
1470 1.23 nonaka struct nvme_pt_command pt;
1471 1.23 nonaka struct nvme_ccb *ccb;
1472 1.23 nonaka uint16_t ncqa, nsqa;
1473 1.23 nonaka int rv;
1474 1.23 nonaka
1475 1.34 jdolecek ccb = nvme_ccb_get(sc->sc_admin_q, false);
1476 1.23 nonaka KASSERT(ccb != NULL); /* it's a bug if we don't have spare ccb here */
1477 1.23 nonaka
1478 1.23 nonaka memset(&pt, 0, sizeof(pt));
1479 1.23 nonaka pt.cmd.opcode = NVM_ADMIN_GET_FEATURES;
1480 1.25 jdolecek pt.cmd.cdw10 = NVM_FEATURE_NUMBER_OF_QUEUES;
1481 1.23 nonaka
1482 1.36 jdolecek memset(&state, 0, sizeof(state));
1483 1.36 jdolecek state.pt = &pt;
1484 1.36 jdolecek state.finished = false;
1485 1.36 jdolecek
1486 1.23 nonaka ccb->ccb_done = nvme_pt_done;
1487 1.36 jdolecek ccb->ccb_cookie = &state;
1488 1.23 nonaka
1489 1.23 nonaka rv = nvme_poll(sc, sc->sc_admin_q, ccb, nvme_pt_fill, NVME_TIMO_QOP);
1490 1.23 nonaka
1491 1.23 nonaka if (rv != 0) {
1492 1.23 nonaka *nqap = 0;
1493 1.23 nonaka return EIO;
1494 1.23 nonaka }
1495 1.23 nonaka
1496 1.23 nonaka ncqa = pt.cpl.cdw0 >> 16;
1497 1.23 nonaka nsqa = pt.cpl.cdw0 & 0xffff;
1498 1.23 nonaka *nqap = MIN(ncqa, nsqa) + 1;
1499 1.23 nonaka
1500 1.23 nonaka return 0;
1501 1.23 nonaka }
1502 1.23 nonaka
1503 1.23 nonaka static int
1504 1.20 jdolecek nvme_ccbs_alloc(struct nvme_queue *q, uint16_t nccbs)
1505 1.1 nonaka {
1506 1.1 nonaka struct nvme_softc *sc = q->q_sc;
1507 1.1 nonaka struct nvme_ccb *ccb;
1508 1.1 nonaka bus_addr_t off;
1509 1.1 nonaka uint64_t *prpl;
1510 1.1 nonaka u_int i;
1511 1.1 nonaka
1512 1.1 nonaka mutex_init(&q->q_ccb_mtx, MUTEX_DEFAULT, IPL_BIO);
1513 1.34 jdolecek cv_init(&q->q_ccb_wait, "nvmeqw");
1514 1.34 jdolecek q->q_ccb_waiting = false;
1515 1.1 nonaka SIMPLEQ_INIT(&q->q_ccb_list);
1516 1.1 nonaka
1517 1.1 nonaka q->q_ccbs = kmem_alloc(sizeof(*ccb) * nccbs, KM_SLEEP);
1518 1.1 nonaka
1519 1.1 nonaka q->q_nccbs = nccbs;
1520 1.19 jdolecek q->q_ccb_prpls = nvme_dmamem_alloc(sc,
1521 1.19 jdolecek sizeof(*prpl) * sc->sc_max_sgl * nccbs);
1522 1.1 nonaka
1523 1.1 nonaka prpl = NVME_DMA_KVA(q->q_ccb_prpls);
1524 1.1 nonaka off = 0;
1525 1.1 nonaka
1526 1.1 nonaka for (i = 0; i < nccbs; i++) {
1527 1.1 nonaka ccb = &q->q_ccbs[i];
1528 1.1 nonaka
1529 1.1 nonaka if (bus_dmamap_create(sc->sc_dmat, sc->sc_mdts,
1530 1.1 nonaka sc->sc_max_sgl + 1 /* we get a free prp in the sqe */,
1531 1.1 nonaka sc->sc_mps, sc->sc_mps, BUS_DMA_WAITOK | BUS_DMA_ALLOCNOW,
1532 1.1 nonaka &ccb->ccb_dmamap) != 0)
1533 1.1 nonaka goto free_maps;
1534 1.1 nonaka
1535 1.1 nonaka ccb->ccb_id = i;
1536 1.1 nonaka ccb->ccb_prpl = prpl;
1537 1.1 nonaka ccb->ccb_prpl_off = off;
1538 1.1 nonaka ccb->ccb_prpl_dva = NVME_DMA_DVA(q->q_ccb_prpls) + off;
1539 1.1 nonaka
1540 1.1 nonaka SIMPLEQ_INSERT_TAIL(&q->q_ccb_list, ccb, ccb_entry);
1541 1.1 nonaka
1542 1.1 nonaka prpl += sc->sc_max_sgl;
1543 1.1 nonaka off += sizeof(*prpl) * sc->sc_max_sgl;
1544 1.1 nonaka }
1545 1.1 nonaka
1546 1.1 nonaka return 0;
1547 1.1 nonaka
1548 1.1 nonaka free_maps:
1549 1.1 nonaka nvme_ccbs_free(q);
1550 1.1 nonaka return 1;
1551 1.1 nonaka }
1552 1.1 nonaka
1553 1.1 nonaka static struct nvme_ccb *
1554 1.34 jdolecek nvme_ccb_get(struct nvme_queue *q, bool wait)
1555 1.1 nonaka {
1556 1.20 jdolecek struct nvme_ccb *ccb = NULL;
1557 1.1 nonaka
1558 1.1 nonaka mutex_enter(&q->q_ccb_mtx);
1559 1.34 jdolecek again:
1560 1.33 jdolecek ccb = SIMPLEQ_FIRST(&q->q_ccb_list);
1561 1.33 jdolecek if (ccb != NULL) {
1562 1.1 nonaka SIMPLEQ_REMOVE_HEAD(&q->q_ccb_list, ccb_entry);
1563 1.18 jdolecek #ifdef DEBUG
1564 1.18 jdolecek ccb->ccb_cookie = NULL;
1565 1.18 jdolecek #endif
1566 1.34 jdolecek } else {
1567 1.34 jdolecek if (__predict_false(wait)) {
1568 1.34 jdolecek q->q_ccb_waiting = true;
1569 1.34 jdolecek cv_wait(&q->q_ccb_wait, &q->q_ccb_mtx);
1570 1.34 jdolecek goto again;
1571 1.34 jdolecek }
1572 1.18 jdolecek }
1573 1.1 nonaka mutex_exit(&q->q_ccb_mtx);
1574 1.1 nonaka
1575 1.1 nonaka return ccb;
1576 1.1 nonaka }
1577 1.1 nonaka
1578 1.1 nonaka static void
1579 1.1 nonaka nvme_ccb_put(struct nvme_queue *q, struct nvme_ccb *ccb)
1580 1.1 nonaka {
1581 1.1 nonaka
1582 1.1 nonaka mutex_enter(&q->q_ccb_mtx);
1583 1.18 jdolecek #ifdef DEBUG
1584 1.18 jdolecek ccb->ccb_cookie = (void *)NVME_CCB_FREE;
1585 1.18 jdolecek #endif
1586 1.1 nonaka SIMPLEQ_INSERT_HEAD(&q->q_ccb_list, ccb, ccb_entry);
1587 1.34 jdolecek
1588 1.34 jdolecek /* It's unlikely there are any waiters, it's not used for regular I/O */
1589 1.34 jdolecek if (__predict_false(q->q_ccb_waiting)) {
1590 1.34 jdolecek q->q_ccb_waiting = false;
1591 1.34 jdolecek cv_broadcast(&q->q_ccb_wait);
1592 1.34 jdolecek }
1593 1.34 jdolecek
1594 1.1 nonaka mutex_exit(&q->q_ccb_mtx);
1595 1.1 nonaka }
1596 1.1 nonaka
1597 1.1 nonaka static void
1598 1.1 nonaka nvme_ccbs_free(struct nvme_queue *q)
1599 1.1 nonaka {
1600 1.1 nonaka struct nvme_softc *sc = q->q_sc;
1601 1.1 nonaka struct nvme_ccb *ccb;
1602 1.1 nonaka
1603 1.1 nonaka mutex_enter(&q->q_ccb_mtx);
1604 1.1 nonaka while ((ccb = SIMPLEQ_FIRST(&q->q_ccb_list)) != NULL) {
1605 1.1 nonaka SIMPLEQ_REMOVE_HEAD(&q->q_ccb_list, ccb_entry);
1606 1.1 nonaka bus_dmamap_destroy(sc->sc_dmat, ccb->ccb_dmamap);
1607 1.1 nonaka }
1608 1.1 nonaka mutex_exit(&q->q_ccb_mtx);
1609 1.1 nonaka
1610 1.19 jdolecek nvme_dmamem_free(sc, q->q_ccb_prpls);
1611 1.1 nonaka kmem_free(q->q_ccbs, sizeof(*ccb) * q->q_nccbs);
1612 1.1 nonaka q->q_ccbs = NULL;
1613 1.34 jdolecek cv_destroy(&q->q_ccb_wait);
1614 1.1 nonaka mutex_destroy(&q->q_ccb_mtx);
1615 1.1 nonaka }
1616 1.1 nonaka
1617 1.1 nonaka static struct nvme_queue *
1618 1.1 nonaka nvme_q_alloc(struct nvme_softc *sc, uint16_t id, u_int entries, u_int dstrd)
1619 1.1 nonaka {
1620 1.1 nonaka struct nvme_queue *q;
1621 1.1 nonaka
1622 1.1 nonaka q = kmem_alloc(sizeof(*q), KM_SLEEP);
1623 1.1 nonaka q->q_sc = sc;
1624 1.19 jdolecek q->q_sq_dmamem = nvme_dmamem_alloc(sc,
1625 1.19 jdolecek sizeof(struct nvme_sqe) * entries);
1626 1.19 jdolecek if (q->q_sq_dmamem == NULL)
1627 1.1 nonaka goto free;
1628 1.1 nonaka
1629 1.19 jdolecek q->q_cq_dmamem = nvme_dmamem_alloc(sc,
1630 1.19 jdolecek sizeof(struct nvme_cqe) * entries);
1631 1.19 jdolecek if (q->q_cq_dmamem == NULL)
1632 1.1 nonaka goto free_sq;
1633 1.1 nonaka
1634 1.1 nonaka memset(NVME_DMA_KVA(q->q_sq_dmamem), 0, NVME_DMA_LEN(q->q_sq_dmamem));
1635 1.1 nonaka memset(NVME_DMA_KVA(q->q_cq_dmamem), 0, NVME_DMA_LEN(q->q_cq_dmamem));
1636 1.1 nonaka
1637 1.1 nonaka mutex_init(&q->q_sq_mtx, MUTEX_DEFAULT, IPL_BIO);
1638 1.1 nonaka mutex_init(&q->q_cq_mtx, MUTEX_DEFAULT, IPL_BIO);
1639 1.1 nonaka q->q_sqtdbl = NVME_SQTDBL(id, dstrd);
1640 1.1 nonaka q->q_cqhdbl = NVME_CQHDBL(id, dstrd);
1641 1.1 nonaka q->q_id = id;
1642 1.1 nonaka q->q_entries = entries;
1643 1.1 nonaka q->q_sq_tail = 0;
1644 1.1 nonaka q->q_cq_head = 0;
1645 1.1 nonaka q->q_cq_phase = NVME_CQE_PHASE;
1646 1.1 nonaka
1647 1.1 nonaka nvme_dmamem_sync(sc, q->q_sq_dmamem, BUS_DMASYNC_PREWRITE);
1648 1.1 nonaka nvme_dmamem_sync(sc, q->q_cq_dmamem, BUS_DMASYNC_PREREAD);
1649 1.1 nonaka
1650 1.20 jdolecek /*
1651 1.20 jdolecek * Due to definition of full and empty queue (queue is empty
1652 1.20 jdolecek * when head == tail, full when tail is one less then head),
1653 1.20 jdolecek * we can actually only have (entries - 1) in-flight commands.
1654 1.20 jdolecek */
1655 1.20 jdolecek if (nvme_ccbs_alloc(q, entries - 1) != 0) {
1656 1.1 nonaka aprint_error_dev(sc->sc_dev, "unable to allocate ccbs\n");
1657 1.1 nonaka goto free_cq;
1658 1.1 nonaka }
1659 1.1 nonaka
1660 1.1 nonaka return q;
1661 1.1 nonaka
1662 1.1 nonaka free_cq:
1663 1.19 jdolecek nvme_dmamem_free(sc, q->q_cq_dmamem);
1664 1.1 nonaka free_sq:
1665 1.19 jdolecek nvme_dmamem_free(sc, q->q_sq_dmamem);
1666 1.1 nonaka free:
1667 1.1 nonaka kmem_free(q, sizeof(*q));
1668 1.1 nonaka
1669 1.1 nonaka return NULL;
1670 1.1 nonaka }
1671 1.1 nonaka
1672 1.1 nonaka static void
1673 1.1 nonaka nvme_q_free(struct nvme_softc *sc, struct nvme_queue *q)
1674 1.1 nonaka {
1675 1.1 nonaka nvme_ccbs_free(q);
1676 1.9 jdolecek mutex_destroy(&q->q_sq_mtx);
1677 1.9 jdolecek mutex_destroy(&q->q_cq_mtx);
1678 1.1 nonaka nvme_dmamem_sync(sc, q->q_cq_dmamem, BUS_DMASYNC_POSTREAD);
1679 1.1 nonaka nvme_dmamem_sync(sc, q->q_sq_dmamem, BUS_DMASYNC_POSTWRITE);
1680 1.19 jdolecek nvme_dmamem_free(sc, q->q_cq_dmamem);
1681 1.19 jdolecek nvme_dmamem_free(sc, q->q_sq_dmamem);
1682 1.1 nonaka kmem_free(q, sizeof(*q));
1683 1.1 nonaka }
1684 1.1 nonaka
1685 1.1 nonaka int
1686 1.1 nonaka nvme_intr(void *xsc)
1687 1.1 nonaka {
1688 1.1 nonaka struct nvme_softc *sc = xsc;
1689 1.1 nonaka
1690 1.10 jdolecek /*
1691 1.10 jdolecek * INTx is level triggered, controller deasserts the interrupt only
1692 1.10 jdolecek * when we advance command queue head via write to the doorbell.
1693 1.17 jdolecek * Tell the controller to block the interrupts while we process
1694 1.17 jdolecek * the queue(s).
1695 1.10 jdolecek */
1696 1.17 jdolecek nvme_write4(sc, NVME_INTMS, 1);
1697 1.17 jdolecek
1698 1.17 jdolecek softint_schedule(sc->sc_softih[0]);
1699 1.17 jdolecek
1700 1.17 jdolecek /* don't know, might not have been for us */
1701 1.17 jdolecek return 1;
1702 1.17 jdolecek }
1703 1.17 jdolecek
1704 1.17 jdolecek void
1705 1.17 jdolecek nvme_softintr_intx(void *xq)
1706 1.17 jdolecek {
1707 1.17 jdolecek struct nvme_queue *q = xq;
1708 1.17 jdolecek struct nvme_softc *sc = q->q_sc;
1709 1.17 jdolecek
1710 1.17 jdolecek nvme_q_complete(sc, sc->sc_admin_q);
1711 1.1 nonaka if (sc->sc_q != NULL)
1712 1.17 jdolecek nvme_q_complete(sc, sc->sc_q[0]);
1713 1.1 nonaka
1714 1.17 jdolecek /*
1715 1.17 jdolecek * Processing done, tell controller to issue interrupts again. There
1716 1.17 jdolecek * is no race, as NVMe spec requires the controller to maintain state,
1717 1.17 jdolecek * and assert the interrupt whenever there are unacknowledged
1718 1.17 jdolecek * completion queue entries.
1719 1.17 jdolecek */
1720 1.17 jdolecek nvme_write4(sc, NVME_INTMC, 1);
1721 1.1 nonaka }
1722 1.1 nonaka
1723 1.1 nonaka int
1724 1.9 jdolecek nvme_intr_msi(void *xq)
1725 1.1 nonaka {
1726 1.1 nonaka struct nvme_queue *q = xq;
1727 1.1 nonaka
1728 1.9 jdolecek KASSERT(q && q->q_sc && q->q_sc->sc_softih
1729 1.9 jdolecek && q->q_sc->sc_softih[q->q_id]);
1730 1.1 nonaka
1731 1.17 jdolecek /*
1732 1.17 jdolecek * MSI/MSI-X are edge triggered, so can handover processing to softint
1733 1.17 jdolecek * without masking the interrupt.
1734 1.17 jdolecek */
1735 1.9 jdolecek softint_schedule(q->q_sc->sc_softih[q->q_id]);
1736 1.1 nonaka
1737 1.9 jdolecek return 1;
1738 1.1 nonaka }
1739 1.1 nonaka
1740 1.9 jdolecek void
1741 1.9 jdolecek nvme_softintr_msi(void *xq)
1742 1.1 nonaka {
1743 1.1 nonaka struct nvme_queue *q = xq;
1744 1.9 jdolecek struct nvme_softc *sc = q->q_sc;
1745 1.1 nonaka
1746 1.9 jdolecek nvme_q_complete(sc, q);
1747 1.1 nonaka }
1748 1.1 nonaka
1749 1.19 jdolecek static struct nvme_dmamem *
1750 1.19 jdolecek nvme_dmamem_alloc(struct nvme_softc *sc, size_t size)
1751 1.1 nonaka {
1752 1.19 jdolecek struct nvme_dmamem *ndm;
1753 1.1 nonaka int nsegs;
1754 1.1 nonaka
1755 1.19 jdolecek ndm = kmem_zalloc(sizeof(*ndm), KM_SLEEP);
1756 1.19 jdolecek if (ndm == NULL)
1757 1.19 jdolecek return NULL;
1758 1.19 jdolecek
1759 1.1 nonaka ndm->ndm_size = size;
1760 1.1 nonaka
1761 1.1 nonaka if (bus_dmamap_create(sc->sc_dmat, size, 1, size, 0,
1762 1.1 nonaka BUS_DMA_WAITOK | BUS_DMA_ALLOCNOW, &ndm->ndm_map) != 0)
1763 1.1 nonaka goto ndmfree;
1764 1.1 nonaka
1765 1.1 nonaka if (bus_dmamem_alloc(sc->sc_dmat, size, sc->sc_mps, 0, &ndm->ndm_seg,
1766 1.1 nonaka 1, &nsegs, BUS_DMA_WAITOK) != 0)
1767 1.1 nonaka goto destroy;
1768 1.1 nonaka
1769 1.1 nonaka if (bus_dmamem_map(sc->sc_dmat, &ndm->ndm_seg, nsegs, size,
1770 1.1 nonaka &ndm->ndm_kva, BUS_DMA_WAITOK) != 0)
1771 1.1 nonaka goto free;
1772 1.1 nonaka memset(ndm->ndm_kva, 0, size);
1773 1.1 nonaka
1774 1.1 nonaka if (bus_dmamap_load(sc->sc_dmat, ndm->ndm_map, ndm->ndm_kva, size,
1775 1.1 nonaka NULL, BUS_DMA_WAITOK) != 0)
1776 1.1 nonaka goto unmap;
1777 1.1 nonaka
1778 1.19 jdolecek return ndm;
1779 1.1 nonaka
1780 1.1 nonaka unmap:
1781 1.1 nonaka bus_dmamem_unmap(sc->sc_dmat, ndm->ndm_kva, size);
1782 1.1 nonaka free:
1783 1.1 nonaka bus_dmamem_free(sc->sc_dmat, &ndm->ndm_seg, 1);
1784 1.1 nonaka destroy:
1785 1.1 nonaka bus_dmamap_destroy(sc->sc_dmat, ndm->ndm_map);
1786 1.1 nonaka ndmfree:
1787 1.19 jdolecek kmem_free(ndm, sizeof(*ndm));
1788 1.19 jdolecek return NULL;
1789 1.19 jdolecek }
1790 1.19 jdolecek
1791 1.19 jdolecek static void
1792 1.19 jdolecek nvme_dmamem_sync(struct nvme_softc *sc, struct nvme_dmamem *mem, int ops)
1793 1.19 jdolecek {
1794 1.19 jdolecek bus_dmamap_sync(sc->sc_dmat, NVME_DMA_MAP(mem),
1795 1.19 jdolecek 0, NVME_DMA_LEN(mem), ops);
1796 1.1 nonaka }
1797 1.1 nonaka
1798 1.1 nonaka void
1799 1.1 nonaka nvme_dmamem_free(struct nvme_softc *sc, struct nvme_dmamem *ndm)
1800 1.1 nonaka {
1801 1.1 nonaka bus_dmamap_unload(sc->sc_dmat, ndm->ndm_map);
1802 1.1 nonaka bus_dmamem_unmap(sc->sc_dmat, ndm->ndm_kva, ndm->ndm_size);
1803 1.1 nonaka bus_dmamem_free(sc->sc_dmat, &ndm->ndm_seg, 1);
1804 1.1 nonaka bus_dmamap_destroy(sc->sc_dmat, ndm->ndm_map);
1805 1.19 jdolecek kmem_free(ndm, sizeof(*ndm));
1806 1.1 nonaka }
1807 1.3 nonaka
1808 1.3 nonaka /*
1809 1.3 nonaka * ioctl
1810 1.3 nonaka */
1811 1.3 nonaka
1812 1.3 nonaka dev_type_open(nvmeopen);
1813 1.3 nonaka dev_type_close(nvmeclose);
1814 1.3 nonaka dev_type_ioctl(nvmeioctl);
1815 1.3 nonaka
1816 1.3 nonaka const struct cdevsw nvme_cdevsw = {
1817 1.3 nonaka .d_open = nvmeopen,
1818 1.3 nonaka .d_close = nvmeclose,
1819 1.3 nonaka .d_read = noread,
1820 1.3 nonaka .d_write = nowrite,
1821 1.3 nonaka .d_ioctl = nvmeioctl,
1822 1.3 nonaka .d_stop = nostop,
1823 1.3 nonaka .d_tty = notty,
1824 1.3 nonaka .d_poll = nopoll,
1825 1.3 nonaka .d_mmap = nommap,
1826 1.3 nonaka .d_kqfilter = nokqfilter,
1827 1.3 nonaka .d_discard = nodiscard,
1828 1.3 nonaka .d_flag = D_OTHER,
1829 1.3 nonaka };
1830 1.3 nonaka
1831 1.3 nonaka /*
1832 1.3 nonaka * Accept an open operation on the control device.
1833 1.3 nonaka */
1834 1.3 nonaka int
1835 1.3 nonaka nvmeopen(dev_t dev, int flag, int mode, struct lwp *l)
1836 1.3 nonaka {
1837 1.3 nonaka struct nvme_softc *sc;
1838 1.3 nonaka int unit = minor(dev) / 0x10000;
1839 1.3 nonaka int nsid = minor(dev) & 0xffff;
1840 1.3 nonaka int nsidx;
1841 1.3 nonaka
1842 1.3 nonaka if ((sc = device_lookup_private(&nvme_cd, unit)) == NULL)
1843 1.3 nonaka return ENXIO;
1844 1.3 nonaka if ((sc->sc_flags & NVME_F_ATTACHED) == 0)
1845 1.3 nonaka return ENXIO;
1846 1.3 nonaka
1847 1.5 nonaka if (nsid == 0) {
1848 1.5 nonaka /* controller */
1849 1.5 nonaka if (ISSET(sc->sc_flags, NVME_F_OPEN))
1850 1.5 nonaka return EBUSY;
1851 1.5 nonaka SET(sc->sc_flags, NVME_F_OPEN);
1852 1.5 nonaka } else {
1853 1.5 nonaka /* namespace */
1854 1.5 nonaka nsidx = nsid - 1;
1855 1.5 nonaka if (nsidx >= sc->sc_nn || sc->sc_namespaces[nsidx].dev == NULL)
1856 1.5 nonaka return ENXIO;
1857 1.5 nonaka if (ISSET(sc->sc_namespaces[nsidx].flags, NVME_NS_F_OPEN))
1858 1.5 nonaka return EBUSY;
1859 1.5 nonaka SET(sc->sc_namespaces[nsidx].flags, NVME_NS_F_OPEN);
1860 1.5 nonaka }
1861 1.3 nonaka return 0;
1862 1.3 nonaka }
1863 1.3 nonaka
1864 1.3 nonaka /*
1865 1.3 nonaka * Accept the last close on the control device.
1866 1.3 nonaka */
1867 1.3 nonaka int
1868 1.5 nonaka nvmeclose(dev_t dev, int flag, int mode, struct lwp *l)
1869 1.3 nonaka {
1870 1.3 nonaka struct nvme_softc *sc;
1871 1.3 nonaka int unit = minor(dev) / 0x10000;
1872 1.3 nonaka int nsid = minor(dev) & 0xffff;
1873 1.3 nonaka int nsidx;
1874 1.3 nonaka
1875 1.3 nonaka sc = device_lookup_private(&nvme_cd, unit);
1876 1.3 nonaka if (sc == NULL)
1877 1.3 nonaka return ENXIO;
1878 1.3 nonaka
1879 1.5 nonaka if (nsid == 0) {
1880 1.5 nonaka /* controller */
1881 1.5 nonaka CLR(sc->sc_flags, NVME_F_OPEN);
1882 1.5 nonaka } else {
1883 1.5 nonaka /* namespace */
1884 1.5 nonaka nsidx = nsid - 1;
1885 1.5 nonaka if (nsidx >= sc->sc_nn)
1886 1.5 nonaka return ENXIO;
1887 1.5 nonaka CLR(sc->sc_namespaces[nsidx].flags, NVME_NS_F_OPEN);
1888 1.5 nonaka }
1889 1.3 nonaka
1890 1.3 nonaka return 0;
1891 1.3 nonaka }
1892 1.3 nonaka
1893 1.3 nonaka /*
1894 1.3 nonaka * Handle control operations.
1895 1.3 nonaka */
1896 1.3 nonaka int
1897 1.5 nonaka nvmeioctl(dev_t dev, u_long cmd, void *data, int flag, struct lwp *l)
1898 1.3 nonaka {
1899 1.3 nonaka struct nvme_softc *sc;
1900 1.3 nonaka int unit = minor(dev) / 0x10000;
1901 1.3 nonaka int nsid = minor(dev) & 0xffff;
1902 1.5 nonaka struct nvme_pt_command *pt;
1903 1.3 nonaka
1904 1.3 nonaka sc = device_lookup_private(&nvme_cd, unit);
1905 1.3 nonaka if (sc == NULL)
1906 1.3 nonaka return ENXIO;
1907 1.3 nonaka
1908 1.3 nonaka switch (cmd) {
1909 1.3 nonaka case NVME_PASSTHROUGH_CMD:
1910 1.5 nonaka pt = data;
1911 1.5 nonaka return nvme_command_passthrough(sc, data,
1912 1.5 nonaka nsid == 0 ? pt->cmd.nsid : nsid, l, nsid == 0);
1913 1.3 nonaka }
1914 1.3 nonaka
1915 1.3 nonaka return ENOTTY;
1916 1.3 nonaka }
1917