1 /* $NetBSD: qat_ae.c,v 1.2 2021/12/05 07:28:20 msaitoh Exp $ */
2
3 /*
4 * Copyright (c) 2019 Internet Initiative Japan, Inc.
5 * All rights reserved.
6 *
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
9 * are met:
10 * 1. Redistributions of source code must retain the above copyright
11 * notice, this list of conditions and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 *
16 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
17 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
18 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
19 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
20 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
21 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
22 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
23 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
24 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
25 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
26 * POSSIBILITY OF SUCH DAMAGE.
27 */
28
29 /*
30 * Copyright(c) 2007-2019 Intel Corporation. All rights reserved.
31 *
32 * Redistribution and use in source and binary forms, with or without
33 * modification, are permitted provided that the following conditions
34 * are met:
35 *
36 * * Redistributions of source code must retain the above copyright
37 * notice, this list of conditions and the following disclaimer.
38 * * Redistributions in binary form must reproduce the above copyright
39 * notice, this list of conditions and the following disclaimer in
40 * the documentation and/or other materials provided with the
41 * distribution.
42 * * Neither the name of Intel Corporation nor the names of its
43 * contributors may be used to endorse or promote products derived
44 * from this software without specific prior written permission.
45 *
46 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
47 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
48 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
49 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
50 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
51 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
52 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
53 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
54 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
55 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
56 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
57 */
58
59 #include <sys/cdefs.h>
60 __KERNEL_RCSID(0, "$NetBSD: qat_ae.c,v 1.2 2021/12/05 07:28:20 msaitoh Exp $");
61
62 #include <sys/param.h>
63 #include <sys/systm.h>
64
65 #include <dev/firmload.h>
66
67 #include <dev/pci/pcireg.h>
68 #include <dev/pci/pcivar.h>
69 #include <dev/pci/pcidevs.h>
70
71 #include "qatreg.h"
72 #include "qatvar.h"
73 #include "qat_aevar.h"
74
75 int qat_ae_write_4(struct qat_softc *, u_char, bus_size_t,
76 uint32_t);
77 int qat_ae_read_4(struct qat_softc *, u_char, bus_size_t,
78 uint32_t *);
79 int qat_ae_write_4(struct qat_softc *, u_char, bus_size_t,
80 uint32_t);
81 void qat_ae_ctx_indr_write(struct qat_softc *, u_char, uint32_t,
82 bus_size_t, uint32_t);
83 int qat_ae_ctx_indr_read(struct qat_softc *, u_char, uint32_t,
84 bus_size_t, uint32_t *);
85
86 u_short qat_aereg_get_10bit_addr(enum aereg_type, u_short);
87 int qat_aereg_rel_data_write(struct qat_softc *, u_char, u_char,
88 enum aereg_type, u_short, uint32_t);
89 int qat_aereg_rel_data_read(struct qat_softc *, u_char, u_char,
90 enum aereg_type, u_short, uint32_t *);
91 int qat_aereg_rel_rdxfer_write(struct qat_softc *, u_char, u_char,
92 enum aereg_type, u_short, uint32_t);
93 int qat_aereg_rel_wrxfer_write(struct qat_softc *, u_char, u_char,
94 enum aereg_type, u_short, uint32_t);
95 int qat_aereg_rel_nn_write(struct qat_softc *, u_char, u_char,
96 enum aereg_type, u_short, uint32_t);
97 int qat_aereg_abs_to_rel(struct qat_softc *, u_char, u_short,
98 u_short *, u_char *);
99 int qat_aereg_abs_data_write(struct qat_softc *, u_char,
100 enum aereg_type, u_short, uint32_t);
101
102 void qat_ae_enable_ctx(struct qat_softc *, u_char, u_int);
103 void qat_ae_disable_ctx(struct qat_softc *, u_char, u_int);
104 void qat_ae_write_ctx_mode(struct qat_softc *, u_char, u_char);
105 void qat_ae_write_nn_mode(struct qat_softc *, u_char, u_char);
106 void qat_ae_write_lm_mode(struct qat_softc *, u_char,
107 enum aereg_type, u_char);
108 void qat_ae_write_shared_cs_mode0(struct qat_softc *, u_char,
109 u_char);
110 void qat_ae_write_shared_cs_mode(struct qat_softc *, u_char, u_char);
111 int qat_ae_set_reload_ustore(struct qat_softc *, u_char, u_int, int,
112 u_int);
113
114 enum qat_ae_status
115 qat_ae_get_status(struct qat_softc *, u_char);
116 int qat_ae_is_active(struct qat_softc *, u_char);
117 int qat_ae_wait_num_cycles(struct qat_softc *, u_char, int, int);
118
119 int qat_ae_clear_reset(struct qat_softc *);
120 int qat_ae_check(struct qat_softc *);
121 int qat_ae_reset_timestamp(struct qat_softc *);
122 void qat_ae_clear_xfer(struct qat_softc *);
123 int qat_ae_clear_gprs(struct qat_softc *);
124
125 void qat_ae_get_shared_ustore_ae(u_char, u_char *);
126 u_int qat_ae_ucode_parity64(uint64_t);
127 uint64_t qat_ae_ucode_set_ecc(uint64_t);
128 int qat_ae_ucode_write(struct qat_softc *, u_char, u_int, u_int,
129 const uint64_t *);
130 int qat_ae_ucode_read(struct qat_softc *, u_char, u_int, u_int,
131 uint64_t *);
132 u_int qat_ae_concat_ucode(uint64_t *, u_int, u_int, u_int, u_int *);
133 int qat_ae_exec_ucode(struct qat_softc *, u_char, u_char,
134 uint64_t *, u_int, int, u_int, u_int *);
135 int qat_ae_exec_ucode_init_lm(struct qat_softc *, u_char, u_char,
136 int *, uint64_t *, u_int,
137 u_int *, u_int *, u_int *, u_int *, u_int *);
138 int qat_ae_restore_init_lm_gprs(struct qat_softc *, u_char, u_char,
139 u_int, u_int, u_int, u_int, u_int);
140 int qat_ae_get_inst_num(int);
141 int qat_ae_batch_put_lm(struct qat_softc *, u_char,
142 struct qat_ae_batch_init_list *, size_t);
143 int qat_ae_write_pc(struct qat_softc *, u_char, u_int, u_int);
144
145 u_int qat_aefw_csum(char *, int);
146 const char * qat_aefw_uof_string(struct qat_softc *, size_t);
147 struct uof_chunk_hdr *
148 qat_aefw_uof_find_chunk(struct qat_softc *, const char *,
149 struct uof_chunk_hdr *);
150
151 int qat_aefw_load_mof(struct qat_softc *);
152 int qat_aefw_load_mmp(struct qat_softc *);
153
154 int qat_aefw_mof_find_uof0(struct qat_softc *,
155 struct mof_uof_hdr *, struct mof_uof_chunk_hdr *,
156 u_int, size_t, const char *,
157 size_t *, void **);
158 int qat_aefw_mof_find_uof(struct qat_softc *);
159 int qat_aefw_mof_parse(struct qat_softc *);
160
161 int qat_aefw_uof_parse_image(struct qat_softc *,
162 struct qat_uof_image *, struct uof_chunk_hdr *uch);
163 int qat_aefw_uof_parse_images(struct qat_softc *);
164 int qat_aefw_uof_parse(struct qat_softc *);
165
166 int qat_aefw_alloc_auth_dmamem(struct qat_softc *, char *, size_t,
167 struct qat_dmamem *);
168 int qat_aefw_auth(struct qat_softc *, struct qat_dmamem *);
169 int qat_aefw_suof_load(struct qat_softc *sc,
170 struct qat_dmamem *dma);
171 int qat_aefw_suof_parse_image(struct qat_softc *,
172 struct qat_suof_image *, struct suof_chunk_hdr *);
173 int qat_aefw_suof_parse(struct qat_softc *);
174 int qat_aefw_suof_write(struct qat_softc *);
175
176 int qat_aefw_uof_assign_image(struct qat_softc *, struct qat_ae *,
177 struct qat_uof_image *);
178 int qat_aefw_uof_init_ae(struct qat_softc *, u_char);
179 int qat_aefw_uof_init(struct qat_softc *);
180
181 int qat_aefw_init_memory_one(struct qat_softc *,
182 struct uof_init_mem *);
183 void qat_aefw_free_lm_init(struct qat_softc *, u_char);
184 int qat_aefw_init_ustore(struct qat_softc *);
185 int qat_aefw_init_reg(struct qat_softc *, u_char, u_char,
186 enum aereg_type, u_short, u_int);
187 int qat_aefw_init_reg_sym_expr(struct qat_softc *, u_char,
188 struct qat_uof_image *);
189 int qat_aefw_init_memory(struct qat_softc *);
190 int qat_aefw_init_globals(struct qat_softc *);
191 uint64_t qat_aefw_get_uof_inst(struct qat_softc *,
192 struct qat_uof_page *, u_int);
193 int qat_aefw_do_pagein(struct qat_softc *, u_char,
194 struct qat_uof_page *);
195 int qat_aefw_uof_write_one(struct qat_softc *, struct qat_uof_image *);
196 int qat_aefw_uof_write(struct qat_softc *);
197
198 int
qat_ae_write_4(struct qat_softc * sc,u_char ae,bus_size_t offset,uint32_t value)199 qat_ae_write_4(struct qat_softc *sc, u_char ae, bus_size_t offset,
200 uint32_t value)
201 {
202 int times = TIMEOUT_AE_CSR;
203
204 do {
205 qat_ae_local_write_4(sc, ae, offset, value);
206 if ((qat_ae_local_read_4(sc, ae, LOCAL_CSR_STATUS) &
207 LOCAL_CSR_STATUS_STATUS) == 0)
208 return 0;
209
210 } while (times--);
211
212 aprint_error_dev(sc->sc_dev,
213 "couldn't write AE CSR: ae 0x%hhx offset 0x%lx\n", ae, (long)offset);
214 return EFAULT;
215 }
216
217 int
qat_ae_read_4(struct qat_softc * sc,u_char ae,bus_size_t offset,uint32_t * value)218 qat_ae_read_4(struct qat_softc *sc, u_char ae, bus_size_t offset,
219 uint32_t *value)
220 {
221 int times = TIMEOUT_AE_CSR;
222 uint32_t v;
223
224 do {
225 v = qat_ae_local_read_4(sc, ae, offset);
226 if ((qat_ae_local_read_4(sc, ae, LOCAL_CSR_STATUS) &
227 LOCAL_CSR_STATUS_STATUS) == 0) {
228 *value = v;
229 return 0;
230 }
231 } while (times--);
232
233 aprint_error_dev(sc->sc_dev,
234 "couldn't read AE CSR: ae 0x%hhx offset 0x%lx\n", ae, (long)offset);
235 return EFAULT;
236 }
237
238 void
qat_ae_ctx_indr_write(struct qat_softc * sc,u_char ae,uint32_t ctx_mask,bus_size_t offset,uint32_t value)239 qat_ae_ctx_indr_write(struct qat_softc *sc, u_char ae, uint32_t ctx_mask,
240 bus_size_t offset, uint32_t value)
241 {
242 int ctx;
243 uint32_t ctxptr;
244
245 KASSERT(offset == CTX_FUTURE_COUNT_INDIRECT ||
246 offset == FUTURE_COUNT_SIGNAL_INDIRECT ||
247 offset == CTX_STS_INDIRECT ||
248 offset == CTX_WAKEUP_EVENTS_INDIRECT ||
249 offset == CTX_SIG_EVENTS_INDIRECT ||
250 offset == LM_ADDR_0_INDIRECT ||
251 offset == LM_ADDR_1_INDIRECT ||
252 offset == INDIRECT_LM_ADDR_0_BYTE_INDEX ||
253 offset == INDIRECT_LM_ADDR_1_BYTE_INDEX);
254
255 qat_ae_read_4(sc, ae, CSR_CTX_POINTER, &ctxptr);
256 for (ctx = 0; ctx < MAX_AE_CTX; ctx++) {
257 if ((ctx_mask & (1 << ctx)) == 0)
258 continue;
259 qat_ae_write_4(sc, ae, CSR_CTX_POINTER, ctx);
260 qat_ae_write_4(sc, ae, offset, value);
261 }
262 qat_ae_write_4(sc, ae, CSR_CTX_POINTER, ctxptr);
263 }
264
265 int
qat_ae_ctx_indr_read(struct qat_softc * sc,u_char ae,uint32_t ctx,bus_size_t offset,uint32_t * value)266 qat_ae_ctx_indr_read(struct qat_softc *sc, u_char ae, uint32_t ctx,
267 bus_size_t offset, uint32_t *value)
268 {
269 int error;
270 uint32_t ctxptr;
271
272 KASSERT(offset == CTX_FUTURE_COUNT_INDIRECT ||
273 offset == FUTURE_COUNT_SIGNAL_INDIRECT ||
274 offset == CTX_STS_INDIRECT ||
275 offset == CTX_WAKEUP_EVENTS_INDIRECT ||
276 offset == CTX_SIG_EVENTS_INDIRECT ||
277 offset == LM_ADDR_0_INDIRECT ||
278 offset == LM_ADDR_1_INDIRECT ||
279 offset == INDIRECT_LM_ADDR_0_BYTE_INDEX ||
280 offset == INDIRECT_LM_ADDR_1_BYTE_INDEX);
281
282 /* save the ctx ptr */
283 qat_ae_read_4(sc, ae, CSR_CTX_POINTER, &ctxptr);
284 if ((ctxptr & CSR_CTX_POINTER_CONTEXT) !=
285 (ctx & CSR_CTX_POINTER_CONTEXT))
286 qat_ae_write_4(sc, ae, CSR_CTX_POINTER, ctx);
287
288 error = qat_ae_read_4(sc, ae, offset, value);
289
290 /* restore ctx ptr */
291 if ((ctxptr & CSR_CTX_POINTER_CONTEXT) !=
292 (ctx & CSR_CTX_POINTER_CONTEXT))
293 qat_ae_write_4(sc, ae, CSR_CTX_POINTER, ctxptr);
294
295 return error;
296 }
297
298 u_short
qat_aereg_get_10bit_addr(enum aereg_type regtype,u_short reg)299 qat_aereg_get_10bit_addr(enum aereg_type regtype, u_short reg)
300 {
301 u_short addr;
302
303 switch (regtype) {
304 case AEREG_GPA_ABS:
305 case AEREG_GPB_ABS:
306 addr = (reg & 0x7f) | 0x80;
307 break;
308 case AEREG_GPA_REL:
309 case AEREG_GPB_REL:
310 addr = reg & 0x1f;
311 break;
312 case AEREG_SR_RD_REL:
313 case AEREG_SR_WR_REL:
314 case AEREG_SR_REL:
315 addr = 0x180 | (reg & 0x1f);
316 break;
317 case AEREG_SR_INDX:
318 addr = 0x140 | ((reg & 0x3) << 1);
319 break;
320 case AEREG_DR_RD_REL:
321 case AEREG_DR_WR_REL:
322 case AEREG_DR_REL:
323 addr = 0x1c0 | (reg & 0x1f);
324 break;
325 case AEREG_DR_INDX:
326 addr = 0x100 | ((reg & 0x3) << 1);
327 break;
328 case AEREG_NEIGH_INDX:
329 addr = 0x241 | ((reg & 0x3) << 1);
330 break;
331 case AEREG_NEIGH_REL:
332 addr = 0x280 | (reg & 0x1f);
333 break;
334 case AEREG_LMEM0:
335 addr = 0x200;
336 break;
337 case AEREG_LMEM1:
338 addr = 0x220;
339 break;
340 case AEREG_NO_DEST:
341 addr = 0x300 | (reg & 0xff);
342 break;
343 default:
344 addr = AEREG_BAD_REGADDR;
345 break;
346 }
347 return (addr);
348 }
349
350 int
qat_aereg_rel_data_write(struct qat_softc * sc,u_char ae,u_char ctx,enum aereg_type regtype,u_short relreg,uint32_t value)351 qat_aereg_rel_data_write(struct qat_softc *sc, u_char ae, u_char ctx,
352 enum aereg_type regtype, u_short relreg, uint32_t value)
353 {
354 uint16_t srchi, srclo, destaddr, data16hi, data16lo;
355 uint64_t inst[] = {
356 0x0F440000000ull, /* immed_w1[reg, val_hi16] */
357 0x0F040000000ull, /* immed_w0[reg, val_lo16] */
358 0x0F0000C0300ull, /* nop */
359 0x0E000010000ull /* ctx_arb[kill] */
360 };
361 const int ninst = __arraycount(inst);
362 const int imm_w1 = 0, imm_w0 = 1;
363 unsigned int ctxen;
364 uint16_t mask;
365
366 /* This logic only works for GPRs and LM index registers,
367 not NN or XFER registers! */
368 KASSERT(regtype == AEREG_GPA_REL || regtype == AEREG_GPB_REL ||
369 regtype == AEREG_LMEM0 || regtype == AEREG_LMEM1);
370
371 if ((regtype == AEREG_GPA_REL) || (regtype == AEREG_GPB_REL)) {
372 /* determine the context mode */
373 qat_ae_read_4(sc, ae, CTX_ENABLES, &ctxen);
374 if (ctxen & CTX_ENABLES_INUSE_CONTEXTS) {
375 /* 4-ctx mode */
376 if (ctx & 0x1)
377 return EINVAL;
378 mask = 0x1f;
379 } else {
380 /* 8-ctx mode */
381 mask = 0x0f;
382 }
383 if (relreg & ~mask)
384 return EINVAL;
385 }
386 if ((destaddr = qat_aereg_get_10bit_addr(regtype, relreg)) ==
387 AEREG_BAD_REGADDR) {
388 return EINVAL;
389 }
390
391 data16lo = 0xffff & value;
392 data16hi = 0xffff & (value >> 16);
393 srchi = qat_aereg_get_10bit_addr(AEREG_NO_DEST,
394 (uint16_t)(0xff & data16hi));
395 srclo = qat_aereg_get_10bit_addr(AEREG_NO_DEST,
396 (uint16_t)(0xff & data16lo));
397
398 switch (regtype) {
399 case AEREG_GPA_REL: /* A rel source */
400 inst[imm_w1] = inst[imm_w1] | ((data16hi >> 8) << 20) |
401 ((srchi & 0x3ff) << 10) | (destaddr & 0x3ff);
402 inst[imm_w0] = inst[imm_w0] | ((data16lo >> 8) << 20) |
403 ((srclo & 0x3ff) << 10) | (destaddr & 0x3ff);
404 break;
405 default:
406 inst[imm_w1] = inst[imm_w1] | ((data16hi >> 8) << 20) |
407 ((destaddr & 0x3ff) << 10) | (srchi & 0x3ff);
408 inst[imm_w0] = inst[imm_w0] | ((data16lo >> 8) << 20) |
409 ((destaddr & 0x3ff) << 10) | (srclo & 0x3ff);
410 break;
411 }
412
413 return qat_ae_exec_ucode(sc, ae, ctx, inst, ninst, 1, ninst * 5, NULL);
414 }
415
416 int
qat_aereg_rel_data_read(struct qat_softc * sc,u_char ae,u_char ctx,enum aereg_type regtype,u_short relreg,uint32_t * value)417 qat_aereg_rel_data_read(struct qat_softc *sc, u_char ae, u_char ctx,
418 enum aereg_type regtype, u_short relreg, uint32_t *value)
419 {
420 uint64_t inst, savucode;
421 uint32_t ctxen, misc, nmisc, savctx, ctxarbctl, ulo, uhi;
422 u_int uaddr, ustore_addr;
423 int error;
424 u_short mask, regaddr;
425 u_char nae;
426
427 KASSERT(regtype == AEREG_GPA_REL || regtype == AEREG_GPB_REL ||
428 regtype == AEREG_SR_REL || regtype == AEREG_SR_RD_REL ||
429 regtype == AEREG_DR_REL || regtype == AEREG_DR_RD_REL ||
430 regtype == AEREG_LMEM0 || regtype == AEREG_LMEM1);
431
432 if ((regtype == AEREG_GPA_REL) || (regtype == AEREG_GPB_REL) ||
433 (regtype == AEREG_SR_REL) || (regtype == AEREG_SR_RD_REL) ||
434 (regtype == AEREG_DR_REL) || (regtype == AEREG_DR_RD_REL))
435 {
436 /* determine the context mode */
437 qat_ae_read_4(sc, ae, CTX_ENABLES, &ctxen);
438 if (ctxen & CTX_ENABLES_INUSE_CONTEXTS) {
439 /* 4-ctx mode */
440 if (ctx & 0x1)
441 return EINVAL;
442 mask = 0x1f;
443 } else {
444 /* 8-ctx mode */
445 mask = 0x0f;
446 }
447 if (relreg & ~mask)
448 return EINVAL;
449 }
450 if ((regaddr = qat_aereg_get_10bit_addr(regtype, relreg)) ==
451 AEREG_BAD_REGADDR) {
452 return EINVAL;
453 }
454
455 /* instruction -- alu[--, --, B, reg] */
456 switch (regtype) {
457 case AEREG_GPA_REL:
458 /* A rel source */
459 inst = 0xA070000000ull | (regaddr & 0x3ff);
460 break;
461 default:
462 inst = (0xA030000000ull | ((regaddr & 0x3ff) << 10));
463 break;
464 }
465
466 /* backup shared control store bit, and force AE to
467 * none-shared mode before executing ucode snippet */
468 qat_ae_read_4(sc, ae, AE_MISC_CONTROL, &misc);
469 if (misc & AE_MISC_CONTROL_SHARE_CS) {
470 qat_ae_get_shared_ustore_ae(ae, &nae);
471 if ((1 << nae) & sc->sc_ae_mask && qat_ae_is_active(sc, nae))
472 return EBUSY;
473 }
474
475 nmisc = misc & ~AE_MISC_CONTROL_SHARE_CS;
476 qat_ae_write_4(sc, ae, AE_MISC_CONTROL, nmisc);
477
478 /* read current context */
479 qat_ae_read_4(sc, ae, ACTIVE_CTX_STATUS, &savctx);
480 qat_ae_read_4(sc, ae, CTX_ARB_CNTL, &ctxarbctl);
481
482 qat_ae_read_4(sc, ae, CTX_ENABLES, &ctxen);
483 /* prevent clearing the W1C bits: the breakpoint bit,
484 ECC error bit, and Parity error bit */
485 ctxen &= CTX_ENABLES_IGNORE_W1C_MASK;
486
487 /* change the context */
488 if (ctx != (savctx & ACTIVE_CTX_STATUS_ACNO))
489 qat_ae_write_4(sc, ae, ACTIVE_CTX_STATUS,
490 ctx & ACTIVE_CTX_STATUS_ACNO);
491 /* save a ustore location */
492 if ((error = qat_ae_ucode_read(sc, ae, 0, 1, &savucode)) != 0) {
493 /* restore AE_MISC_CONTROL csr */
494 qat_ae_write_4(sc, ae, AE_MISC_CONTROL, misc);
495
496 /* restore the context */
497 if (ctx != (savctx & ACTIVE_CTX_STATUS_ACNO)) {
498 qat_ae_write_4(sc, ae, ACTIVE_CTX_STATUS,
499 savctx & ACTIVE_CTX_STATUS_ACNO);
500 }
501 qat_ae_write_4(sc, ae, CTX_ARB_CNTL, ctxarbctl);
502
503 return (error);
504 }
505
506 /* turn off ustore parity */
507 qat_ae_write_4(sc, ae, CTX_ENABLES,
508 ctxen & (~CTX_ENABLES_CNTL_STORE_PARITY_ENABLE));
509
510 /* save ustore-addr csr */
511 qat_ae_read_4(sc, ae, USTORE_ADDRESS, &ustore_addr);
512
513 /* write the ALU instruction to ustore, enable ecs bit */
514 uaddr = 0 | USTORE_ADDRESS_ECS;
515
516 /* set the uaddress */
517 qat_ae_write_4(sc, ae, USTORE_ADDRESS, uaddr);
518 inst = qat_ae_ucode_set_ecc(inst);
519
520 ulo = (uint32_t)(inst & 0xffffffff);
521 uhi = (uint32_t)(inst >> 32);
522
523 qat_ae_write_4(sc, ae, USTORE_DATA_LOWER, ulo);
524
525 /* this will auto increment the address */
526 qat_ae_write_4(sc, ae, USTORE_DATA_UPPER, uhi);
527
528 /* set the uaddress */
529 qat_ae_write_4(sc, ae, USTORE_ADDRESS, uaddr);
530
531 /* delay for at least 8 cycles */
532 qat_ae_wait_num_cycles(sc, ae, 0x8, 0);
533
534 /* read ALU output -- the instruction should have been executed
535 prior to clearing the ECS in putUwords */
536 qat_ae_read_4(sc, ae, ALU_OUT, value);
537
538 /* restore ustore-addr csr */
539 qat_ae_write_4(sc, ae, USTORE_ADDRESS, ustore_addr);
540
541 /* restore the ustore */
542 error = qat_ae_ucode_write(sc, ae, 0, 1, &savucode);
543
544 /* restore the context */
545 if (ctx != (savctx & ACTIVE_CTX_STATUS_ACNO)) {
546 qat_ae_write_4(sc, ae, ACTIVE_CTX_STATUS,
547 savctx & ACTIVE_CTX_STATUS_ACNO);
548 }
549
550 qat_ae_write_4(sc, ae, CTX_ARB_CNTL, ctxarbctl);
551
552 /* restore AE_MISC_CONTROL csr */
553 qat_ae_write_4(sc, ae, AE_MISC_CONTROL, misc);
554
555 qat_ae_write_4(sc, ae, CTX_ENABLES, ctxen);
556
557 return error;
558 }
559
560 int
qat_aereg_rel_rdxfer_write(struct qat_softc * sc,u_char ae,u_char ctx,enum aereg_type regtype,u_short relreg,uint32_t value)561 qat_aereg_rel_rdxfer_write(struct qat_softc *sc, u_char ae, u_char ctx,
562 enum aereg_type regtype, u_short relreg, uint32_t value)
563 {
564 bus_size_t addr;
565 int error;
566 uint32_t ctxen;
567 u_short mask;
568 u_short dr_offset;
569
570 KASSERT(regtype == AEREG_SR_REL || regtype == AEREG_DR_REL ||
571 regtype == AEREG_SR_RD_REL || regtype == AEREG_DR_RD_REL);
572
573 QAT_YIELD();
574
575 error = qat_ae_read_4(sc, ae, CTX_ENABLES, &ctxen);
576 if (ctxen & CTX_ENABLES_INUSE_CONTEXTS) {
577 if (ctx & 0x1) {
578 aprint_error_dev(sc->sc_dev,
579 "bad ctx argument in 4-ctx mode,ctx=0x%x\n", ctx);
580 return EINVAL;
581 }
582 mask = 0x1f;
583 dr_offset = 0x20;
584
585 } else {
586 mask = 0x0f;
587 dr_offset = 0x10;
588 }
589
590 if (relreg & ~mask)
591 return EINVAL;
592
593 addr = relreg + (ctx << 0x5);
594
595 switch (regtype) {
596 case AEREG_SR_REL:
597 case AEREG_SR_RD_REL:
598 qat_ae_xfer_write_4(sc, ae, addr, value);
599 break;
600 case AEREG_DR_REL:
601 case AEREG_DR_RD_REL:
602 qat_ae_xfer_write_4(sc, ae, addr + dr_offset, value);
603 break;
604 default:
605 error = EINVAL;
606 }
607
608 return error;
609 }
610
611 int
qat_aereg_rel_wrxfer_write(struct qat_softc * sc,u_char ae,u_char ctx,enum aereg_type regtype,u_short relreg,uint32_t value)612 qat_aereg_rel_wrxfer_write(struct qat_softc *sc, u_char ae, u_char ctx,
613 enum aereg_type regtype, u_short relreg, uint32_t value)
614 {
615
616 panic("notyet");
617
618 return 0;
619 }
620
621 int
qat_aereg_rel_nn_write(struct qat_softc * sc,u_char ae,u_char ctx,enum aereg_type regtype,u_short relreg,uint32_t value)622 qat_aereg_rel_nn_write(struct qat_softc *sc, u_char ae, u_char ctx,
623 enum aereg_type regtype, u_short relreg, uint32_t value)
624 {
625
626 panic("notyet");
627
628 return 0;
629 }
630
631 int
qat_aereg_abs_to_rel(struct qat_softc * sc,u_char ae,u_short absreg,u_short * relreg,u_char * ctx)632 qat_aereg_abs_to_rel(struct qat_softc *sc, u_char ae,
633 u_short absreg, u_short *relreg, u_char *ctx)
634 {
635 uint32_t ctxen;
636
637 qat_ae_read_4(sc, ae, CTX_ENABLES, &ctxen);
638 if (ctxen & CTX_ENABLES_INUSE_CONTEXTS) {
639 /* 4-ctx mode */
640 *relreg = absreg & 0x1f;
641 *ctx = (absreg >> 0x4) & 0x6;
642 } else {
643 /* 8-ctx mode */
644 *relreg = absreg & 0x0f;
645 *ctx = (absreg >> 0x4) & 0x7;
646 }
647
648 return 0;
649 }
650
651 int
qat_aereg_abs_data_write(struct qat_softc * sc,u_char ae,enum aereg_type regtype,u_short absreg,uint32_t value)652 qat_aereg_abs_data_write(struct qat_softc *sc, u_char ae,
653 enum aereg_type regtype, u_short absreg, uint32_t value)
654 {
655 int error;
656 u_short relreg;
657 u_char ctx;
658
659 qat_aereg_abs_to_rel(sc, ae, absreg, &relreg, &ctx);
660
661 switch (regtype) {
662 case AEREG_GPA_ABS:
663 KASSERT(absreg < MAX_GPR_REG);
664 error = qat_aereg_rel_data_write(sc, ae, ctx, AEREG_GPA_REL,
665 relreg, value);
666 break;
667 case AEREG_GPB_ABS:
668 KASSERT(absreg < MAX_GPR_REG);
669 error = qat_aereg_rel_data_write(sc, ae, ctx, AEREG_GPB_REL,
670 relreg, value);
671 break;
672 case AEREG_DR_RD_ABS:
673 KASSERT(absreg < MAX_XFER_REG);
674 error = qat_aereg_rel_rdxfer_write(sc, ae, ctx, AEREG_DR_RD_REL,
675 relreg, value);
676 break;
677 case AEREG_SR_RD_ABS:
678 KASSERT(absreg < MAX_XFER_REG);
679 error = qat_aereg_rel_rdxfer_write(sc, ae, ctx, AEREG_SR_RD_REL,
680 relreg, value);
681 break;
682 case AEREG_DR_WR_ABS:
683 KASSERT(absreg < MAX_XFER_REG);
684 error = qat_aereg_rel_wrxfer_write(sc, ae, ctx, AEREG_DR_WR_REL,
685 relreg, value);
686 break;
687 case AEREG_SR_WR_ABS:
688 KASSERT(absreg < MAX_XFER_REG);
689 error = qat_aereg_rel_wrxfer_write(sc, ae, ctx, AEREG_SR_WR_REL,
690 relreg, value);
691 break;
692 case AEREG_NEIGH_ABS:
693 KASSERT(absreg < MAX_NN_REG);
694 if (absreg >= MAX_NN_REG)
695 return EINVAL;
696 error = qat_aereg_rel_nn_write(sc, ae, ctx, AEREG_NEIGH_REL,
697 relreg, value);
698 break;
699 default:
700 panic("Invalid Register Type");
701 }
702
703 return error;
704 }
705
706 void
qat_ae_enable_ctx(struct qat_softc * sc,u_char ae,u_int ctx_mask)707 qat_ae_enable_ctx(struct qat_softc *sc, u_char ae, u_int ctx_mask)
708 {
709 uint32_t ctxen;
710
711 qat_ae_read_4(sc, ae, CTX_ENABLES, &ctxen);
712 ctxen &= CTX_ENABLES_IGNORE_W1C_MASK;
713
714 if (ctxen & CTX_ENABLES_INUSE_CONTEXTS) {
715 ctx_mask &= 0x55;
716 } else {
717 ctx_mask &= 0xff;
718 }
719
720 ctxen |= __SHIFTIN(ctx_mask, CTX_ENABLES_ENABLE);
721 qat_ae_write_4(sc, ae, CTX_ENABLES, ctxen);
722 }
723
724 void
qat_ae_disable_ctx(struct qat_softc * sc,u_char ae,u_int ctx_mask)725 qat_ae_disable_ctx(struct qat_softc *sc, u_char ae, u_int ctx_mask)
726 {
727 uint32_t ctxen;
728
729 qat_ae_read_4(sc, ae, CTX_ENABLES, &ctxen);
730 ctxen &= CTX_ENABLES_IGNORE_W1C_MASK;
731 ctxen &= ~(__SHIFTIN(ctx_mask & AE_ALL_CTX, CTX_ENABLES_ENABLE));
732 qat_ae_write_4(sc, ae, CTX_ENABLES, ctxen);
733 }
734
735 void
qat_ae_write_ctx_mode(struct qat_softc * sc,u_char ae,u_char mode)736 qat_ae_write_ctx_mode(struct qat_softc *sc, u_char ae, u_char mode)
737 {
738 uint32_t val, nval;
739
740 qat_ae_read_4(sc, ae, CTX_ENABLES, &val);
741 val &= CTX_ENABLES_IGNORE_W1C_MASK;
742
743 if (mode == 4)
744 nval = val | CTX_ENABLES_INUSE_CONTEXTS;
745 else
746 nval = val & ~CTX_ENABLES_INUSE_CONTEXTS;
747
748 if (val != nval)
749 qat_ae_write_4(sc, ae, CTX_ENABLES, nval);
750 }
751
752 void
qat_ae_write_nn_mode(struct qat_softc * sc,u_char ae,u_char mode)753 qat_ae_write_nn_mode(struct qat_softc *sc, u_char ae, u_char mode)
754 {
755 uint32_t val, nval;
756
757 qat_ae_read_4(sc, ae, CTX_ENABLES, &val);
758 val &= CTX_ENABLES_IGNORE_W1C_MASK;
759
760 if (mode)
761 nval = val | CTX_ENABLES_NN_MODE;
762 else
763 nval = val & ~CTX_ENABLES_NN_MODE;
764
765 if (val != nval)
766 qat_ae_write_4(sc, ae, CTX_ENABLES, nval);
767 }
768
769 void
qat_ae_write_lm_mode(struct qat_softc * sc,u_char ae,enum aereg_type lm,u_char mode)770 qat_ae_write_lm_mode(struct qat_softc *sc, u_char ae,
771 enum aereg_type lm, u_char mode)
772 {
773 uint32_t val, nval;
774 uint32_t bit;
775
776 qat_ae_read_4(sc, ae, CTX_ENABLES, &val);
777 val &= CTX_ENABLES_IGNORE_W1C_MASK;
778
779 switch (lm) {
780 case AEREG_LMEM0:
781 bit = CTX_ENABLES_LMADDR_0_GLOBAL;
782 break;
783 case AEREG_LMEM1:
784 bit = CTX_ENABLES_LMADDR_1_GLOBAL;
785 break;
786 default:
787 panic("invalid lmem reg type");
788 break;
789 }
790
791 if (mode)
792 nval = val | bit;
793 else
794 nval = val & ~bit;
795
796 if (val != nval)
797 qat_ae_write_4(sc, ae, CTX_ENABLES, nval);
798 }
799
800 void
qat_ae_write_shared_cs_mode0(struct qat_softc * sc,u_char ae,u_char mode)801 qat_ae_write_shared_cs_mode0(struct qat_softc *sc, u_char ae, u_char mode)
802 {
803 uint32_t val, nval;
804
805 qat_ae_read_4(sc, ae, AE_MISC_CONTROL, &val);
806
807 if (mode == 1)
808 nval = val | AE_MISC_CONTROL_SHARE_CS;
809 else
810 nval = val & ~AE_MISC_CONTROL_SHARE_CS;
811
812 if (val != nval)
813 qat_ae_write_4(sc, ae, AE_MISC_CONTROL, nval);
814 }
815
816 void
qat_ae_write_shared_cs_mode(struct qat_softc * sc,u_char ae,u_char mode)817 qat_ae_write_shared_cs_mode(struct qat_softc *sc, u_char ae, u_char mode)
818 {
819 u_char nae;
820
821 qat_ae_get_shared_ustore_ae(ae, &nae);
822
823 qat_ae_write_shared_cs_mode0(sc, ae, mode);
824
825 if ((sc->sc_ae_mask & (1 << nae))) {
826 qat_ae_write_shared_cs_mode0(sc, nae, mode);
827 }
828 }
829
830 int
qat_ae_set_reload_ustore(struct qat_softc * sc,u_char ae,u_int reload_size,int shared_mode,u_int ustore_dram_addr)831 qat_ae_set_reload_ustore(struct qat_softc *sc, u_char ae,
832 u_int reload_size, int shared_mode, u_int ustore_dram_addr)
833 {
834 uint32_t val, cs_reload;
835
836 switch (reload_size) {
837 case 0:
838 cs_reload = 0x0;
839 break;
840 case QAT_2K:
841 cs_reload = 0x1;
842 break;
843 case QAT_4K:
844 cs_reload = 0x2;
845 break;
846 case QAT_8K:
847 cs_reload = 0x3;
848 break;
849 default:
850 return EINVAL;
851 }
852
853 if (cs_reload)
854 QAT_AE(sc, ae).qae_ustore_dram_addr = ustore_dram_addr;
855
856 QAT_AE(sc, ae).qae_reload_size = reload_size;
857
858 qat_ae_read_4(sc, ae, AE_MISC_CONTROL, &val);
859 val &= ~(AE_MISC_CONTROL_ONE_CTX_RELOAD |
860 AE_MISC_CONTROL_CS_RELOAD | AE_MISC_CONTROL_SHARE_CS);
861 val |= __SHIFTIN(cs_reload, AE_MISC_CONTROL_CS_RELOAD) |
862 __SHIFTIN(shared_mode, AE_MISC_CONTROL_ONE_CTX_RELOAD);
863 qat_ae_write_4(sc, ae, AE_MISC_CONTROL, val);
864
865 return 0;
866 }
867
868 enum qat_ae_status
qat_ae_get_status(struct qat_softc * sc,u_char ae)869 qat_ae_get_status(struct qat_softc *sc, u_char ae)
870 {
871 int error;
872 uint32_t val = 0;
873
874 error = qat_ae_read_4(sc, ae, CTX_ENABLES, &val);
875 if (error || val & CTX_ENABLES_ENABLE)
876 return QAT_AE_ENABLED;
877
878 qat_ae_read_4(sc, ae, ACTIVE_CTX_STATUS, &val);
879 if (val & ACTIVE_CTX_STATUS_ABO)
880 return QAT_AE_ACTIVE;
881
882 return QAT_AE_DISABLED;
883 }
884
885
886 int
qat_ae_is_active(struct qat_softc * sc,u_char ae)887 qat_ae_is_active(struct qat_softc *sc, u_char ae)
888 {
889 uint32_t val;
890
891 if (qat_ae_get_status(sc, ae) != QAT_AE_DISABLED)
892 return 1;
893
894 qat_ae_read_4(sc, ae, ACTIVE_CTX_STATUS, &val);
895 if (val & ACTIVE_CTX_STATUS_ABO)
896 return 1;
897 else
898 return 0;
899 }
900
901 /* returns 1 if actually waited for specified number of cycles */
902 int
qat_ae_wait_num_cycles(struct qat_softc * sc,u_char ae,int cycles,int check)903 qat_ae_wait_num_cycles(struct qat_softc *sc, u_char ae, int cycles, int check)
904 {
905 uint32_t cnt, actx;
906 int pcnt, ccnt, elapsed, times;
907
908 qat_ae_read_4(sc, ae, PROFILE_COUNT, &cnt);
909 pcnt = cnt & 0xffff;
910
911 times = TIMEOUT_AE_CHECK;
912 do {
913 qat_ae_read_4(sc, ae, PROFILE_COUNT, &cnt);
914 ccnt = cnt & 0xffff;
915
916 elapsed = ccnt - pcnt;
917 if (elapsed == 0) {
918 times--;
919 aprint_debug_dev(sc->sc_dev,
920 "qat_ae_wait_num_cycles elapsed 0 times %d\n",
921 times);
922 }
923 if (times <= 0) {
924 aprint_error_dev(sc->sc_dev,
925 "qat_ae_wait_num_cycles timeout\n");
926 return -1;
927 }
928
929 if (elapsed < 0)
930 elapsed += 0x10000;
931
932 if (elapsed >= CYCLES_FROM_READY2EXE && check) {
933 if (qat_ae_read_4(sc, ae, ACTIVE_CTX_STATUS,
934 &actx) == 0) {
935 if ((actx & ACTIVE_CTX_STATUS_ABO) == 0)
936 return 0;
937 }
938 }
939 } while (cycles > elapsed);
940
941 if (check && qat_ae_read_4(sc, ae, ACTIVE_CTX_STATUS, &actx) == 0) {
942 if ((actx & ACTIVE_CTX_STATUS_ABO) == 0)
943 return 0;
944 }
945
946 return 1;
947 }
948
949 int
qat_ae_init(struct qat_softc * sc)950 qat_ae_init(struct qat_softc *sc)
951 {
952 int error;
953 uint32_t mask, val = 0;
954 u_char ae;
955
956 /* XXX adf_initSysMemInfo */
957
958 /* XXX Disable clock gating for some chip if debug mode */
959
960 for (ae = 0, mask = sc->sc_ae_mask; mask; ae++, mask >>= 1) {
961 struct qat_ae *qae = &sc->sc_ae[ae];
962 if (!(mask & 1))
963 continue;
964
965 qae->qae_ustore_size = USTORE_SIZE;
966
967 qae->qae_free_addr = 0;
968 qae->qae_free_size = USTORE_SIZE;
969 qae->qae_live_ctx_mask = AE_ALL_CTX;
970 qae->qae_ustore_dram_addr = 0;
971 qae->qae_reload_size = 0;
972 }
973
974 /* XXX Enable attention interrupt */
975
976 error = qat_ae_clear_reset(sc);
977 if (error)
978 return error;
979
980 qat_ae_clear_xfer(sc);
981
982 if (!sc->sc_hw.qhw_fw_auth) {
983 error = qat_ae_clear_gprs(sc);
984 if (error)
985 return error;
986 }
987
988 /* Set SIGNATURE_ENABLE[0] to 0x1 in order to enable ALU_OUT csr */
989 for (ae = 0, mask = sc->sc_ae_mask; mask; ae++, mask >>= 1) {
990 if (!(mask & 1))
991 continue;
992 qat_ae_read_4(sc, ae, SIGNATURE_ENABLE, &val);
993 val |= 0x1;
994 qat_ae_write_4(sc, ae, SIGNATURE_ENABLE, val);
995 }
996
997 error = qat_ae_clear_reset(sc);
998 if (error)
999 return error;
1000
1001 /* XXX XXX XXX Clean MMP memory if mem scrub is supported */
1002 /* halMem_ScrubMMPMemory */
1003
1004 return 0;
1005 }
1006
1007 int
qat_ae_start(struct qat_softc * sc)1008 qat_ae_start(struct qat_softc *sc)
1009 {
1010 int error;
1011
1012 u_char ae;
1013
1014 for (ae = 0; ae < sc->sc_ae_num; ae++) {
1015 if ((sc->sc_ae_mask & (1 << ae)) == 0)
1016 continue;
1017
1018 error = qat_aefw_start(sc, ae, 0xff);
1019 if (error)
1020 return error;
1021
1022 aprint_verbose_dev(sc->sc_dev, "Started AE %d\n", ae);
1023 }
1024
1025 return 0;
1026 }
1027
1028 int
qat_ae_cluster_intr(void * arg)1029 qat_ae_cluster_intr(void *arg)
1030 {
1031 /* XXX */
1032 printf("qat_ae_cluster_intr\n");
1033
1034 return 1;
1035 }
1036
1037 int
qat_ae_clear_reset(struct qat_softc * sc)1038 qat_ae_clear_reset(struct qat_softc *sc)
1039 {
1040 int error;
1041 uint32_t times, reset, clock, reg, mask;
1042 u_char ae;
1043
1044 reset = qat_cap_global_read_4(sc, CAP_GLOBAL_CTL_RESET);
1045 reset &= ~(__SHIFTIN(sc->sc_ae_mask, CAP_GLOBAL_CTL_RESET_AE_MASK));
1046 reset &= ~(__SHIFTIN(sc->sc_accel_mask, CAP_GLOBAL_CTL_RESET_ACCEL_MASK));
1047 times = TIMEOUT_AE_RESET;
1048 do {
1049 qat_cap_global_write_4(sc, CAP_GLOBAL_CTL_RESET, reset);
1050 if ((times--) == 0) {
1051 aprint_error_dev(sc->sc_dev, "couldn't reset AEs\n");
1052 return EBUSY;
1053 }
1054 reg = qat_cap_global_read_4(sc, CAP_GLOBAL_CTL_RESET);
1055 } while ((__SHIFTIN(sc->sc_ae_mask, CAP_GLOBAL_CTL_RESET_AE_MASK) |
1056 __SHIFTIN(sc->sc_accel_mask, CAP_GLOBAL_CTL_RESET_ACCEL_MASK))
1057 & reg);
1058
1059 /* Enable clock for AE and QAT */
1060 clock = qat_cap_global_read_4(sc, CAP_GLOBAL_CTL_CLK_EN);
1061 clock |= __SHIFTIN(sc->sc_ae_mask, CAP_GLOBAL_CTL_CLK_EN_AE_MASK);
1062 clock |= __SHIFTIN(sc->sc_accel_mask, CAP_GLOBAL_CTL_CLK_EN_ACCEL_MASK);
1063 qat_cap_global_write_4(sc, CAP_GLOBAL_CTL_CLK_EN, clock);
1064
1065 error = qat_ae_check(sc);
1066 if (error)
1067 return error;
1068
1069 /*
1070 * Set undefined power-up/reset states to reasonable default values...
1071 * just to make sure we're starting from a known point
1072 */
1073 for (ae = 0, mask = sc->sc_ae_mask; mask; ae++, mask >>= 1) {
1074 if (!(mask & 1))
1075 continue;
1076
1077 /* init the ctx_enable */
1078 qat_ae_write_4(sc, ae, CTX_ENABLES,
1079 CTX_ENABLES_INIT);
1080
1081 /* initialize the PCs */
1082 qat_ae_ctx_indr_write(sc, ae, AE_ALL_CTX,
1083 CTX_STS_INDIRECT,
1084 UPC_MASK & CTX_STS_INDIRECT_UPC_INIT);
1085
1086 /* init the ctx_arb */
1087 qat_ae_write_4(sc, ae, CTX_ARB_CNTL,
1088 CTX_ARB_CNTL_INIT);
1089
1090 /* enable cc */
1091 qat_ae_write_4(sc, ae, CC_ENABLE,
1092 CC_ENABLE_INIT);
1093 qat_ae_ctx_indr_write(sc, ae, AE_ALL_CTX,
1094 CTX_WAKEUP_EVENTS_INDIRECT,
1095 CTX_WAKEUP_EVENTS_INDIRECT_INIT);
1096 qat_ae_ctx_indr_write(sc, ae, AE_ALL_CTX,
1097 CTX_SIG_EVENTS_INDIRECT,
1098 CTX_SIG_EVENTS_INDIRECT_INIT);
1099 }
1100
1101 if ((sc->sc_ae_mask != 0) &&
1102 sc->sc_flags & QAT_FLAG_ESRAM_ENABLE_AUTO_INIT) {
1103 /* XXX XXX XXX init eSram only when this is boot time */
1104 }
1105
1106 if ((sc->sc_ae_mask != 0) &&
1107 sc->sc_flags & QAT_FLAG_SHRAM_WAIT_READY) {
1108 /* XXX XXX XXX wait shram to complete initialization */
1109 }
1110
1111 qat_ae_reset_timestamp(sc);
1112
1113 return 0;
1114 }
1115
1116 int
qat_ae_check(struct qat_softc * sc)1117 qat_ae_check(struct qat_softc *sc)
1118 {
1119 int error, times, ae;
1120 uint32_t cnt, pcnt, mask;
1121
1122 for (ae = 0, mask = sc->sc_ae_mask; mask; ae++, mask >>= 1) {
1123 if (!(mask & 1))
1124 continue;
1125
1126 times = TIMEOUT_AE_CHECK;
1127 error = qat_ae_read_4(sc, ae, PROFILE_COUNT, &cnt);
1128 if (error) {
1129 aprint_error_dev(sc->sc_dev,
1130 "couldn't access AE %d CSR\n", ae);
1131 return error;
1132 }
1133 pcnt = cnt & 0xffff;
1134
1135 while (1) {
1136 error = qat_ae_read_4(sc, ae,
1137 PROFILE_COUNT, &cnt);
1138 if (error) {
1139 aprint_error_dev(sc->sc_dev,
1140 "couldn't access AE %d CSR\n", ae);
1141 return error;
1142 }
1143 cnt &= 0xffff;
1144 if (cnt == pcnt)
1145 times--;
1146 else
1147 break;
1148 if (times <= 0) {
1149 aprint_error_dev(sc->sc_dev,
1150 "AE %d CSR is useless\n", ae);
1151 return EFAULT;
1152 }
1153 }
1154 }
1155
1156 return 0;
1157 }
1158
1159 int
qat_ae_reset_timestamp(struct qat_softc * sc)1160 qat_ae_reset_timestamp(struct qat_softc *sc)
1161 {
1162 uint32_t misc, mask;
1163 u_char ae;
1164
1165 /* stop the timestamp timers */
1166 misc = qat_cap_global_read_4(sc, CAP_GLOBAL_CTL_MISC);
1167 if (misc & CAP_GLOBAL_CTL_MISC_TIMESTAMP_EN) {
1168 qat_cap_global_write_4(sc, CAP_GLOBAL_CTL_MISC,
1169 misc & (~CAP_GLOBAL_CTL_MISC_TIMESTAMP_EN));
1170 }
1171
1172 for (ae = 0, mask = sc->sc_ae_mask; mask; ae++, mask >>= 1) {
1173 if (!(mask & 1))
1174 continue;
1175 qat_ae_write_4(sc, ae, TIMESTAMP_LOW, 0);
1176 qat_ae_write_4(sc, ae, TIMESTAMP_HIGH, 0);
1177 }
1178
1179 /* start timestamp timers */
1180 qat_cap_global_write_4(sc, CAP_GLOBAL_CTL_MISC,
1181 misc | CAP_GLOBAL_CTL_MISC_TIMESTAMP_EN);
1182
1183 return 0;
1184 }
1185
1186
1187 void
qat_ae_clear_xfer(struct qat_softc * sc)1188 qat_ae_clear_xfer(struct qat_softc *sc)
1189 {
1190 u_int mask, reg;
1191 u_char ae;
1192
1193 for (ae = 0, mask = sc->sc_ae_mask; mask; ae++, mask >>= 1) {
1194 if (!(mask & 1))
1195 continue;
1196
1197 for (reg = 0; reg < MAX_GPR_REG; reg++) {
1198 qat_aereg_abs_data_write(sc, ae, AEREG_SR_RD_ABS,
1199 reg, 0);
1200 qat_aereg_abs_data_write(sc, ae, AEREG_DR_RD_ABS,
1201 reg, 0);
1202 }
1203 }
1204 }
1205
1206 int
qat_ae_clear_gprs(struct qat_softc * sc)1207 qat_ae_clear_gprs(struct qat_softc *sc)
1208 {
1209 uint32_t val;
1210 uint32_t saved_ctx = 0;
1211 int times = TIMEOUT_AE_CHECK, rv;
1212 u_char ae;
1213 u_int mask;
1214
1215 for (ae = 0, mask = sc->sc_ae_mask; mask; ae++, mask >>= 1) {
1216 if (!(mask & 1))
1217 continue;
1218
1219 /* turn off share control store bit */
1220 val = qat_ae_read_4(sc, ae, AE_MISC_CONTROL, &val);
1221 val &= ~AE_MISC_CONTROL_SHARE_CS;
1222 qat_ae_write_4(sc, ae, AE_MISC_CONTROL, val);
1223
1224 /* turn off ucode parity */
1225 /* make sure nn_mode is set to self */
1226 qat_ae_read_4(sc, ae, CTX_ENABLES, &val);
1227 val &= CTX_ENABLES_IGNORE_W1C_MASK;
1228 val |= CTX_ENABLES_NN_MODE;
1229 val &= ~CTX_ENABLES_CNTL_STORE_PARITY_ENABLE;
1230 qat_ae_write_4(sc, ae, CTX_ENABLES, val);
1231
1232 /* copy instructions to ustore */
1233 qat_ae_ucode_write(sc, ae, 0, __arraycount(ae_clear_gprs_inst),
1234 ae_clear_gprs_inst);
1235
1236 /* set PC */
1237 qat_ae_ctx_indr_write(sc, ae, AE_ALL_CTX, CTX_STS_INDIRECT,
1238 UPC_MASK & CTX_STS_INDIRECT_UPC_INIT);
1239
1240 /* save current context */
1241 qat_ae_read_4(sc, ae, ACTIVE_CTX_STATUS, &saved_ctx);
1242 /* change the active context */
1243 /* start the context from ctx 0 */
1244 qat_ae_write_4(sc, ae, ACTIVE_CTX_STATUS, 0);
1245
1246 /* wakeup-event voluntary */
1247 qat_ae_ctx_indr_write(sc, ae, AE_ALL_CTX,
1248 CTX_WAKEUP_EVENTS_INDIRECT,
1249 CTX_WAKEUP_EVENTS_INDIRECT_VOLUNTARY);
1250 /* clean signals */
1251 qat_ae_ctx_indr_write(sc, ae, AE_ALL_CTX,
1252 CTX_SIG_EVENTS_INDIRECT, 0);
1253 qat_ae_write_4(sc, ae, CTX_SIG_EVENTS_ACTIVE, 0);
1254
1255 qat_ae_enable_ctx(sc, ae, AE_ALL_CTX);
1256 }
1257
1258 for (ae = 0, mask = sc->sc_ae_mask; mask; ae++, mask >>= 1) {
1259 if (!(mask & 1))
1260 continue;
1261 /* wait for AE to finish */
1262 do {
1263 rv = qat_ae_wait_num_cycles(sc, ae, AE_EXEC_CYCLE, 1);
1264 } while (rv && times--);
1265 if (times <= 0) {
1266 aprint_error_dev(sc->sc_dev,
1267 "qat_ae_clear_gprs timeout");
1268 return ETIMEDOUT;
1269 }
1270 qat_ae_disable_ctx(sc, ae, AE_ALL_CTX);
1271 /* change the active context */
1272 qat_ae_write_4(sc, ae, ACTIVE_CTX_STATUS,
1273 saved_ctx & ACTIVE_CTX_STATUS_ACNO);
1274 /* init the ctx_enable */
1275 qat_ae_write_4(sc, ae, CTX_ENABLES, CTX_ENABLES_INIT);
1276 /* initialize the PCs */
1277 qat_ae_ctx_indr_write(sc, ae, AE_ALL_CTX,
1278 CTX_STS_INDIRECT, UPC_MASK & CTX_STS_INDIRECT_UPC_INIT);
1279 /* init the ctx_arb */
1280 qat_ae_write_4(sc, ae, CTX_ARB_CNTL, CTX_ARB_CNTL_INIT);
1281 /* enable cc */
1282 qat_ae_write_4(sc, ae, CC_ENABLE, CC_ENABLE_INIT);
1283 qat_ae_ctx_indr_write(sc, ae, AE_ALL_CTX,
1284 CTX_WAKEUP_EVENTS_INDIRECT, CTX_WAKEUP_EVENTS_INDIRECT_INIT);
1285 qat_ae_ctx_indr_write(sc, ae, AE_ALL_CTX, CTX_SIG_EVENTS_INDIRECT,
1286 CTX_SIG_EVENTS_INDIRECT_INIT);
1287 }
1288
1289 return 0;
1290 }
1291
1292 void
qat_ae_get_shared_ustore_ae(u_char ae,u_char * nae)1293 qat_ae_get_shared_ustore_ae(u_char ae, u_char *nae)
1294 {
1295 if (ae & 0x1)
1296 *nae = ae - 1;
1297 else
1298 *nae = ae + 1;
1299 }
1300
1301 u_int
qat_ae_ucode_parity64(uint64_t ucode)1302 qat_ae_ucode_parity64(uint64_t ucode)
1303 {
1304
1305 ucode ^= ucode >> 1;
1306 ucode ^= ucode >> 2;
1307 ucode ^= ucode >> 4;
1308 ucode ^= ucode >> 8;
1309 ucode ^= ucode >> 16;
1310 ucode ^= ucode >> 32;
1311
1312 return ((u_int)(ucode & 1));
1313 }
1314
1315 uint64_t
qat_ae_ucode_set_ecc(uint64_t ucode)1316 qat_ae_ucode_set_ecc(uint64_t ucode)
1317 {
1318 static const uint64_t
1319 bit0mask=0xff800007fffULL, bit1mask=0x1f801ff801fULL,
1320 bit2mask=0xe387e0781e1ULL, bit3mask=0x7cb8e388e22ULL,
1321 bit4mask=0xaf5b2c93244ULL, bit5mask=0xf56d5525488ULL,
1322 bit6mask=0xdaf69a46910ULL;
1323
1324 /* clear the ecc bits */
1325 ucode &= ~(0x7fULL << USTORE_ECC_BIT_0);
1326
1327 ucode |= (uint64_t)qat_ae_ucode_parity64(bit0mask & ucode) <<
1328 USTORE_ECC_BIT_0;
1329 ucode |= (uint64_t)qat_ae_ucode_parity64(bit1mask & ucode) <<
1330 USTORE_ECC_BIT_1;
1331 ucode |= (uint64_t)qat_ae_ucode_parity64(bit2mask & ucode) <<
1332 USTORE_ECC_BIT_2;
1333 ucode |= (uint64_t)qat_ae_ucode_parity64(bit3mask & ucode) <<
1334 USTORE_ECC_BIT_3;
1335 ucode |= (uint64_t)qat_ae_ucode_parity64(bit4mask & ucode) <<
1336 USTORE_ECC_BIT_4;
1337 ucode |= (uint64_t)qat_ae_ucode_parity64(bit5mask & ucode) <<
1338 USTORE_ECC_BIT_5;
1339 ucode |= (uint64_t)qat_ae_ucode_parity64(bit6mask & ucode) <<
1340 USTORE_ECC_BIT_6;
1341
1342 return (ucode);
1343 }
1344
1345 int
qat_ae_ucode_write(struct qat_softc * sc,u_char ae,u_int uaddr,u_int ninst,const uint64_t * ucode)1346 qat_ae_ucode_write(struct qat_softc *sc, u_char ae, u_int uaddr, u_int ninst,
1347 const uint64_t *ucode)
1348 {
1349 uint64_t tmp;
1350 uint32_t ustore_addr, ulo, uhi;
1351 int i;
1352
1353 qat_ae_read_4(sc, ae, USTORE_ADDRESS, &ustore_addr);
1354 uaddr |= USTORE_ADDRESS_ECS;
1355
1356 qat_ae_write_4(sc, ae, USTORE_ADDRESS, uaddr);
1357 for (i = 0; i < ninst; i++) {
1358 tmp = qat_ae_ucode_set_ecc(ucode[i]);
1359 ulo = (uint32_t)(tmp & 0xffffffff);
1360 uhi = (uint32_t)(tmp >> 32);
1361
1362 qat_ae_write_4(sc, ae, USTORE_DATA_LOWER, ulo);
1363 /* this will auto increment the address */
1364 qat_ae_write_4(sc, ae, USTORE_DATA_UPPER, uhi);
1365
1366 QAT_YIELD();
1367 }
1368 qat_ae_write_4(sc, ae, USTORE_ADDRESS, ustore_addr);
1369
1370 return 0;
1371 }
1372
1373 int
qat_ae_ucode_read(struct qat_softc * sc,u_char ae,u_int uaddr,u_int ninst,uint64_t * ucode)1374 qat_ae_ucode_read(struct qat_softc *sc, u_char ae, u_int uaddr, u_int ninst,
1375 uint64_t *ucode)
1376 {
1377 uint32_t misc, ustore_addr, ulo, uhi;
1378 u_int ii;
1379 u_char nae;
1380
1381 if (qat_ae_get_status(sc, ae) != QAT_AE_DISABLED)
1382 return EBUSY;
1383
1384 /* determine whether it neighbour AE runs in shared control store
1385 * status */
1386 qat_ae_read_4(sc, ae, AE_MISC_CONTROL, &misc);
1387 if (misc & AE_MISC_CONTROL_SHARE_CS) {
1388 qat_ae_get_shared_ustore_ae(ae, &nae);
1389 if ((sc->sc_ae_mask & (1 << nae)) && qat_ae_is_active(sc, nae))
1390 return EBUSY;
1391 }
1392
1393 /* if reloadable, then get it all from dram-ustore */
1394 if (__SHIFTOUT(misc, AE_MISC_CONTROL_CS_RELOAD))
1395 panic("notyet"); /* XXX getReloadUwords */
1396
1397 /* disable SHARE_CS bit to workaround silicon bug */
1398 qat_ae_write_4(sc, ae, AE_MISC_CONTROL, misc & 0xfffffffb);
1399
1400 KASSERT(uaddr + ninst <= USTORE_SIZE);
1401
1402 /* save ustore-addr csr */
1403 qat_ae_read_4(sc, ae, USTORE_ADDRESS, &ustore_addr);
1404
1405 uaddr |= USTORE_ADDRESS_ECS; /* enable ecs bit */
1406 for (ii = 0; ii < ninst; ii++) {
1407 qat_ae_write_4(sc, ae, USTORE_ADDRESS, uaddr);
1408
1409 uaddr++;
1410 qat_ae_read_4(sc, ae, USTORE_DATA_LOWER, &ulo);
1411 qat_ae_read_4(sc, ae, USTORE_DATA_UPPER, &uhi);
1412 ucode[ii] = uhi;
1413 ucode[ii] = (ucode[ii] << 32) | ulo;
1414 }
1415
1416 /* restore SHARE_CS bit to workaround silicon bug */
1417 qat_ae_write_4(sc, ae, AE_MISC_CONTROL, misc);
1418 qat_ae_write_4(sc, ae, USTORE_ADDRESS, ustore_addr);
1419
1420 return 0;
1421 }
1422
1423 u_int
qat_ae_concat_ucode(uint64_t * ucode,u_int ninst,u_int size,u_int addr,u_int * value)1424 qat_ae_concat_ucode(uint64_t *ucode, u_int ninst, u_int size, u_int addr,
1425 u_int *value)
1426 {
1427 const uint64_t *inst_arr;
1428 u_int ninst0, curvalue;
1429 int ii, vali, fixup, usize = 0;
1430
1431 if (size == 0)
1432 return 0;
1433
1434 ninst0 = ninst;
1435 vali = 0;
1436 curvalue = value[vali++];
1437
1438 switch (size) {
1439 case 0x1:
1440 inst_arr = ae_inst_1b;
1441 usize = __arraycount(ae_inst_1b);
1442 break;
1443 case 0x2:
1444 inst_arr = ae_inst_2b;
1445 usize = __arraycount(ae_inst_2b);
1446 break;
1447 case 0x3:
1448 inst_arr = ae_inst_3b;
1449 usize = __arraycount(ae_inst_3b);
1450 break;
1451 default:
1452 inst_arr = ae_inst_4b;
1453 usize = __arraycount(ae_inst_4b);
1454 break;
1455 }
1456
1457 fixup = ninst;
1458 for (ii = 0; ii < usize; ii++)
1459 ucode[ninst++] = inst_arr[ii];
1460
1461 INSERT_IMMED_GPRA_CONST(ucode[fixup], (addr));
1462 fixup++;
1463 INSERT_IMMED_GPRA_CONST(ucode[fixup], 0);
1464 fixup++;
1465 INSERT_IMMED_GPRB_CONST(ucode[fixup], (curvalue >> 0));
1466 fixup++;
1467 INSERT_IMMED_GPRB_CONST(ucode[fixup], (curvalue >> 16));
1468 /* XXX fixup++ ? */
1469
1470 if (size <= 0x4)
1471 return (ninst - ninst0);
1472
1473 size -= sizeof(u_int);
1474 while (size >= sizeof(u_int)) {
1475 curvalue = value[vali++];
1476 fixup = ninst;
1477 ucode[ninst++] = ae_inst_4b[0x2];
1478 ucode[ninst++] = ae_inst_4b[0x3];
1479 ucode[ninst++] = ae_inst_4b[0x8];
1480 INSERT_IMMED_GPRB_CONST(ucode[fixup], (curvalue >> 16));
1481 fixup++;
1482 INSERT_IMMED_GPRB_CONST(ucode[fixup], (curvalue >> 0));
1483 /* XXX fixup++ ? */
1484
1485 addr += sizeof(u_int);
1486 size -= sizeof(u_int);
1487 }
1488 /* call this function recursive when the left size less than 4 */
1489 ninst +=
1490 qat_ae_concat_ucode(ucode, ninst, size, addr, value + vali);
1491
1492 return (ninst - ninst0);
1493 }
1494
1495 int
qat_ae_exec_ucode(struct qat_softc * sc,u_char ae,u_char ctx,uint64_t * ucode,u_int ninst,int cond_code_off,u_int max_cycles,u_int * endpc)1496 qat_ae_exec_ucode(struct qat_softc *sc, u_char ae, u_char ctx,
1497 uint64_t *ucode, u_int ninst, int cond_code_off, u_int max_cycles,
1498 u_int *endpc)
1499 {
1500 int error = 0, share_cs = 0;
1501 uint64_t savucode[MAX_EXEC_INST];
1502 uint32_t indr_lm_addr_0, indr_lm_addr_1;
1503 uint32_t indr_lm_addr_byte_0, indr_lm_addr_byte_1;
1504 uint32_t indr_future_cnt_sig;
1505 uint32_t indr_sig, active_sig;
1506 uint32_t wakeup_ev, savpc, savcc, savctx, ctxarbctl;
1507 uint32_t misc, nmisc, ctxen;
1508 u_char nae;
1509
1510 KASSERT(ninst <= USTORE_SIZE);
1511
1512 if (qat_ae_is_active(sc, ae))
1513 return EBUSY;
1514
1515 #if 0
1516 printf("%s: ae %d ctx %d ninst %d code 0x%016llx 0x%016llx\n",
1517 __func__, ae, ctx, ninst, ucode[0], ucode[ninst-1]);
1518 #endif
1519
1520 /* save current LM addr */
1521 qat_ae_ctx_indr_read(sc, ae, ctx, LM_ADDR_0_INDIRECT, &indr_lm_addr_0);
1522 qat_ae_ctx_indr_read(sc, ae, ctx, LM_ADDR_1_INDIRECT, &indr_lm_addr_1);
1523 qat_ae_ctx_indr_read(sc, ae, ctx, INDIRECT_LM_ADDR_0_BYTE_INDEX,
1524 &indr_lm_addr_byte_0);
1525 qat_ae_ctx_indr_read(sc, ae, ctx, INDIRECT_LM_ADDR_1_BYTE_INDEX,
1526 &indr_lm_addr_byte_1);
1527
1528 /* backup shared control store bit, and force AE to
1529 none-shared mode before executing ucode snippet */
1530 qat_ae_read_4(sc, ae, AE_MISC_CONTROL, &misc);
1531 if (misc & AE_MISC_CONTROL_SHARE_CS) {
1532 share_cs = 1;
1533 qat_ae_get_shared_ustore_ae(ae, &nae);
1534 if ((sc->sc_ae_mask & (1 << nae)) && qat_ae_is_active(sc, nae))
1535 return EBUSY;
1536 }
1537 nmisc = misc & ~AE_MISC_CONTROL_SHARE_CS;
1538 qat_ae_write_4(sc, ae, AE_MISC_CONTROL, nmisc);
1539
1540 /* save current states: */
1541 if (ninst <= MAX_EXEC_INST) {
1542 error = qat_ae_ucode_read(sc, ae, 0, ninst, savucode);
1543 if (error) {
1544 qat_ae_write_4(sc, ae, AE_MISC_CONTROL, misc);
1545 return error;
1546 }
1547 }
1548
1549 /* save wakeup-events */
1550 qat_ae_ctx_indr_read(sc, ae, ctx, CTX_WAKEUP_EVENTS_INDIRECT,
1551 &wakeup_ev);
1552 /* save PC */
1553 qat_ae_ctx_indr_read(sc, ae, ctx, CTX_STS_INDIRECT, &savpc);
1554 savpc &= UPC_MASK;
1555
1556 /* save ctx enables */
1557 qat_ae_read_4(sc, ae, CTX_ENABLES, &ctxen);
1558 ctxen &= CTX_ENABLES_IGNORE_W1C_MASK;
1559 /* save conditional-code */
1560 qat_ae_read_4(sc, ae, CC_ENABLE, &savcc);
1561 /* save current context */
1562 qat_ae_read_4(sc, ae, ACTIVE_CTX_STATUS, &savctx);
1563 qat_ae_read_4(sc, ae, CTX_ARB_CNTL, &ctxarbctl);
1564
1565 /* save indirect csrs */
1566 qat_ae_ctx_indr_read(sc, ae, ctx, FUTURE_COUNT_SIGNAL_INDIRECT,
1567 &indr_future_cnt_sig);
1568 qat_ae_ctx_indr_read(sc, ae, ctx, CTX_SIG_EVENTS_INDIRECT, &indr_sig);
1569 qat_ae_read_4(sc, ae, CTX_SIG_EVENTS_ACTIVE, &active_sig);
1570
1571 /* turn off ucode parity */
1572 qat_ae_write_4(sc, ae, CTX_ENABLES,
1573 ctxen & ~CTX_ENABLES_CNTL_STORE_PARITY_ENABLE);
1574
1575 /* copy instructions to ustore */
1576 qat_ae_ucode_write(sc, ae, 0, ninst, ucode);
1577 /* set PC */
1578 qat_ae_ctx_indr_write(sc, ae, 1 << ctx, CTX_STS_INDIRECT, 0);
1579 /* change the active context */
1580 qat_ae_write_4(sc, ae, ACTIVE_CTX_STATUS,
1581 ctx & ACTIVE_CTX_STATUS_ACNO);
1582
1583 if (cond_code_off) {
1584 /* disable conditional-code*/
1585 qat_ae_write_4(sc, ae, CC_ENABLE, savcc & 0xffffdfff);
1586 }
1587
1588 /* wakeup-event voluntary */
1589 qat_ae_ctx_indr_write(sc, ae, 1 << ctx,
1590 CTX_WAKEUP_EVENTS_INDIRECT, CTX_WAKEUP_EVENTS_INDIRECT_VOLUNTARY);
1591
1592 /* clean signals */
1593 qat_ae_ctx_indr_write(sc, ae, 1 << ctx, CTX_SIG_EVENTS_INDIRECT, 0);
1594 qat_ae_write_4(sc, ae, CTX_SIG_EVENTS_ACTIVE, 0);
1595
1596 /* enable context */
1597 qat_ae_enable_ctx(sc, ae, 1 << ctx);
1598
1599 /* wait for it to finish */
1600 if (qat_ae_wait_num_cycles(sc, ae, max_cycles, 1) != 0)
1601 error = ETIMEDOUT;
1602
1603 /* see if we need to get the current PC */
1604 if (endpc != NULL) {
1605 uint32_t ctx_status;
1606
1607 qat_ae_ctx_indr_read(sc, ae, ctx, CTX_STS_INDIRECT,
1608 &ctx_status);
1609 *endpc = ctx_status & UPC_MASK;
1610 }
1611 #if 0
1612 {
1613 uint32_t ctx_status;
1614
1615 qat_ae_ctx_indr_read(sc, ae, ctx, CTX_STS_INDIRECT,
1616 &ctx_status);
1617 printf("%s: endpc 0x%08x\n", __func__,
1618 ctx_status & UPC_MASK);
1619 }
1620 #endif
1621
1622 /* retore to previous states: */
1623 /* disable context */
1624 qat_ae_disable_ctx(sc, ae, 1 << ctx);
1625 if (ninst <= MAX_EXEC_INST) {
1626 /* instructions */
1627 qat_ae_ucode_write(sc, ae, 0, ninst, savucode);
1628 }
1629 /* wakeup-events */
1630 qat_ae_ctx_indr_write(sc, ae, 1 << ctx, CTX_WAKEUP_EVENTS_INDIRECT,
1631 wakeup_ev);
1632 qat_ae_ctx_indr_write(sc, ae, 1 << ctx, CTX_STS_INDIRECT, savpc);
1633
1634 /* only restore shared control store bit,
1635 other bit might be changed by AE code snippet */
1636 qat_ae_read_4(sc, ae, AE_MISC_CONTROL, &misc);
1637 if (share_cs)
1638 nmisc = misc | AE_MISC_CONTROL_SHARE_CS;
1639 else
1640 nmisc = misc & ~AE_MISC_CONTROL_SHARE_CS;
1641 qat_ae_write_4(sc, ae, AE_MISC_CONTROL, nmisc);
1642 /* conditional-code */
1643 qat_ae_write_4(sc, ae, CC_ENABLE, savcc);
1644 /* change the active context */
1645 qat_ae_write_4(sc, ae, ACTIVE_CTX_STATUS,
1646 savctx & ACTIVE_CTX_STATUS_ACNO);
1647 /* restore the nxt ctx to run */
1648 qat_ae_write_4(sc, ae, CTX_ARB_CNTL, ctxarbctl);
1649 /* restore current LM addr */
1650 qat_ae_ctx_indr_write(sc, ae, 1 << ctx, LM_ADDR_0_INDIRECT,
1651 indr_lm_addr_0);
1652 qat_ae_ctx_indr_write(sc, ae, 1 << ctx, LM_ADDR_1_INDIRECT,
1653 indr_lm_addr_1);
1654 qat_ae_ctx_indr_write(sc, ae, 1 << ctx, INDIRECT_LM_ADDR_0_BYTE_INDEX,
1655 indr_lm_addr_byte_0);
1656 qat_ae_ctx_indr_write(sc, ae, 1 << ctx, INDIRECT_LM_ADDR_1_BYTE_INDEX,
1657 indr_lm_addr_byte_1);
1658
1659 /* restore indirect csrs */
1660 qat_ae_ctx_indr_write(sc, ae, 1 << ctx, FUTURE_COUNT_SIGNAL_INDIRECT,
1661 indr_future_cnt_sig);
1662 qat_ae_ctx_indr_write(sc, ae, 1 << ctx, CTX_SIG_EVENTS_INDIRECT,
1663 indr_sig);
1664 qat_ae_write_4(sc, ae, CTX_SIG_EVENTS_ACTIVE, active_sig);
1665
1666 /* ctx-enables */
1667 qat_ae_write_4(sc, ae, CTX_ENABLES, ctxen);
1668
1669 return error;
1670 }
1671
1672 int
qat_ae_exec_ucode_init_lm(struct qat_softc * sc,u_char ae,u_char ctx,int * first_exec,uint64_t * ucode,u_int ninst,u_int * gpr_a0,u_int * gpr_a1,u_int * gpr_a2,u_int * gpr_b0,u_int * gpr_b1)1673 qat_ae_exec_ucode_init_lm(struct qat_softc *sc, u_char ae, u_char ctx,
1674 int *first_exec, uint64_t *ucode, u_int ninst,
1675 u_int *gpr_a0, u_int *gpr_a1, u_int *gpr_a2, u_int *gpr_b0, u_int *gpr_b1)
1676 {
1677
1678 if (*first_exec) {
1679 qat_aereg_rel_data_read(sc, ae, ctx, AEREG_GPA_REL, 0, gpr_a0);
1680 qat_aereg_rel_data_read(sc, ae, ctx, AEREG_GPA_REL, 1, gpr_a1);
1681 qat_aereg_rel_data_read(sc, ae, ctx, AEREG_GPA_REL, 2, gpr_a2);
1682 qat_aereg_rel_data_read(sc, ae, ctx, AEREG_GPB_REL, 0, gpr_b0);
1683 qat_aereg_rel_data_read(sc, ae, ctx, AEREG_GPB_REL, 1, gpr_b1);
1684 *first_exec = 0;
1685 }
1686
1687 return qat_ae_exec_ucode(sc, ae, ctx, ucode, ninst, 1, ninst * 5, NULL);
1688 }
1689
1690 int
qat_ae_restore_init_lm_gprs(struct qat_softc * sc,u_char ae,u_char ctx,u_int gpr_a0,u_int gpr_a1,u_int gpr_a2,u_int gpr_b0,u_int gpr_b1)1691 qat_ae_restore_init_lm_gprs(struct qat_softc *sc, u_char ae, u_char ctx,
1692 u_int gpr_a0, u_int gpr_a1, u_int gpr_a2, u_int gpr_b0, u_int gpr_b1)
1693 {
1694 qat_aereg_rel_data_write(sc, ae, ctx, AEREG_GPA_REL, 0, gpr_a0);
1695 qat_aereg_rel_data_write(sc, ae, ctx, AEREG_GPA_REL, 1, gpr_a1);
1696 qat_aereg_rel_data_write(sc, ae, ctx, AEREG_GPA_REL, 2, gpr_a2);
1697 qat_aereg_rel_data_write(sc, ae, ctx, AEREG_GPB_REL, 0, gpr_b0);
1698 qat_aereg_rel_data_write(sc, ae, ctx, AEREG_GPB_REL, 1, gpr_b1);
1699
1700 return 0;
1701 }
1702
1703 int
qat_ae_get_inst_num(int lmsize)1704 qat_ae_get_inst_num(int lmsize)
1705 {
1706 int ninst, left;
1707
1708 if (lmsize == 0)
1709 return 0;
1710
1711 left = lmsize % sizeof(u_int);
1712
1713 if (left) {
1714 ninst = __arraycount(ae_inst_1b) +
1715 qat_ae_get_inst_num(lmsize - left);
1716 } else {
1717 /* 3 instruction is needed for further code */
1718 ninst = (lmsize - sizeof(u_int)) * 3 / 4 +
1719 __arraycount(ae_inst_4b);
1720 }
1721
1722 return (ninst);
1723 }
1724
1725 int
qat_ae_batch_put_lm(struct qat_softc * sc,u_char ae,struct qat_ae_batch_init_list * qabi_list,size_t nqabi)1726 qat_ae_batch_put_lm(struct qat_softc *sc, u_char ae,
1727 struct qat_ae_batch_init_list *qabi_list, size_t nqabi)
1728 {
1729 struct qat_ae_batch_init *qabi;
1730 size_t alloc_ninst, ninst;
1731 uint64_t *ucode;
1732 u_int gpr_a0, gpr_a1, gpr_a2, gpr_b0, gpr_b1;
1733 int insnsz, error = 0, execed = 0, first_exec = 1;
1734
1735 if (SIMPLEQ_FIRST(qabi_list) == NULL)
1736 return 0;
1737
1738 alloc_ninst = uimin(USTORE_SIZE, nqabi);
1739 ucode = qat_alloc_mem(sizeof(uint64_t) * alloc_ninst);
1740
1741 ninst = 0;
1742 SIMPLEQ_FOREACH(qabi, qabi_list, qabi_next) {
1743 insnsz = qat_ae_get_inst_num(qabi->qabi_size);
1744 if (insnsz + ninst > alloc_ninst) {
1745 aprint_debug_dev(sc->sc_dev,
1746 "code page is full, call exection unit\n");
1747 /* add ctx_arb[kill] */
1748 ucode[ninst++] = 0x0E000010000ull;
1749 execed = 1;
1750
1751 error = qat_ae_exec_ucode_init_lm(sc, ae, 0,
1752 &first_exec, ucode, ninst,
1753 &gpr_a0, &gpr_a1, &gpr_a2, &gpr_b0, &gpr_b1);
1754 if (error) {
1755 qat_ae_restore_init_lm_gprs(sc, ae, 0,
1756 gpr_a0, gpr_a1, gpr_a2, gpr_b0, gpr_b1);
1757 qat_free_mem(ucode);
1758 return error;
1759 }
1760 /* run microExec to execute the microcode */
1761 ninst = 0;
1762 }
1763 ninst += qat_ae_concat_ucode(ucode, ninst,
1764 qabi->qabi_size, qabi->qabi_addr, qabi->qabi_value);
1765 }
1766
1767 if (ninst > 0) {
1768 ucode[ninst++] = 0x0E000010000ull;
1769 execed = 1;
1770
1771 error = qat_ae_exec_ucode_init_lm(sc, ae, 0,
1772 &first_exec, ucode, ninst,
1773 &gpr_a0, &gpr_a1, &gpr_a2, &gpr_b0, &gpr_b1);
1774 }
1775 if (execed) {
1776 qat_ae_restore_init_lm_gprs(sc, ae, 0,
1777 gpr_a0, gpr_a1, gpr_a2, gpr_b0, gpr_b1);
1778 }
1779
1780 qat_free_mem(ucode);
1781
1782 return error;
1783 }
1784
1785 int
qat_ae_write_pc(struct qat_softc * sc,u_char ae,u_int ctx_mask,u_int upc)1786 qat_ae_write_pc(struct qat_softc *sc, u_char ae, u_int ctx_mask, u_int upc)
1787 {
1788
1789 if (qat_ae_is_active(sc, ae))
1790 return EBUSY;
1791
1792 qat_ae_ctx_indr_write(sc, ae, ctx_mask, CTX_STS_INDIRECT,
1793 UPC_MASK & upc);
1794 return 0;
1795 }
1796
1797 static inline u_int
qat_aefw_csum_calc(u_int reg,int ch)1798 qat_aefw_csum_calc(u_int reg, int ch)
1799 {
1800 int i;
1801 u_int topbit = CRC_BITMASK(CRC_WIDTH - 1);
1802 u_int inbyte = (u_int)((reg >> 0x18) ^ ch);
1803
1804 reg ^= inbyte << (CRC_WIDTH - 0x8);
1805 for (i = 0; i < 0x8; i++) {
1806 if (reg & topbit)
1807 reg = (reg << 1) ^ CRC_POLY;
1808 else
1809 reg <<= 1;
1810 }
1811
1812 return (reg & CRC_WIDTHMASK(CRC_WIDTH));
1813 }
1814
1815 u_int
qat_aefw_csum(char * buf,int size)1816 qat_aefw_csum(char *buf, int size)
1817 {
1818 u_int csum = 0;
1819
1820 while (size--) {
1821 csum = qat_aefw_csum_calc(csum, *buf++);
1822 }
1823
1824 return csum;
1825 }
1826
1827 const char *
qat_aefw_uof_string(struct qat_softc * sc,size_t offset)1828 qat_aefw_uof_string(struct qat_softc *sc, size_t offset)
1829 {
1830 if (offset >= sc->sc_aefw_uof.qafu_str_tab_size)
1831 return NULL;
1832 if (sc->sc_aefw_uof.qafu_str_tab == NULL)
1833 return NULL;
1834
1835 return (const char *)((uintptr_t)sc->sc_aefw_uof.qafu_str_tab + offset);
1836 }
1837
1838 struct uof_chunk_hdr *
qat_aefw_uof_find_chunk(struct qat_softc * sc,const char * id,struct uof_chunk_hdr * cur)1839 qat_aefw_uof_find_chunk(struct qat_softc *sc,
1840 const char *id, struct uof_chunk_hdr *cur)
1841 {
1842 struct uof_obj_hdr *uoh = sc->sc_aefw_uof.qafu_obj_hdr;
1843 struct uof_chunk_hdr *uch;
1844 int i;
1845
1846 uch = (struct uof_chunk_hdr *)(uoh + 1);
1847 for (i = 0; i < uoh->uoh_num_chunks; i++, uch++) {
1848 if (uch->uch_offset + uch->uch_size > sc->sc_aefw_uof.qafu_size)
1849 return NULL;
1850
1851 if (cur < uch && !strncmp(uch->uch_id, id, UOF_OBJ_ID_LEN))
1852 return uch;
1853 }
1854
1855 return NULL;
1856 }
1857
1858 int
qat_aefw_load_mof(struct qat_softc * sc)1859 qat_aefw_load_mof(struct qat_softc *sc)
1860 {
1861 int error = 0;
1862 firmware_handle_t fh = NULL;
1863 off_t fwsize;
1864
1865 /* load MOF firmware */
1866 error = firmware_open("qat", sc->sc_hw.qhw_mof_fwname, &fh);
1867 if (error) {
1868 aprint_error_dev(sc->sc_dev, "couldn't load mof firmware %s\n",
1869 sc->sc_hw.qhw_mof_fwname);
1870 goto fail;
1871 }
1872
1873 fwsize = firmware_get_size(fh);
1874 if (fwsize == 0 || fwsize > SIZE_MAX) {
1875 error = EINVAL;
1876 goto fail;
1877 }
1878 sc->sc_fw_mof_size = fwsize;
1879 sc->sc_fw_mof = firmware_malloc(sc->sc_fw_mof_size);
1880
1881 error = firmware_read(fh, 0, sc->sc_fw_mof, sc->sc_fw_mof_size);
1882 if (error)
1883 goto fail;
1884
1885 out:
1886 if (fh != NULL)
1887 firmware_close(fh);
1888 return error;
1889 fail:
1890 if (sc->sc_fw_mof != NULL) {
1891 firmware_free(sc->sc_fw_mof, sc->sc_fw_mof_size);
1892 sc->sc_fw_mof = NULL;
1893 }
1894 goto out;
1895 }
1896
1897 int
qat_aefw_load_mmp(struct qat_softc * sc)1898 qat_aefw_load_mmp(struct qat_softc *sc)
1899 {
1900 int error = 0;
1901 firmware_handle_t fh = NULL;
1902 off_t fwsize;
1903
1904 error = firmware_open("qat", sc->sc_hw.qhw_mmp_fwname, &fh);
1905 if (error) {
1906 aprint_error_dev(sc->sc_dev, "couldn't load mmp firmware %s\n",
1907 sc->sc_hw.qhw_mmp_fwname);
1908 goto fail;
1909 }
1910
1911 fwsize = firmware_get_size(fh);
1912 if (fwsize == 0 || fwsize > SIZE_MAX) {
1913 error = EINVAL;
1914 goto fail;
1915 }
1916 sc->sc_fw_mmp_size = fwsize;
1917 sc->sc_fw_mmp = firmware_malloc(sc->sc_fw_mmp_size);
1918
1919 error = firmware_read(fh, 0, sc->sc_fw_mmp, sc->sc_fw_mmp_size);
1920 if (error)
1921 goto fail;
1922
1923 out:
1924 if (fh != NULL)
1925 firmware_close(fh);
1926 return error;
1927 fail:
1928 if (sc->sc_fw_mmp != NULL) {
1929 firmware_free(sc->sc_fw_mmp, sc->sc_fw_mmp_size);
1930 sc->sc_fw_mmp = NULL;
1931 }
1932 goto out;
1933 }
1934
1935 int
qat_aefw_mof_find_uof0(struct qat_softc * sc,struct mof_uof_hdr * muh,struct mof_uof_chunk_hdr * head,u_int nchunk,size_t size,const char * id,size_t * fwsize,void ** fwptr)1936 qat_aefw_mof_find_uof0(struct qat_softc *sc,
1937 struct mof_uof_hdr *muh, struct mof_uof_chunk_hdr *head,
1938 u_int nchunk, size_t size, const char *id,
1939 size_t *fwsize, void **fwptr)
1940 {
1941 int i;
1942 char *uof_name;
1943
1944 for (i = 0; i < nchunk; i++) {
1945 struct mof_uof_chunk_hdr *much = &head[i];
1946
1947 if (strncmp(much->much_id, id, MOF_OBJ_ID_LEN))
1948 return EINVAL;
1949
1950 if (much->much_offset + much->much_size > size)
1951 return EINVAL;
1952
1953 if (sc->sc_mof.qmf_sym_size <= much->much_name)
1954 return EINVAL;
1955
1956 uof_name = (char *)((uintptr_t)sc->sc_mof.qmf_sym +
1957 much->much_name);
1958
1959 if (!strcmp(uof_name, sc->sc_fw_uof_name)) {
1960 *fwptr = (void *)((uintptr_t)muh +
1961 (uintptr_t)much->much_offset);
1962 *fwsize = (size_t)much->much_size;
1963 aprint_verbose_dev(sc->sc_dev,
1964 "%s obj %s at %p size 0x%lx\n",
1965 id, uof_name, *fwptr, *fwsize);
1966 return 0;
1967 }
1968 }
1969
1970 return ENOENT;
1971 }
1972
1973 int
qat_aefw_mof_find_uof(struct qat_softc * sc)1974 qat_aefw_mof_find_uof(struct qat_softc *sc)
1975 {
1976 struct mof_uof_hdr *uof_hdr, *suof_hdr;
1977 u_int nuof_chunks = 0, nsuof_chunks = 0;
1978 int error;
1979
1980 uof_hdr = sc->sc_mof.qmf_uof_objs;
1981 suof_hdr = sc->sc_mof.qmf_suof_objs;
1982
1983 if (uof_hdr != NULL) {
1984 if (uof_hdr->muh_max_chunks < uof_hdr->muh_num_chunks) {
1985 return EINVAL;
1986 }
1987 nuof_chunks = uof_hdr->muh_num_chunks;
1988 }
1989 if (suof_hdr != NULL) {
1990 if (suof_hdr->muh_max_chunks < suof_hdr->muh_num_chunks)
1991 return EINVAL;
1992 nsuof_chunks = suof_hdr->muh_num_chunks;
1993 }
1994
1995 if (nuof_chunks + nsuof_chunks == 0)
1996 return EINVAL;
1997
1998 if (uof_hdr != NULL) {
1999 error = qat_aefw_mof_find_uof0(sc, uof_hdr,
2000 (struct mof_uof_chunk_hdr *)(uof_hdr + 1), nuof_chunks,
2001 sc->sc_mof.qmf_uof_objs_size, UOF_IMAG,
2002 &sc->sc_fw_uof_size, &sc->sc_fw_uof);
2003 if (error && error != ENOENT)
2004 return error;
2005 }
2006
2007 if (suof_hdr != NULL) {
2008 error = qat_aefw_mof_find_uof0(sc, suof_hdr,
2009 (struct mof_uof_chunk_hdr *)(suof_hdr + 1), nsuof_chunks,
2010 sc->sc_mof.qmf_suof_objs_size, SUOF_IMAG,
2011 &sc->sc_fw_suof_size, &sc->sc_fw_suof);
2012 if (error && error != ENOENT)
2013 return error;
2014 }
2015
2016 if (sc->sc_fw_uof == NULL && sc->sc_fw_suof == NULL)
2017 return ENOENT;
2018
2019 return 0;
2020 }
2021
2022 int
qat_aefw_mof_parse(struct qat_softc * sc)2023 qat_aefw_mof_parse(struct qat_softc *sc)
2024 {
2025 struct mof_file_hdr *mfh;
2026 struct mof_file_chunk_hdr *mfch;
2027 size_t size;
2028 u_int csum;
2029 int error, i;
2030
2031 size = sc->sc_fw_mof_size;
2032
2033 if (size < sizeof(struct mof_file_hdr))
2034 return EINVAL;
2035 size -= sizeof(struct mof_file_hdr);
2036
2037 mfh = sc->sc_fw_mof;
2038
2039 if (mfh->mfh_fid != MOF_FID)
2040 return EINVAL;
2041
2042 csum = qat_aefw_csum((char *)((uintptr_t)sc->sc_fw_mof +
2043 offsetof(struct mof_file_hdr, mfh_min_ver)),
2044 sc->sc_fw_mof_size -
2045 offsetof(struct mof_file_hdr, mfh_min_ver));
2046 if (mfh->mfh_csum != csum)
2047 return EINVAL;
2048
2049 if (mfh->mfh_min_ver != MOF_MIN_VER ||
2050 mfh->mfh_maj_ver != MOF_MAJ_VER)
2051 return EINVAL;
2052
2053 if (mfh->mfh_max_chunks < mfh->mfh_num_chunks)
2054 return EINVAL;
2055
2056 if (size < sizeof(struct mof_file_chunk_hdr) * mfh->mfh_num_chunks)
2057 return EINVAL;
2058 mfch = (struct mof_file_chunk_hdr *)(mfh + 1);
2059
2060 for (i = 0; i < mfh->mfh_num_chunks; i++, mfch++) {
2061 if (mfch->mfch_offset + mfch->mfch_size > sc->sc_fw_mof_size)
2062 return EINVAL;
2063
2064 if (!strncmp(mfch->mfch_id, SYM_OBJS, MOF_OBJ_ID_LEN)) {
2065 if (sc->sc_mof.qmf_sym != NULL)
2066 return EINVAL;
2067
2068 sc->sc_mof.qmf_sym =
2069 (void *)((uintptr_t)sc->sc_fw_mof +
2070 (uintptr_t)mfch->mfch_offset + sizeof(u_int));
2071 sc->sc_mof.qmf_sym_size =
2072 *(u_int *)((uintptr_t)sc->sc_fw_mof +
2073 (uintptr_t)mfch->mfch_offset);
2074
2075 if (sc->sc_mof.qmf_sym_size % sizeof(u_int) != 0)
2076 return EINVAL;
2077 if (mfch->mfch_size != sc->sc_mof.qmf_sym_size +
2078 sizeof(u_int) || mfch->mfch_size == 0)
2079 return EINVAL;
2080 if (*(char *)((uintptr_t)sc->sc_mof.qmf_sym +
2081 sc->sc_mof.qmf_sym_size - 1) != '\0')
2082 return EINVAL;
2083
2084 } else if (!strncmp(mfch->mfch_id, UOF_OBJS, MOF_OBJ_ID_LEN)) {
2085 if (sc->sc_mof.qmf_uof_objs != NULL)
2086 return EINVAL;
2087
2088 sc->sc_mof.qmf_uof_objs =
2089 (void *)((uintptr_t)sc->sc_fw_mof +
2090 (uintptr_t)mfch->mfch_offset);
2091 sc->sc_mof.qmf_uof_objs_size = mfch->mfch_size;
2092
2093 } else if (!strncmp(mfch->mfch_id, SUOF_OBJS, MOF_OBJ_ID_LEN)) {
2094 if (sc->sc_mof.qmf_suof_objs != NULL)
2095 return EINVAL;
2096
2097 sc->sc_mof.qmf_suof_objs =
2098 (void *)((uintptr_t)sc->sc_fw_mof +
2099 (uintptr_t)mfch->mfch_offset);
2100 sc->sc_mof.qmf_suof_objs_size = mfch->mfch_size;
2101 }
2102 }
2103
2104 if (sc->sc_mof.qmf_sym == NULL ||
2105 (sc->sc_mof.qmf_uof_objs == NULL &&
2106 sc->sc_mof.qmf_suof_objs == NULL))
2107 return EINVAL;
2108
2109 error = qat_aefw_mof_find_uof(sc);
2110 if (error)
2111 return error;
2112 return 0;
2113 }
2114
2115 int
qat_aefw_uof_parse_image(struct qat_softc * sc,struct qat_uof_image * qui,struct uof_chunk_hdr * uch)2116 qat_aefw_uof_parse_image(struct qat_softc *sc,
2117 struct qat_uof_image *qui, struct uof_chunk_hdr *uch)
2118 {
2119 struct uof_image *image;
2120 struct uof_code_page *page;
2121 uintptr_t base = (uintptr_t)sc->sc_aefw_uof.qafu_obj_hdr;
2122 size_t lim = uch->uch_offset + uch->uch_size, size;
2123 int i, p;
2124
2125 size = uch->uch_size;
2126 if (size < sizeof(struct uof_image))
2127 return EINVAL;
2128 size -= sizeof(struct uof_image);
2129
2130 qui->qui_image = image =
2131 (struct uof_image *)(base + uch->uch_offset);
2132
2133 aprint_verbose_dev(sc->sc_dev,
2134 "uof_image name %s\n",
2135 qat_aefw_uof_string(sc, image->ui_name));
2136 aprint_verbose_dev(sc->sc_dev,
2137 "uof_image ae_assign 0x%08x ctx_assign 0x%08x cpu_type 0x%08x\n",
2138 image->ui_ae_assigned, image->ui_ctx_assigned, image->ui_cpu_type);
2139 aprint_verbose_dev(sc->sc_dev,
2140 "uof_image max_ver 0x%08x min_ver 0x%08x ae_mode 0x%08x\n",
2141 image->ui_max_ver, image->ui_min_ver, image->ui_ae_mode);
2142 aprint_verbose_dev(sc->sc_dev,
2143 "uof_image pages 0x%08x page regions 0x%08x\n",
2144 image->ui_num_pages, image->ui_num_page_regions);
2145
2146 #define ASSIGN_OBJ_TAB(np, typep, type, base, off, lim) \
2147 do { \
2148 u_int nent; \
2149 nent = ((struct uof_obj_table *)((base) + (off)))->uot_nentries;\
2150 if ((lim) < off + sizeof(struct uof_obj_table) + \
2151 sizeof(type) * nent) \
2152 return EINVAL; \
2153 *(np) = nent; \
2154 if (nent > 0) \
2155 *(typep) = (type)((struct uof_obj_table *) \
2156 ((base) + (off)) + 1); \
2157 else \
2158 *(typep) = NULL; \
2159 } while (0)
2160
2161 ASSIGN_OBJ_TAB(&qui->qui_num_ae_reg, &qui->qui_ae_reg,
2162 struct uof_ae_reg *, base, image->ui_reg_tab, lim);
2163 ASSIGN_OBJ_TAB(&qui->qui_num_init_reg_sym, &qui->qui_init_reg_sym,
2164 struct uof_init_reg_sym *, base, image->ui_init_reg_sym_tab, lim);
2165 ASSIGN_OBJ_TAB(&qui->qui_num_sbreak, &qui->qui_sbreak,
2166 struct qui_sbreak *, base, image->ui_sbreak_tab, lim);
2167
2168 if (size < sizeof(struct uof_code_page) * image->ui_num_pages)
2169 return EINVAL;
2170 if (__arraycount(qui->qui_pages) < image->ui_num_pages)
2171 return EINVAL;
2172
2173 page = (struct uof_code_page *)(image + 1);
2174
2175 for (p = 0; p < image->ui_num_pages; p++, page++) {
2176 struct qat_uof_page *qup = &qui->qui_pages[p];
2177 struct uof_code_area *uca;
2178
2179 qup->qup_page_num = page->ucp_page_num;
2180 qup->qup_def_page = page->ucp_def_page;
2181 qup->qup_page_region = page->ucp_page_region;
2182 qup->qup_beg_vaddr = page->ucp_beg_vaddr;
2183 qup->qup_beg_paddr = page->ucp_beg_paddr;
2184
2185 ASSIGN_OBJ_TAB(&qup->qup_num_uc_var, &qup->qup_uc_var,
2186 struct uof_uword_fixup *, base,
2187 page->ucp_uc_var_tab, lim);
2188 ASSIGN_OBJ_TAB(&qup->qup_num_imp_var, &qup->qup_imp_var,
2189 struct uof_import_var *, base,
2190 page->ucp_imp_var_tab, lim);
2191 ASSIGN_OBJ_TAB(&qup->qup_num_imp_expr, &qup->qup_imp_expr,
2192 struct uof_uword_fixup *, base,
2193 page->ucp_imp_expr_tab, lim);
2194 ASSIGN_OBJ_TAB(&qup->qup_num_neigh_reg, &qup->qup_neigh_reg,
2195 struct uof_uword_fixup *, base,
2196 page->ucp_neigh_reg_tab, lim);
2197
2198 if (lim < page->ucp_code_area + sizeof(struct uof_code_area))
2199 return EINVAL;
2200
2201 uca = (struct uof_code_area *)(base + page->ucp_code_area);
2202 qup->qup_num_micro_words = uca->uca_num_micro_words;
2203
2204 ASSIGN_OBJ_TAB(&qup->qup_num_uw_blocks, &qup->qup_uw_blocks,
2205 struct qat_uof_uword_block *, base,
2206 uca->uca_uword_block_tab, lim);
2207
2208 for (i = 0; i < qup->qup_num_uw_blocks; i++) {
2209 u_int uwordoff = ((struct uof_uword_block *)(
2210 &qup->qup_uw_blocks[i]))->uub_uword_offset;
2211
2212 if (lim < uwordoff)
2213 return EINVAL;
2214
2215 qup->qup_uw_blocks[i].quub_micro_words =
2216 (base + uwordoff);
2217 }
2218 }
2219
2220 #undef ASSIGN_OBJ_TAB
2221
2222 return 0;
2223 }
2224
2225 int
qat_aefw_uof_parse_images(struct qat_softc * sc)2226 qat_aefw_uof_parse_images(struct qat_softc *sc)
2227 {
2228 struct uof_chunk_hdr *uch = NULL;
2229 u_int assigned_ae;
2230 int i, error;
2231
2232 for (i = 0; i < MAX_NUM_AE * MAX_AE_CTX; i++) {
2233 uch = qat_aefw_uof_find_chunk(sc, UOF_IMAG, uch);
2234 if (uch == NULL)
2235 break;
2236
2237 if (i >= __arraycount(sc->sc_aefw_uof.qafu_imgs))
2238 return ENOENT;
2239
2240 error = qat_aefw_uof_parse_image(sc, &sc->sc_aefw_uof.qafu_imgs[i], uch);
2241 if (error)
2242 return error;
2243
2244 sc->sc_aefw_uof.qafu_num_imgs++;
2245 }
2246
2247 assigned_ae = 0;
2248 for (i = 0; i < sc->sc_aefw_uof.qafu_num_imgs; i++) {
2249 assigned_ae |= sc->sc_aefw_uof.qafu_imgs[i].qui_image->ui_ae_assigned;
2250 }
2251
2252 return 0;
2253 }
2254
2255 int
qat_aefw_uof_parse(struct qat_softc * sc)2256 qat_aefw_uof_parse(struct qat_softc *sc)
2257 {
2258 struct uof_file_hdr *ufh;
2259 struct uof_file_chunk_hdr *ufch;
2260 struct uof_obj_hdr *uoh;
2261 struct uof_chunk_hdr *uch;
2262 void *uof = NULL;
2263 size_t size, uof_size, hdr_size;
2264 uintptr_t base;
2265 u_int csum;
2266 int i;
2267
2268 size = sc->sc_fw_uof_size;
2269 if (size < MIN_UOF_SIZE)
2270 return EINVAL;
2271 size -= sizeof(struct uof_file_hdr);
2272
2273 ufh = sc->sc_fw_uof;
2274
2275 if (ufh->ufh_id != UOF_FID)
2276 return EINVAL;
2277 if (ufh->ufh_min_ver != UOF_MIN_VER || ufh->ufh_maj_ver != UOF_MAJ_VER)
2278 return EINVAL;
2279
2280 if (ufh->ufh_max_chunks < ufh->ufh_num_chunks)
2281 return EINVAL;
2282 if (size < sizeof(struct uof_file_chunk_hdr) * ufh->ufh_num_chunks)
2283 return EINVAL;
2284 ufch = (struct uof_file_chunk_hdr *)(ufh + 1);
2285
2286 uof_size = 0;
2287 for (i = 0; i < ufh->ufh_num_chunks; i++, ufch++) {
2288 if (ufch->ufch_offset + ufch->ufch_size > sc->sc_fw_uof_size)
2289 return EINVAL;
2290
2291 if (!strncmp(ufch->ufch_id, UOF_OBJS, UOF_OBJ_ID_LEN)) {
2292 if (uof != NULL)
2293 return EINVAL;
2294
2295 uof =
2296 (void *)((uintptr_t)sc->sc_fw_uof +
2297 ufch->ufch_offset);
2298 uof_size = ufch->ufch_size;
2299
2300 csum = qat_aefw_csum(uof, uof_size);
2301 if (csum != ufch->ufch_csum)
2302 return EINVAL;
2303
2304 aprint_verbose_dev(sc->sc_dev,
2305 "uof at %p size 0x%lx\n",
2306 uof, uof_size);
2307 }
2308 }
2309
2310 if (uof == NULL)
2311 return ENOENT;
2312
2313 size = uof_size;
2314 if (size < sizeof(struct uof_obj_hdr))
2315 return EINVAL;
2316 size -= sizeof(struct uof_obj_hdr);
2317
2318 uoh = uof;
2319
2320 aprint_verbose_dev(sc->sc_dev,
2321 "uof cpu_type 0x%08x min_cpu_ver 0x%04x max_cpu_ver 0x%04x\n",
2322 uoh->uoh_cpu_type, uoh->uoh_min_cpu_ver, uoh->uoh_max_cpu_ver);
2323
2324 if (size < sizeof(struct uof_chunk_hdr) * uoh->uoh_num_chunks)
2325 return EINVAL;
2326
2327 /* Check if the UOF objects are compatible with the chip */
2328 if ((uoh->uoh_cpu_type & sc->sc_hw.qhw_prod_type) == 0)
2329 return ENOTSUP;
2330
2331 if (uoh->uoh_min_cpu_ver > sc->sc_rev ||
2332 uoh->uoh_max_cpu_ver < sc->sc_rev)
2333 return ENOTSUP;
2334
2335 sc->sc_aefw_uof.qafu_size = uof_size;
2336 sc->sc_aefw_uof.qafu_obj_hdr = uoh;
2337
2338 base = (uintptr_t)sc->sc_aefw_uof.qafu_obj_hdr;
2339
2340 /* map uof string-table */
2341 uch = qat_aefw_uof_find_chunk(sc, UOF_STRT, NULL);
2342 if (uch != NULL) {
2343 hdr_size = offsetof(struct uof_str_tab, ust_strings);
2344 sc->sc_aefw_uof.qafu_str_tab =
2345 (void *)(base + uch->uch_offset + hdr_size);
2346 sc->sc_aefw_uof.qafu_str_tab_size = uch->uch_size - hdr_size;
2347 }
2348
2349 /* get ustore mem inits table -- should be only one */
2350 uch = qat_aefw_uof_find_chunk(sc, UOF_IMEM, NULL);
2351 if (uch != NULL) {
2352 if (uch->uch_size < sizeof(struct uof_obj_table))
2353 return EINVAL;
2354 sc->sc_aefw_uof.qafu_num_init_mem = ((struct uof_obj_table *)(base +
2355 uch->uch_offset))->uot_nentries;
2356 if (sc->sc_aefw_uof.qafu_num_init_mem) {
2357 sc->sc_aefw_uof.qafu_init_mem =
2358 (struct uof_init_mem *)(base + uch->uch_offset +
2359 sizeof(struct uof_obj_table));
2360 sc->sc_aefw_uof.qafu_init_mem_size =
2361 uch->uch_size - sizeof(struct uof_obj_table);
2362 }
2363 }
2364
2365 uch = qat_aefw_uof_find_chunk(sc, UOF_MSEG, NULL);
2366 if (uch != NULL) {
2367 if (uch->uch_size < sizeof(struct uof_obj_table) +
2368 sizeof(struct uof_var_mem_seg))
2369 return EINVAL;
2370 sc->sc_aefw_uof.qafu_var_mem_seg =
2371 (struct uof_var_mem_seg *)(base + uch->uch_offset +
2372 sizeof(struct uof_obj_table));
2373 }
2374
2375 return qat_aefw_uof_parse_images(sc);
2376 }
2377
2378 int
qat_aefw_suof_parse_image(struct qat_softc * sc,struct qat_suof_image * qsi,struct suof_chunk_hdr * sch)2379 qat_aefw_suof_parse_image(struct qat_softc *sc, struct qat_suof_image *qsi,
2380 struct suof_chunk_hdr *sch)
2381 {
2382 struct qat_aefw_suof *qafs = &sc->sc_aefw_suof;
2383 struct simg_ae_mode *ae_mode;
2384 u_int maj_ver;
2385
2386 qsi->qsi_simg_buf = qafs->qafs_suof_buf + sch->sch_offset +
2387 sizeof(struct suof_obj_hdr);
2388 qsi->qsi_simg_len =
2389 ((struct suof_obj_hdr *)
2390 (qafs->qafs_suof_buf + sch->sch_offset))->soh_img_length;
2391
2392 qsi->qsi_css_header = qsi->qsi_simg_buf;
2393 qsi->qsi_css_key = qsi->qsi_css_header + sizeof(struct css_hdr);
2394 qsi->qsi_css_signature = qsi->qsi_css_key +
2395 CSS_FWSK_MODULUS_LEN + CSS_FWSK_EXPONENT_LEN;
2396 qsi->qsi_css_simg = qsi->qsi_css_signature + CSS_SIGNATURE_LEN;
2397
2398 ae_mode = (struct simg_ae_mode *)qsi->qsi_css_simg;
2399 qsi->qsi_ae_mask = ae_mode->sam_ae_mask;
2400 qsi->qsi_simg_name = (u_long)&ae_mode->sam_simg_name;
2401 qsi->qsi_appmeta_data = (u_long)&ae_mode->sam_appmeta_data;
2402 qsi->qsi_fw_type = ae_mode->sam_fw_type;
2403
2404 if (ae_mode->sam_dev_type != sc->sc_hw.qhw_prod_type)
2405 return EINVAL;
2406
2407 maj_ver = (QAT_PID_MAJOR_REV | (sc->sc_rev & QAT_PID_MINOR_REV)) & 0xff;
2408 if ((maj_ver > ae_mode->sam_devmax_ver) ||
2409 (maj_ver < ae_mode->sam_devmin_ver)) {
2410 return EINVAL;
2411 }
2412
2413 return 0;
2414 }
2415
2416 int
qat_aefw_suof_parse(struct qat_softc * sc)2417 qat_aefw_suof_parse(struct qat_softc *sc)
2418 {
2419 struct suof_file_hdr *sfh;
2420 struct suof_chunk_hdr *sch;
2421 struct qat_aefw_suof *qafs = &sc->sc_aefw_suof;
2422 struct qat_suof_image *qsi;
2423 size_t size;
2424 u_int csum;
2425 int ae0_img = MAX_AE;
2426 int i, error;
2427
2428 size = sc->sc_fw_suof_size;
2429 if (size < sizeof(struct suof_file_hdr))
2430 return EINVAL;
2431
2432 sfh = sc->sc_fw_suof;
2433
2434 if (sfh->sfh_file_id != SUOF_FID)
2435 return EINVAL;
2436 if (sfh->sfh_fw_type != 0)
2437 return EINVAL;
2438 if (sfh->sfh_num_chunks <= 1)
2439 return EINVAL;
2440 if (sfh->sfh_min_ver != SUOF_MIN_VER ||
2441 sfh->sfh_maj_ver != SUOF_MAJ_VER)
2442 return EINVAL;
2443
2444 csum = qat_aefw_csum((char *)&sfh->sfh_min_ver,
2445 size - offsetof(struct suof_file_hdr, sfh_min_ver));
2446 if (csum != sfh->sfh_check_sum)
2447 return EINVAL;
2448
2449 size -= sizeof(struct suof_file_hdr);
2450
2451 qafs->qafs_file_id = SUOF_FID;
2452 qafs->qafs_suof_buf = sc->sc_fw_suof;
2453 qafs->qafs_suof_size = sc->sc_fw_suof_size;
2454 qafs->qafs_check_sum = sfh->sfh_check_sum;
2455 qafs->qafs_min_ver = sfh->sfh_min_ver;
2456 qafs->qafs_maj_ver = sfh->sfh_maj_ver;
2457 qafs->qafs_fw_type = sfh->sfh_fw_type;
2458
2459 if (size < sizeof(struct suof_chunk_hdr))
2460 return EINVAL;
2461 sch = (struct suof_chunk_hdr *)(sfh + 1);
2462 size -= sizeof(struct suof_chunk_hdr);
2463
2464 if (size < sizeof(struct suof_str_tab))
2465 return EINVAL;
2466 size -= offsetof(struct suof_str_tab, sst_strings);
2467
2468 qafs->qafs_sym_size = ((struct suof_str_tab *)
2469 (qafs->qafs_suof_buf + sch->sch_offset))->sst_tab_length;
2470 if (size < qafs->qafs_sym_size)
2471 return EINVAL;
2472 qafs->qafs_sym_str = qafs->qafs_suof_buf + sch->sch_offset +
2473 offsetof(struct suof_str_tab, sst_strings);
2474
2475 qafs->qafs_num_simgs = sfh->sfh_num_chunks - 1;
2476 if (qafs->qafs_num_simgs == 0)
2477 return EINVAL;
2478
2479 qsi = qat_alloc_mem(
2480 sizeof(struct qat_suof_image) * qafs->qafs_num_simgs);
2481 qafs->qafs_simg = qsi;
2482
2483 for (i = 0; i < qafs->qafs_num_simgs; i++) {
2484 error = qat_aefw_suof_parse_image(sc, &qsi[i], &sch[i + 1]);
2485 if (error)
2486 return error;
2487 if ((qsi[i].qsi_ae_mask & 0x1) != 0)
2488 ae0_img = i;
2489 }
2490
2491 if (ae0_img != qafs->qafs_num_simgs - 1) {
2492 struct qat_suof_image last_qsi;
2493
2494 memcpy(&last_qsi, &qsi[qafs->qafs_num_simgs - 1],
2495 sizeof(struct qat_suof_image));
2496 memcpy(&qsi[qafs->qafs_num_simgs - 1], &qsi[ae0_img],
2497 sizeof(struct qat_suof_image));
2498 memcpy(&qsi[ae0_img], &last_qsi,
2499 sizeof(struct qat_suof_image));
2500 }
2501
2502 return 0;
2503 }
2504
2505 int
qat_aefw_alloc_auth_dmamem(struct qat_softc * sc,char * image,size_t size,struct qat_dmamem * dma)2506 qat_aefw_alloc_auth_dmamem(struct qat_softc *sc, char *image, size_t size,
2507 struct qat_dmamem *dma)
2508 {
2509 struct css_hdr *css = (struct css_hdr *)image;
2510 struct auth_chunk *auth_chunk;
2511 struct fw_auth_desc *auth_desc;
2512 size_t mapsize, simg_offset = sizeof(struct auth_chunk);
2513 bus_size_t bus_addr;
2514 uintptr_t virt_addr;
2515 int error;
2516
2517 if (size > AE_IMG_OFFSET + CSS_MAX_IMAGE_LEN)
2518 return EINVAL;
2519
2520 mapsize = (css->css_fw_type == CSS_AE_FIRMWARE) ?
2521 CSS_AE_SIMG_LEN + simg_offset :
2522 size + CSS_FWSK_PAD_LEN + simg_offset;
2523 error = qat_alloc_dmamem(sc, dma, mapsize, PAGE_SIZE);
2524 if (error)
2525 return error;
2526
2527 memset(dma->qdm_dma_vaddr, 0, mapsize);
2528
2529 auth_chunk = dma->qdm_dma_vaddr;
2530 auth_chunk->ac_chunk_size = mapsize;
2531 auth_chunk->ac_chunk_bus_addr = dma->qdm_dma_map->dm_segs[0].ds_addr;
2532
2533 virt_addr = (uintptr_t)dma->qdm_dma_vaddr;
2534 virt_addr += simg_offset;
2535 bus_addr = auth_chunk->ac_chunk_bus_addr;
2536 bus_addr += simg_offset;
2537
2538 auth_desc = &auth_chunk->ac_fw_auth_desc;
2539 auth_desc->fad_css_hdr_high = bus_addr >> 32;
2540 auth_desc->fad_css_hdr_low = bus_addr;
2541
2542 memcpy((void *)virt_addr, image, sizeof(struct css_hdr));
2543 /* pub key */
2544 virt_addr += sizeof(struct css_hdr);
2545 bus_addr += sizeof(struct css_hdr);
2546 image += sizeof(struct css_hdr);
2547
2548 auth_desc->fad_fwsk_pub_high = bus_addr >> 32;
2549 auth_desc->fad_fwsk_pub_low = bus_addr;
2550
2551 memcpy((void *)virt_addr, image, CSS_FWSK_MODULUS_LEN);
2552 memset((void *)(virt_addr + CSS_FWSK_MODULUS_LEN), 0, CSS_FWSK_PAD_LEN);
2553 memcpy((void *)(virt_addr + CSS_FWSK_MODULUS_LEN + CSS_FWSK_PAD_LEN),
2554 image + CSS_FWSK_MODULUS_LEN, sizeof(uint32_t));
2555
2556 virt_addr += CSS_FWSK_PUB_LEN;
2557 bus_addr += CSS_FWSK_PUB_LEN;
2558 image += CSS_FWSK_MODULUS_LEN + CSS_FWSK_EXPONENT_LEN;
2559
2560 auth_desc->fad_signature_high = bus_addr >> 32;
2561 auth_desc->fad_signature_low = bus_addr;
2562
2563 memcpy((void *)virt_addr, image, CSS_SIGNATURE_LEN);
2564 #ifdef QAT_DUMP
2565 qat_dump_raw(QAT_DUMP_AEFW, "aefw signature", image, CSS_SIGNATURE_LEN);
2566 #endif
2567
2568 virt_addr += CSS_SIGNATURE_LEN;
2569 bus_addr += CSS_SIGNATURE_LEN;
2570 image += CSS_SIGNATURE_LEN;
2571
2572 auth_desc->fad_img_high = bus_addr >> 32;
2573 auth_desc->fad_img_low = bus_addr;
2574 auth_desc->fad_img_len = size - AE_IMG_OFFSET;
2575
2576 memcpy((void *)virt_addr, image, auth_desc->fad_img_len);
2577
2578 if (css->css_fw_type == CSS_AE_FIRMWARE) {
2579 auth_desc->fad_img_ae_mode_data_high = auth_desc->fad_img_high;
2580 auth_desc->fad_img_ae_mode_data_low = auth_desc->fad_img_low;
2581
2582 bus_addr += sizeof(struct simg_ae_mode);
2583
2584 auth_desc->fad_img_ae_init_data_high = bus_addr >> 32;
2585 auth_desc->fad_img_ae_init_data_low = bus_addr;
2586
2587 bus_addr += SIMG_AE_INIT_SEQ_LEN;
2588
2589 auth_desc->fad_img_ae_insts_high = bus_addr >> 32;
2590 auth_desc->fad_img_ae_insts_low = bus_addr;
2591 } else {
2592 auth_desc->fad_img_ae_insts_high = auth_desc->fad_img_high;
2593 auth_desc->fad_img_ae_insts_low = auth_desc->fad_img_low;
2594 }
2595
2596 bus_dmamap_sync(sc->sc_dmat, dma->qdm_dma_map, 0,
2597 dma->qdm_dma_map->dm_mapsize,
2598 BUS_DMASYNC_PREWRITE | BUS_DMASYNC_PREREAD);
2599
2600 return 0;
2601 }
2602
2603 int
qat_aefw_auth(struct qat_softc * sc,struct qat_dmamem * dma)2604 qat_aefw_auth(struct qat_softc *sc, struct qat_dmamem *dma)
2605 {
2606 bus_addr_t addr = dma->qdm_dma_map->dm_segs[0].ds_addr;
2607 uint32_t fcu, sts;
2608 int retry = 0;
2609
2610 qat_cap_global_write_4(sc, FCU_DRAM_ADDR_HI, addr >> 32);
2611 qat_cap_global_write_4(sc, FCU_DRAM_ADDR_LO, addr);
2612 qat_cap_global_write_4(sc, FCU_CTRL, FCU_CTRL_CMD_AUTH);
2613
2614 do {
2615 delay(FW_AUTH_WAIT_PERIOD * 1000);
2616 fcu = qat_cap_global_read_4(sc, FCU_STATUS);
2617 sts = __SHIFTOUT(fcu, FCU_STATUS_STS);
2618 if (sts == FCU_STATUS_STS_VERI_FAIL)
2619 goto fail;
2620 if (fcu & FCU_STATUS_AUTHFWLD &&
2621 sts == FCU_STATUS_STS_VERI_DONE) {
2622 return 0;
2623 }
2624 } while (retry++ < FW_AUTH_MAX_RETRY);
2625
2626 fail:
2627 aprint_error_dev(sc->sc_dev,
2628 "firmware authentication error: status 0x%08x retry %d\n",
2629 fcu, retry);
2630 return EINVAL;
2631 }
2632
2633 int
qat_aefw_suof_load(struct qat_softc * sc,struct qat_dmamem * dma)2634 qat_aefw_suof_load(struct qat_softc *sc, struct qat_dmamem *dma)
2635 {
2636 struct simg_ae_mode *ae_mode;
2637 uint32_t fcu, sts, loaded;
2638 u_int mask;
2639 u_char ae;
2640 int retry = 0;
2641
2642 ae_mode = (struct simg_ae_mode *)((uintptr_t)dma->qdm_dma_vaddr +
2643 sizeof(struct auth_chunk) + sizeof(struct css_hdr) +
2644 CSS_FWSK_PUB_LEN + CSS_SIGNATURE_LEN);
2645
2646 for (ae = 0, mask = sc->sc_ae_mask; mask; ae++, mask >>= 1) {
2647 if (!(mask & 1))
2648 continue;
2649 if (!((ae_mode->sam_ae_mask >> ae) & 0x1))
2650 continue;
2651 if (qat_ae_is_active(sc, ae)) {
2652 aprint_error_dev(sc->sc_dev, "AE %d is active\n", ae);
2653 return EINVAL;
2654 }
2655 qat_cap_global_write_4(sc, FCU_CTRL,
2656 FCU_CTRL_CMD_LOAD | __SHIFTIN(ae, FCU_CTRL_AE));
2657 do {
2658 delay(FW_AUTH_WAIT_PERIOD * 1000);
2659 fcu = qat_cap_global_read_4(sc, FCU_STATUS);
2660 sts = __SHIFTOUT(fcu, FCU_STATUS_STS);
2661 loaded = __SHIFTOUT(fcu, FCU_STATUS_LOADED_AE);
2662 if (sts == FCU_STATUS_STS_LOAD_DONE &&
2663 (loaded & (1 << ae))) {
2664 break;
2665 }
2666 } while (retry++ < FW_AUTH_MAX_RETRY);
2667
2668 if (retry > FW_AUTH_MAX_RETRY) {
2669 aprint_error_dev(sc->sc_dev,
2670 "firmware load timeout: status %08x\n", fcu);
2671 return EINVAL;
2672 }
2673 }
2674
2675 return 0;
2676 }
2677
2678 int
qat_aefw_suof_write(struct qat_softc * sc)2679 qat_aefw_suof_write(struct qat_softc *sc)
2680 {
2681 struct qat_suof_image *qsi = NULL;
2682 int i, error = 0;
2683
2684 for (i = 0; i < sc->sc_aefw_suof.qafs_num_simgs; i++) {
2685 qsi = &sc->sc_aefw_suof.qafs_simg[i];
2686 error = qat_aefw_alloc_auth_dmamem(sc, qsi->qsi_simg_buf,
2687 qsi->qsi_simg_len, &qsi->qsi_dma);
2688 if (error)
2689 return error;
2690 error = qat_aefw_auth(sc, &qsi->qsi_dma);
2691 if (error)
2692 goto fail;
2693 error = qat_aefw_suof_load(sc, &qsi->qsi_dma);
2694 if (error)
2695 goto fail;
2696
2697 qat_free_dmamem(sc, &qsi->qsi_dma);
2698 }
2699
2700 return 0;
2701 fail:
2702 if (qsi != NULL)
2703 qat_free_dmamem(sc, &qsi->qsi_dma);
2704 return error;
2705 }
2706
2707 int
qat_aefw_uof_assign_image(struct qat_softc * sc,struct qat_ae * qae,struct qat_uof_image * qui)2708 qat_aefw_uof_assign_image(struct qat_softc *sc, struct qat_ae *qae,
2709 struct qat_uof_image *qui)
2710 {
2711 struct qat_ae_slice *slice;
2712 int i, npages, nregions;
2713
2714 if (qae->qae_num_slices >= __arraycount(qae->qae_slices))
2715 return ENOENT;
2716
2717 if (qui->qui_image->ui_ae_mode &
2718 (AE_MODE_RELOAD_CTX_SHARED | AE_MODE_SHARED_USTORE)) {
2719 /* XXX */
2720 aprint_error_dev(sc->sc_dev,
2721 "shared ae mode is not supported yet\n");
2722 return ENOTSUP;
2723 }
2724
2725 qae->qae_shareable_ustore = 0; /* XXX */
2726 qae->qae_effect_ustore_size = USTORE_SIZE;
2727
2728 slice = &qae->qae_slices[qae->qae_num_slices];
2729
2730 slice->qas_image = qui;
2731 slice->qas_assigned_ctx_mask = qui->qui_image->ui_ctx_assigned;
2732
2733 nregions = qui->qui_image->ui_num_page_regions;
2734 npages = qui->qui_image->ui_num_pages;
2735
2736 if (nregions > __arraycount(slice->qas_regions))
2737 return ENOENT;
2738 if (npages > __arraycount(slice->qas_pages))
2739 return ENOENT;
2740
2741 for (i = 0; i < nregions; i++) {
2742 SIMPLEQ_INIT(&slice->qas_regions[i].qar_waiting_pages);
2743 }
2744 for (i = 0; i < npages; i++) {
2745 struct qat_ae_page *page = &slice->qas_pages[i];
2746 int region;
2747
2748 page->qap_page = &qui->qui_pages[i];
2749 region = page->qap_page->qup_page_region;
2750 if (region >= nregions)
2751 return EINVAL;
2752
2753 page->qap_region = &slice->qas_regions[region];
2754 aprint_verbose_dev(sc->sc_dev,
2755 "ae %p slice %d page %d assign region %d\n",
2756 qae, qae->qae_num_slices, i, region);
2757 }
2758
2759 qae->qae_num_slices++;
2760
2761 return 0;
2762 }
2763
2764 int
qat_aefw_uof_init_ae(struct qat_softc * sc,u_char ae)2765 qat_aefw_uof_init_ae(struct qat_softc *sc, u_char ae)
2766 {
2767 struct uof_image *image;
2768 struct qat_ae *qae = &(QAT_AE(sc, ae));
2769 int s;
2770 u_char nn_mode;
2771
2772 for (s = 0; s < qae->qae_num_slices; s++) {
2773 if (qae->qae_slices[s].qas_image == NULL)
2774 continue;
2775
2776 image = qae->qae_slices[s].qas_image->qui_image;
2777 qat_ae_write_ctx_mode(sc, ae,
2778 __SHIFTOUT(image->ui_ae_mode, AE_MODE_CTX_MODE));
2779
2780 nn_mode = __SHIFTOUT(image->ui_ae_mode, AE_MODE_NN_MODE);
2781 if (nn_mode != AE_MODE_NN_MODE_DONTCARE)
2782 qat_ae_write_nn_mode(sc, ae, nn_mode);
2783
2784 qat_ae_write_lm_mode(sc, ae, AEREG_LMEM0,
2785 __SHIFTOUT(image->ui_ae_mode, AE_MODE_LMEM0));
2786 qat_ae_write_lm_mode(sc, ae, AEREG_LMEM1,
2787 __SHIFTOUT(image->ui_ae_mode, AE_MODE_LMEM1));
2788
2789 qat_ae_write_shared_cs_mode(sc, ae,
2790 __SHIFTOUT(image->ui_ae_mode, AE_MODE_SHARED_USTORE));
2791 qat_ae_set_reload_ustore(sc, ae, image->ui_reloadable_size,
2792 __SHIFTOUT(image->ui_ae_mode, AE_MODE_RELOAD_CTX_SHARED),
2793 qae->qae_reloc_ustore_dram);
2794 }
2795
2796 return 0;
2797 }
2798
2799 int
qat_aefw_uof_init(struct qat_softc * sc)2800 qat_aefw_uof_init(struct qat_softc *sc)
2801 {
2802 int ae, i, error;
2803 uint32_t mask;
2804
2805 for (ae = 0, mask = sc->sc_ae_mask; mask; ae++, mask >>= 1) {
2806 struct qat_ae *qae;
2807
2808 if (!(mask & 1))
2809 continue;
2810
2811 qae = &(QAT_AE(sc, ae));
2812
2813 for (i = 0; i < sc->sc_aefw_uof.qafu_num_imgs; i++) {
2814 if ((sc->sc_aefw_uof.qafu_imgs[i].qui_image->ui_ae_assigned &
2815 (1 << ae)) == 0)
2816 continue;
2817
2818 error = qat_aefw_uof_assign_image(sc, qae,
2819 &sc->sc_aefw_uof.qafu_imgs[i]);
2820 if (error)
2821 return error;
2822 }
2823
2824 /* XXX UcLo_initNumUwordUsed */
2825
2826 qae->qae_reloc_ustore_dram = UINT_MAX; /* XXX */
2827
2828 error = qat_aefw_uof_init_ae(sc, ae);
2829 if (error)
2830 return error;
2831 }
2832
2833 return 0;
2834 }
2835
2836 int
qat_aefw_load(struct qat_softc * sc)2837 qat_aefw_load(struct qat_softc *sc)
2838 {
2839 int error;
2840
2841 error = qat_aefw_load_mof(sc);
2842 if (error)
2843 return error;
2844
2845 error = qat_aefw_load_mmp(sc);
2846 if (error)
2847 return error;
2848
2849 error = qat_aefw_mof_parse(sc);
2850 if (error) {
2851 aprint_error_dev(sc->sc_dev, "couldn't parse mof: %d\n", error);
2852 return error;
2853 }
2854
2855 if (sc->sc_hw.qhw_fw_auth) {
2856 error = qat_aefw_suof_parse(sc);
2857 if (error) {
2858 aprint_error_dev(sc->sc_dev, "couldn't parse suof: %d\n",
2859 error);
2860 return error;
2861 }
2862
2863 error = qat_aefw_suof_write(sc);
2864 if (error) {
2865 aprint_error_dev(sc->sc_dev,
2866 "could not write firmware: %d\n", error);
2867 return error;
2868 }
2869
2870 } else {
2871 error = qat_aefw_uof_parse(sc);
2872 if (error) {
2873 aprint_error_dev(sc->sc_dev, "couldn't parse uof: %d\n",
2874 error);
2875 return error;
2876 }
2877
2878 error = qat_aefw_uof_init(sc);
2879 if (error) {
2880 aprint_error_dev(sc->sc_dev,
2881 "couldn't init for aefw: %d\n", error);
2882 return error;
2883 }
2884
2885 error = qat_aefw_uof_write(sc);
2886 if (error) {
2887 aprint_error_dev(sc->sc_dev,
2888 "Could not write firmware: %d\n", error);
2889 return error;
2890 }
2891 }
2892
2893 return 0;
2894 }
2895
2896 int
qat_aefw_start(struct qat_softc * sc,u_char ae,u_int ctx_mask)2897 qat_aefw_start(struct qat_softc *sc, u_char ae, u_int ctx_mask)
2898 {
2899 uint32_t fcu;
2900 int retry = 0;
2901
2902 if (sc->sc_hw.qhw_fw_auth) {
2903 qat_cap_global_write_4(sc, FCU_CTRL, FCU_CTRL_CMD_START);
2904 do {
2905 delay(FW_AUTH_WAIT_PERIOD * 1000);
2906 fcu = qat_cap_global_read_4(sc, FCU_STATUS);
2907 if (fcu & FCU_STATUS_DONE)
2908 return 0;
2909 } while (retry++ < FW_AUTH_MAX_RETRY);
2910
2911 aprint_error_dev(sc->sc_dev,
2912 "firmware start timeout: status %08x\n", fcu);
2913 return EINVAL;
2914 } else {
2915 qat_ae_ctx_indr_write(sc, ae, (~ctx_mask) & AE_ALL_CTX,
2916 CTX_WAKEUP_EVENTS_INDIRECT,
2917 CTX_WAKEUP_EVENTS_INDIRECT_SLEEP);
2918 qat_ae_enable_ctx(sc, ae, ctx_mask);
2919 }
2920
2921 return 0;
2922 }
2923
2924 int
qat_aefw_init_memory_one(struct qat_softc * sc,struct uof_init_mem * uim)2925 qat_aefw_init_memory_one(struct qat_softc *sc, struct uof_init_mem *uim)
2926 {
2927 struct qat_aefw_uof *qafu = &sc->sc_aefw_uof;
2928 struct qat_ae_batch_init_list *qabi_list;
2929 struct uof_mem_val_attr *memattr;
2930 size_t *curinit;
2931 u_long ael;
2932 int i;
2933 const char *sym;
2934 char *ep;
2935
2936 memattr = (struct uof_mem_val_attr *)(uim + 1);
2937
2938 switch (uim->uim_region) {
2939 case LMEM_REGION:
2940 if ((uim->uim_addr + uim->uim_num_bytes) > MAX_LMEM_REG * 4) {
2941 aprint_error_dev(sc->sc_dev,
2942 "Invalid lmem addr or bytes\n");
2943 return ENOBUFS;
2944 }
2945 if (uim->uim_scope != UOF_SCOPE_LOCAL)
2946 return EINVAL;
2947 sym = qat_aefw_uof_string(sc, uim->uim_sym_name);
2948 ael = strtoul(sym, &ep, 10);
2949 if (ep == sym || ael > MAX_AE)
2950 return EINVAL;
2951 if ((sc->sc_ae_mask & (1 << ael)) == 0)
2952 return 0; /* ae is fused out */
2953
2954 curinit = &qafu->qafu_num_lm_init[ael];
2955 qabi_list = &qafu->qafu_lm_init[ael];
2956
2957 for (i = 0; i < uim->uim_num_val_attr; i++, memattr++) {
2958 struct qat_ae_batch_init *qabi;
2959
2960 qabi = qat_alloc_mem(sizeof(struct qat_ae_batch_init));
2961 if (*curinit == 0)
2962 SIMPLEQ_INIT(qabi_list);
2963 SIMPLEQ_INSERT_TAIL(qabi_list, qabi, qabi_next);
2964
2965 qabi->qabi_ae = (u_int)ael;
2966 qabi->qabi_addr =
2967 uim->uim_addr + memattr->umva_byte_offset;
2968 qabi->qabi_value = &memattr->umva_value;
2969 qabi->qabi_size = 4;
2970 qafu->qafu_num_lm_init_inst[ael] +=
2971 qat_ae_get_inst_num(qabi->qabi_size);
2972 (*curinit)++;
2973 if (*curinit >= MAX_LMEM_REG) {
2974 aprint_error_dev(sc->sc_dev,
2975 "Invalid lmem val attr\n");
2976 return ENOBUFS;
2977 }
2978 }
2979 break;
2980 case SRAM_REGION:
2981 case DRAM_REGION:
2982 case DRAM1_REGION:
2983 case SCRATCH_REGION:
2984 case UMEM_REGION:
2985 /* XXX */
2986 /* fallthrough */
2987 default:
2988 aprint_error_dev(sc->sc_dev,
2989 "unsupported memory region to init: %d\n",
2990 uim->uim_region);
2991 return ENOTSUP;
2992 }
2993
2994 return 0;
2995 }
2996
2997 void
qat_aefw_free_lm_init(struct qat_softc * sc,u_char ae)2998 qat_aefw_free_lm_init(struct qat_softc *sc, u_char ae)
2999 {
3000 struct qat_aefw_uof *qafu = &sc->sc_aefw_uof;
3001 struct qat_ae_batch_init *qabi;
3002
3003 while ((qabi = SIMPLEQ_FIRST(&qafu->qafu_lm_init[ae])) != NULL) {
3004 SIMPLEQ_REMOVE_HEAD(&qafu->qafu_lm_init[ae], qabi_next);
3005 qat_free_mem(qabi);
3006 }
3007
3008 qafu->qafu_num_lm_init[ae] = 0;
3009 qafu->qafu_num_lm_init_inst[ae] = 0;
3010 }
3011
3012 int
qat_aefw_init_ustore(struct qat_softc * sc)3013 qat_aefw_init_ustore(struct qat_softc *sc)
3014 {
3015 uint64_t *fill;
3016 uint32_t dont_init;
3017 int a, i, p;
3018 int error = 0;
3019 int usz, end, start;
3020 u_char ae, nae;
3021
3022 fill = qat_alloc_mem(MAX_USTORE * sizeof(uint64_t));
3023
3024 for (a = 0; a < sc->sc_aefw_uof.qafu_num_imgs; a++) {
3025 struct qat_uof_image *qui = &sc->sc_aefw_uof.qafu_imgs[a];
3026 struct uof_image *ui = qui->qui_image;
3027
3028 for (i = 0; i < MAX_USTORE; i++)
3029 memcpy(&fill[i], ui->ui_fill_pattern, sizeof(uint64_t));
3030 /*
3031 * Compute do_not_init value as a value that will not be equal
3032 * to fill data when cast to an int
3033 */
3034 dont_init = 0;
3035 if (dont_init == (uint32_t)fill[0])
3036 dont_init = 0xffffffff;
3037
3038 for (p = 0; p < ui->ui_num_pages; p++) {
3039 struct qat_uof_page *qup = &qui->qui_pages[p];
3040 if (!qup->qup_def_page)
3041 continue;
3042
3043 for (i = qup->qup_beg_paddr;
3044 i < qup->qup_beg_paddr + qup->qup_num_micro_words;
3045 i++ ) {
3046 fill[i] = (uint64_t)dont_init;
3047 }
3048 }
3049
3050 for (ae = 0; ae < sc->sc_ae_num; ae++) {
3051 KASSERT(ae < UOF_MAX_NUM_OF_AE);
3052 if ((ui->ui_ae_assigned & (1 << ae)) == 0)
3053 continue;
3054
3055 if (QAT_AE(sc, ae).qae_shareable_ustore && (ae & 1)) {
3056 qat_ae_get_shared_ustore_ae(ae, &nae);
3057 if (ui->ui_ae_assigned & (1 << ae))
3058 continue;
3059 }
3060 usz = QAT_AE(sc, ae).qae_effect_ustore_size;
3061
3062 /* initialize the areas not going to be overwritten */
3063 end = -1;
3064 do {
3065 /* find next uword that needs to be initialized */
3066 for (start = end + 1; start < usz; start++) {
3067 if ((uint32_t)fill[start] != dont_init)
3068 break;
3069 }
3070 /* see if there are no more such uwords */
3071 if (start >= usz)
3072 break;
3073 for (end = start + 1; end < usz; end++) {
3074 if ((uint32_t)fill[end] == dont_init)
3075 break;
3076 }
3077 if (QAT_AE(sc, ae).qae_shareable_ustore) {
3078 error = ENOTSUP; /* XXX */
3079 goto out;
3080 } else {
3081 error = qat_ae_ucode_write(sc, ae,
3082 start, end - start, &fill[start]);
3083 if (error) {
3084 goto out;
3085 }
3086 }
3087
3088 } while (end < usz);
3089 }
3090 }
3091
3092 out:
3093 qat_free_mem(fill);
3094 return error;
3095 }
3096
3097 int
qat_aefw_init_reg(struct qat_softc * sc,u_char ae,u_char ctx_mask,enum aereg_type regtype,u_short regaddr,u_int value)3098 qat_aefw_init_reg(struct qat_softc *sc, u_char ae, u_char ctx_mask,
3099 enum aereg_type regtype, u_short regaddr, u_int value)
3100 {
3101 int error = 0;
3102 u_char ctx;
3103
3104 switch (regtype) {
3105 case AEREG_GPA_REL:
3106 case AEREG_GPB_REL:
3107 case AEREG_SR_REL:
3108 case AEREG_SR_RD_REL:
3109 case AEREG_SR_WR_REL:
3110 case AEREG_DR_REL:
3111 case AEREG_DR_RD_REL:
3112 case AEREG_DR_WR_REL:
3113 case AEREG_NEIGH_REL:
3114 /* init for all valid ctx */
3115 for (ctx = 0; ctx < MAX_AE_CTX; ctx++) {
3116 if ((ctx_mask & (1 << ctx)) == 0)
3117 continue;
3118 error = qat_aereg_rel_data_write(sc, ae, ctx, regtype,
3119 regaddr, value);
3120 }
3121 break;
3122 case AEREG_GPA_ABS:
3123 case AEREG_GPB_ABS:
3124 case AEREG_SR_ABS:
3125 case AEREG_SR_RD_ABS:
3126 case AEREG_SR_WR_ABS:
3127 case AEREG_DR_ABS:
3128 case AEREG_DR_RD_ABS:
3129 case AEREG_DR_WR_ABS:
3130 error = qat_aereg_abs_data_write(sc, ae, regtype,
3131 regaddr, value);
3132 break;
3133 default:
3134 error = EINVAL;
3135 break;
3136 }
3137
3138 return error;
3139 }
3140
3141 int
qat_aefw_init_reg_sym_expr(struct qat_softc * sc,u_char ae,struct qat_uof_image * qui)3142 qat_aefw_init_reg_sym_expr(struct qat_softc *sc, u_char ae,
3143 struct qat_uof_image *qui)
3144 {
3145 u_int i, expres;
3146 u_char ctx_mask;
3147
3148 for (i = 0; i < qui->qui_num_init_reg_sym; i++) {
3149 struct uof_init_reg_sym *uirs = &qui->qui_init_reg_sym[i];
3150
3151 if (uirs->uirs_value_type == EXPR_VAL) {
3152 /* XXX */
3153 aprint_error_dev(sc->sc_dev,
3154 "does not support initializing EXPR_VAL\n");
3155 return ENOTSUP;
3156 } else {
3157 expres = uirs->uirs_value;
3158 }
3159
3160 switch (uirs->uirs_init_type) {
3161 case INIT_REG:
3162 if (__SHIFTOUT(qui->qui_image->ui_ae_mode,
3163 AE_MODE_CTX_MODE) == MAX_AE_CTX) {
3164 ctx_mask = 0xff; /* 8-ctx mode */
3165 } else {
3166 ctx_mask = 0x55; /* 4-ctx mode */
3167 }
3168 qat_aefw_init_reg(sc, ae, ctx_mask,
3169 (enum aereg_type)uirs->uirs_reg_type,
3170 (u_short)uirs->uirs_addr_offset, expres);
3171 break;
3172 case INIT_REG_CTX:
3173 if (__SHIFTOUT(qui->qui_image->ui_ae_mode,
3174 AE_MODE_CTX_MODE) == MAX_AE_CTX) {
3175 ctx_mask = 0xff; /* 8-ctx mode */
3176 } else {
3177 ctx_mask = 0x55; /* 4-ctx mode */
3178 }
3179 if (((1 << uirs->uirs_ctx) & ctx_mask) == 0)
3180 return EINVAL;
3181 qat_aefw_init_reg(sc, ae, 1 << uirs->uirs_ctx,
3182 (enum aereg_type)uirs->uirs_reg_type,
3183 (u_short)uirs->uirs_addr_offset, expres);
3184 break;
3185 case INIT_EXPR:
3186 case INIT_EXPR_ENDIAN_SWAP:
3187 default:
3188 aprint_error_dev(sc->sc_dev,
3189 "does not support initializing init_type %d\n",
3190 uirs->uirs_init_type);
3191 return ENOTSUP;
3192 }
3193 }
3194
3195 return 0;
3196 }
3197
3198 int
qat_aefw_init_memory(struct qat_softc * sc)3199 qat_aefw_init_memory(struct qat_softc *sc)
3200 {
3201 struct qat_aefw_uof *qafu = &sc->sc_aefw_uof;
3202 size_t uimsz, initmemsz = qafu->qafu_init_mem_size;
3203 struct uof_init_mem *uim;
3204 int error, i;
3205 u_char ae;
3206
3207 uim = qafu->qafu_init_mem;
3208 for (i = 0; i < qafu->qafu_num_init_mem; i++) {
3209 uimsz = sizeof(struct uof_init_mem) +
3210 sizeof(struct uof_mem_val_attr) * uim->uim_num_val_attr;
3211 if (uimsz > initmemsz) {
3212 aprint_error_dev(sc->sc_dev,
3213 "invalid uof_init_mem or uof_mem_val_attr size\n");
3214 return EINVAL;
3215 }
3216
3217 if (uim->uim_num_bytes > 0) {
3218 error = qat_aefw_init_memory_one(sc, uim);
3219 if (error) {
3220 aprint_error_dev(sc->sc_dev,
3221 "Could not init ae memory: %d\n", error);
3222 return error;
3223 }
3224 }
3225 uim = (struct uof_init_mem *)((uintptr_t)uim + uimsz);
3226 initmemsz -= uimsz;
3227 }
3228
3229 /* run Batch put LM API */
3230 for (ae = 0; ae < MAX_AE; ae++) {
3231 error = qat_ae_batch_put_lm(sc, ae, &qafu->qafu_lm_init[ae],
3232 qafu->qafu_num_lm_init_inst[ae]);
3233 if (error)
3234 aprint_error_dev(sc->sc_dev, "Could not put lm\n");
3235
3236 qat_aefw_free_lm_init(sc, ae);
3237 }
3238
3239 error = qat_aefw_init_ustore(sc);
3240
3241 /* XXX run Batch put LM API */
3242
3243 return error;
3244 }
3245
3246 int
qat_aefw_init_globals(struct qat_softc * sc)3247 qat_aefw_init_globals(struct qat_softc *sc)
3248 {
3249 struct qat_aefw_uof *qafu = &sc->sc_aefw_uof;
3250 int error, i, p, s;
3251 u_char ae;
3252
3253 /* initialize the memory segments */
3254 if (qafu->qafu_num_init_mem > 0) {
3255 error = qat_aefw_init_memory(sc);
3256 if (error)
3257 return error;
3258 } else {
3259 error = qat_aefw_init_ustore(sc);
3260 if (error)
3261 return error;
3262 }
3263
3264 /* XXX bind import variables with ivd values */
3265
3266 /* XXX bind the uC global variables
3267 * local variables will done on-the-fly */
3268 for (i = 0; i < sc->sc_aefw_uof.qafu_num_imgs; i++) {
3269 for (p = 0; p < sc->sc_aefw_uof.qafu_imgs[i].qui_image->ui_num_pages; p++) {
3270 struct qat_uof_page *qup =
3271 &sc->sc_aefw_uof.qafu_imgs[i].qui_pages[p];
3272 if (qup->qup_num_uw_blocks &&
3273 (qup->qup_num_uc_var || qup->qup_num_imp_var)) {
3274 aprint_error_dev(sc->sc_dev,
3275 "not support uC global variables\n");
3276 return ENOTSUP;
3277 }
3278 }
3279 }
3280
3281 for (ae = 0; ae < sc->sc_ae_num; ae++) {
3282 struct qat_ae *qae = &(QAT_AE(sc, ae));
3283
3284 for (s = 0; s < qae->qae_num_slices; s++) {
3285 struct qat_ae_slice *qas = &qae->qae_slices[s];
3286
3287 if (qas->qas_image == NULL)
3288 continue;
3289
3290 error =
3291 qat_aefw_init_reg_sym_expr(sc, ae, qas->qas_image);
3292 if (error)
3293 return error;
3294 }
3295 }
3296
3297 return 0;
3298 }
3299
3300 uint64_t
qat_aefw_get_uof_inst(struct qat_softc * sc,struct qat_uof_page * qup,u_int addr)3301 qat_aefw_get_uof_inst(struct qat_softc *sc, struct qat_uof_page *qup,
3302 u_int addr)
3303 {
3304 uint64_t uinst = 0;
3305 u_int i;
3306
3307 /* find the block */
3308 for (i = 0; i < qup->qup_num_uw_blocks; i++) {
3309 struct qat_uof_uword_block *quub = &qup->qup_uw_blocks[i];
3310
3311 if ((addr >= quub->quub_start_addr) &&
3312 (addr <= (quub->quub_start_addr +
3313 (quub->quub_num_words - 1)))) {
3314 /* unpack n bytes and assigned to the 64-bit uword value.
3315 note: the microwords are stored as packed bytes.
3316 */
3317 addr -= quub->quub_start_addr;
3318 addr *= AEV2_PACKED_UWORD_BYTES;
3319 memcpy(&uinst,
3320 (void *)((uintptr_t)quub->quub_micro_words + addr),
3321 AEV2_PACKED_UWORD_BYTES);
3322 uinst = uinst & UWORD_MASK;
3323
3324 return uinst;
3325 }
3326 }
3327
3328 return INVLD_UWORD;
3329 }
3330
3331 int
qat_aefw_do_pagein(struct qat_softc * sc,u_char ae,struct qat_uof_page * qup)3332 qat_aefw_do_pagein(struct qat_softc *sc, u_char ae, struct qat_uof_page *qup)
3333 {
3334 struct qat_ae *qae = &(QAT_AE(sc, ae));
3335 uint64_t fill, *ucode_cpybuf;
3336 u_int error, i, upaddr, uraddr, ninst, cpylen;
3337
3338 if (qup->qup_num_uc_var || qup->qup_num_neigh_reg ||
3339 qup->qup_num_imp_var || qup->qup_num_imp_expr) {
3340 aprint_error_dev(sc->sc_dev,
3341 "does not support fixup locals\n");
3342 return ENOTSUP;
3343 }
3344
3345 ucode_cpybuf = qat_alloc_mem(UWORD_CPYBUF_SIZE * sizeof(uint64_t));
3346
3347 /* XXX get fill-pattern from an image -- they are all the same */
3348 memcpy(&fill, sc->sc_aefw_uof.qafu_imgs[0].qui_image->ui_fill_pattern,
3349 sizeof(uint64_t));
3350
3351 upaddr = qup->qup_beg_paddr;
3352 uraddr = 0;
3353 ninst = qup->qup_num_micro_words;
3354 while (ninst > 0) {
3355 cpylen = uimin(ninst, UWORD_CPYBUF_SIZE);
3356
3357 /* load the buffer */
3358 for (i = 0; i < cpylen; i++) {
3359 /* keep below code structure in case there are
3360 * different handling for shared secnarios */
3361 if (!qae->qae_shareable_ustore) {
3362 /* qat_aefw_get_uof_inst() takes an address that
3363 * is relative to the start of the page.
3364 * So we don't need to add in the physical
3365 * offset of the page. */
3366 if (qup->qup_page_region != 0) {
3367 /* XXX */
3368 aprint_error_dev(sc->sc_dev,
3369 "region != 0 is not supported\n");
3370 qat_free_mem(ucode_cpybuf);
3371 return ENOTSUP;
3372 } else {
3373 /* for mixing case, it should take
3374 * physical address */
3375 ucode_cpybuf[i] = qat_aefw_get_uof_inst(
3376 sc, qup, upaddr + i);
3377 if (ucode_cpybuf[i] == INVLD_UWORD) {
3378 /* fill hole in the uof */
3379 ucode_cpybuf[i] = fill;
3380 }
3381 }
3382 } else {
3383 /* XXX */
3384 qat_free_mem(ucode_cpybuf);
3385 return ENOTSUP;
3386 }
3387 }
3388
3389 /* copy the buffer to ustore */
3390 if (!qae->qae_shareable_ustore) {
3391 error = qat_ae_ucode_write(sc, ae, upaddr, cpylen,
3392 ucode_cpybuf);
3393 if (error)
3394 return error;
3395 } else {
3396 /* XXX */
3397 qat_free_mem(ucode_cpybuf);
3398 return ENOTSUP;
3399 }
3400 upaddr += cpylen;
3401 uraddr += cpylen;
3402 ninst -= cpylen;
3403 }
3404
3405 qat_free_mem(ucode_cpybuf);
3406
3407 return 0;
3408 }
3409
3410 int
qat_aefw_uof_write_one(struct qat_softc * sc,struct qat_uof_image * qui)3411 qat_aefw_uof_write_one(struct qat_softc *sc, struct qat_uof_image *qui)
3412 {
3413 struct uof_image *ui = qui->qui_image;
3414 struct qat_ae_page *qap;
3415 u_int s, p, c;
3416 int error;
3417 u_char ae, ctx_mask;
3418
3419 aprint_verbose_dev(sc->sc_dev,
3420 "aefw writing uof %s\n",
3421 qat_aefw_uof_string(sc, qui->qui_image->ui_name));
3422
3423 error = qat_aefw_init_globals(sc);
3424 if (error) {
3425 aprint_error_dev(sc->sc_dev,
3426 "Could not initialize globals\n");
3427 return error;
3428 }
3429
3430 if (__SHIFTOUT(ui->ui_ae_mode, AE_MODE_CTX_MODE) == MAX_AE_CTX)
3431 ctx_mask = 0xff; /* 8-ctx mode */
3432 else
3433 ctx_mask = 0x55; /* 4-ctx mode */
3434
3435 /* load the default page and set assigned CTX PC
3436 * to the entrypoint address */
3437 for (ae = 0; ae < sc->sc_ae_num; ae++) {
3438 struct qat_ae *qae = &(QAT_AE(sc, ae));
3439 struct qat_ae_slice *qas;
3440 u_int metadata;
3441
3442 KASSERT(ae < UOF_MAX_NUM_OF_AE);
3443
3444 if ((ui->ui_ae_assigned & (1 << ae)) == 0)
3445 continue;
3446
3447 /* find the slice to which this image is assigned */
3448 for (s = 0; s < qae->qae_num_slices; s++) {
3449 qas = &qae->qae_slices[s];
3450 if (ui->ui_ctx_assigned & qas->qas_assigned_ctx_mask)
3451 break;
3452 }
3453 if (s >= qae->qae_num_slices)
3454 continue;
3455
3456 qas = &qae->qae_slices[s];
3457
3458 for (p = 0; p < ui->ui_num_pages; p++) {
3459 qap = &qas->qas_pages[p];
3460
3461 /* Only load pages loaded by default */
3462 if (!qap->qap_page->qup_def_page)
3463 continue;
3464
3465 error = qat_aefw_do_pagein(sc, ae, qap->qap_page);
3466 if (error)
3467 return error;
3468 }
3469
3470 metadata = qas->qas_image->qui_image->ui_app_metadata;
3471 if (metadata != 0xffffffff) {
3472 aprint_normal_dev(sc->sc_dev,
3473 "loaded firmware: %s\n",
3474 qat_aefw_uof_string(sc, metadata));
3475 }
3476
3477 /* Assume starting page is page 0 */
3478 qap = &qas->qas_pages[0];
3479 for (c = 0; c < MAX_AE_CTX; c++) {
3480 if (ctx_mask & (1 << c))
3481 qas->qas_cur_pages[c] = qap;
3482 else
3483 qas->qas_cur_pages[c] = NULL;
3484 }
3485
3486 /* set the live context */
3487 qae->qae_live_ctx_mask = ui->ui_ctx_assigned;
3488
3489 /* set context PC to the image entrypoint address */
3490 error = qat_ae_write_pc(sc, ae, ui->ui_ctx_assigned,
3491 ui->ui_entry_address);
3492 if (error)
3493 return error;
3494 }
3495
3496 /* XXX store the checksum for convenience */
3497
3498 return 0;
3499 }
3500
3501 int
qat_aefw_uof_write(struct qat_softc * sc)3502 qat_aefw_uof_write(struct qat_softc *sc)
3503 {
3504 int error = 0;
3505 int i;
3506
3507 for (i = 0; i < sc->sc_aefw_uof.qafu_num_imgs; i++) {
3508 error = qat_aefw_uof_write_one(sc,
3509 &sc->sc_aefw_uof.qafu_imgs[i]);
3510 if (error)
3511 break;
3512 }
3513
3514 /* XXX UcLo_computeFreeUstore */
3515
3516 return error;
3517 }
3518