1848b8605Smrg/*
2848b8605Smrg * Copyright © 2014 Broadcom
3848b8605Smrg *
4848b8605Smrg * Permission is hereby granted, free of charge, to any person obtaining a
5848b8605Smrg * copy of this software and associated documentation files (the "Software"),
6848b8605Smrg * to deal in the Software without restriction, including without limitation
7848b8605Smrg * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8848b8605Smrg * and/or sell copies of the Software, and to permit persons to whom the
9848b8605Smrg * Software is furnished to do so, subject to the following conditions:
10848b8605Smrg *
11848b8605Smrg * The above copyright notice and this permission notice (including the next
12848b8605Smrg * paragraph) shall be included in all copies or substantial portions of the
13848b8605Smrg * Software.
14848b8605Smrg *
15848b8605Smrg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16848b8605Smrg * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17848b8605Smrg * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18848b8605Smrg * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19848b8605Smrg * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20848b8605Smrg * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21848b8605Smrg * IN THE SOFTWARE.
22848b8605Smrg */
23848b8605Smrg
24848b8605Smrg#ifndef VC4_QPU_H
25848b8605Smrg#define VC4_QPU_H
26848b8605Smrg
27b8e80941Smrg#include <stdio.h>
28848b8605Smrg#include <stdint.h>
29848b8605Smrg
30848b8605Smrg#include "util/u_math.h"
31848b8605Smrg
32848b8605Smrg#include "vc4_qpu_defines.h"
33848b8605Smrg
34b8e80941Smrgstruct vc4_compile;
35b8e80941Smrg
36848b8605Smrgstruct qpu_reg {
37848b8605Smrg        enum qpu_mux mux;
38848b8605Smrg        uint8_t addr;
39848b8605Smrg};
40848b8605Smrg
41848b8605Smrgstatic inline struct qpu_reg
42848b8605Smrgqpu_rn(int n)
43848b8605Smrg{
44848b8605Smrg        struct qpu_reg r = {
45848b8605Smrg                QPU_MUX_R0 + n,
46848b8605Smrg                0,
47848b8605Smrg        };
48848b8605Smrg
49848b8605Smrg        return r;
50848b8605Smrg}
51848b8605Smrg
52848b8605Smrgstatic inline struct qpu_reg
53848b8605Smrgqpu_ra(int addr)
54848b8605Smrg{
55848b8605Smrg        struct qpu_reg r = {
56848b8605Smrg                QPU_MUX_A,
57848b8605Smrg                addr,
58848b8605Smrg        };
59848b8605Smrg
60848b8605Smrg        return r;
61848b8605Smrg}
62848b8605Smrg
63848b8605Smrgstatic inline struct qpu_reg
64848b8605Smrgqpu_rb(int addr)
65848b8605Smrg{
66848b8605Smrg        struct qpu_reg r = {
67848b8605Smrg                QPU_MUX_B,
68848b8605Smrg                addr,
69848b8605Smrg        };
70848b8605Smrg
71848b8605Smrg        return r;
72848b8605Smrg}
73848b8605Smrg
74848b8605Smrgstatic inline struct qpu_reg
75848b8605Smrgqpu_vary()
76848b8605Smrg{
77848b8605Smrg        struct qpu_reg r = {
78848b8605Smrg                QPU_MUX_A,
79848b8605Smrg                QPU_R_VARY,
80848b8605Smrg        };
81848b8605Smrg
82848b8605Smrg        return r;
83848b8605Smrg}
84848b8605Smrg
85848b8605Smrgstatic inline struct qpu_reg
86848b8605Smrgqpu_unif()
87848b8605Smrg{
88848b8605Smrg        struct qpu_reg r = {
89848b8605Smrg                QPU_MUX_A,
90848b8605Smrg                QPU_R_UNIF,
91848b8605Smrg        };
92848b8605Smrg
93848b8605Smrg        return r;
94848b8605Smrg}
95848b8605Smrg
96848b8605Smrgstatic inline struct qpu_reg
97848b8605Smrgqpu_vrsetup()
98848b8605Smrg{
99848b8605Smrg        return qpu_ra(QPU_W_VPMVCD_SETUP);
100848b8605Smrg}
101848b8605Smrg
102848b8605Smrgstatic inline struct qpu_reg
103848b8605Smrgqpu_vwsetup()
104848b8605Smrg{
105848b8605Smrg        return qpu_rb(QPU_W_VPMVCD_SETUP);
106848b8605Smrg}
107848b8605Smrg
108848b8605Smrgstatic inline struct qpu_reg
109848b8605Smrgqpu_tlbc()
110848b8605Smrg{
111848b8605Smrg        struct qpu_reg r = {
112848b8605Smrg                QPU_MUX_A,
113848b8605Smrg                QPU_W_TLB_COLOR_ALL,
114848b8605Smrg        };
115848b8605Smrg
116848b8605Smrg        return r;
117848b8605Smrg}
118848b8605Smrg
119b8e80941Smrgstatic inline struct qpu_reg
120b8e80941Smrgqpu_tlbc_ms()
121b8e80941Smrg{
122b8e80941Smrg        struct qpu_reg r = {
123b8e80941Smrg                QPU_MUX_A,
124b8e80941Smrg                QPU_W_TLB_COLOR_MS,
125b8e80941Smrg        };
126b8e80941Smrg
127b8e80941Smrg        return r;
128b8e80941Smrg}
129b8e80941Smrg
130848b8605Smrgstatic inline struct qpu_reg qpu_r0(void) { return qpu_rn(0); }
131848b8605Smrgstatic inline struct qpu_reg qpu_r1(void) { return qpu_rn(1); }
132848b8605Smrgstatic inline struct qpu_reg qpu_r2(void) { return qpu_rn(2); }
133848b8605Smrgstatic inline struct qpu_reg qpu_r3(void) { return qpu_rn(3); }
134848b8605Smrgstatic inline struct qpu_reg qpu_r4(void) { return qpu_rn(4); }
135848b8605Smrgstatic inline struct qpu_reg qpu_r5(void) { return qpu_rn(5); }
136848b8605Smrg
137b8e80941Smrguint64_t qpu_NOP(void) ATTRIBUTE_CONST;
138b8e80941Smrguint64_t qpu_a_MOV(struct qpu_reg dst, struct qpu_reg src) ATTRIBUTE_CONST;
139b8e80941Smrguint64_t qpu_m_MOV(struct qpu_reg dst, struct qpu_reg src) ATTRIBUTE_CONST;
140848b8605Smrguint64_t qpu_a_alu2(enum qpu_op_add op, struct qpu_reg dst,
141b8e80941Smrg                    struct qpu_reg src0, struct qpu_reg src1) ATTRIBUTE_CONST;
142848b8605Smrguint64_t qpu_m_alu2(enum qpu_op_mul op, struct qpu_reg dst,
143b8e80941Smrg                    struct qpu_reg src0, struct qpu_reg src1) ATTRIBUTE_CONST;
144b8e80941Smrguint64_t qpu_merge_inst(uint64_t a, uint64_t b) ATTRIBUTE_CONST;
145b8e80941Smrguint64_t qpu_load_imm_ui(struct qpu_reg dst, uint32_t val) ATTRIBUTE_CONST;
146b8e80941Smrguint64_t qpu_load_imm_u2(struct qpu_reg dst, uint32_t val) ATTRIBUTE_CONST;
147b8e80941Smrguint64_t qpu_load_imm_i2(struct qpu_reg dst, uint32_t val) ATTRIBUTE_CONST;
148b8e80941Smrguint64_t qpu_branch(uint32_t cond, uint32_t target) ATTRIBUTE_CONST;
149b8e80941Smrguint64_t qpu_set_sig(uint64_t inst, uint32_t sig) ATTRIBUTE_CONST;
150b8e80941Smrguint64_t qpu_set_cond_add(uint64_t inst, uint32_t cond) ATTRIBUTE_CONST;
151b8e80941Smrguint64_t qpu_set_cond_mul(uint64_t inst, uint32_t cond) ATTRIBUTE_CONST;
152b8e80941Smrguint32_t qpu_encode_small_immediate(uint32_t i) ATTRIBUTE_CONST;
153b8e80941Smrguint64_t qpu_m_rot(struct qpu_reg dst, struct qpu_reg src, int rot) ATTRIBUTE_CONST;
154b8e80941Smrg
155b8e80941Smrgbool qpu_waddr_is_tlb(uint32_t waddr) ATTRIBUTE_CONST;
156b8e80941Smrgbool qpu_inst_is_tlb(uint64_t inst) ATTRIBUTE_CONST;
157b8e80941Smrgint qpu_num_sf_accesses(uint64_t inst) ATTRIBUTE_CONST;
158b8e80941Smrgvoid qpu_serialize_one_inst(struct vc4_compile *c, uint64_t inst);
159b8e80941Smrg
160b8e80941Smrgstatic inline enum qpu_cond
161b8e80941Smrgqpu_cond_complement(enum qpu_cond cond)
162b8e80941Smrg{
163b8e80941Smrg        return cond ^ 1;
164b8e80941Smrg}
165848b8605Smrg
166848b8605Smrgstatic inline uint64_t
167848b8605Smrgqpu_load_imm_f(struct qpu_reg dst, float val)
168848b8605Smrg{
169848b8605Smrg        return qpu_load_imm_ui(dst, fui(val));
170848b8605Smrg}
171848b8605Smrg
172848b8605Smrg#define A_ALU2(op)                                                       \
173848b8605Smrgstatic inline uint64_t                                                   \
174848b8605Smrgqpu_a_##op(struct qpu_reg dst, struct qpu_reg src0, struct qpu_reg src1) \
175848b8605Smrg{                                                                        \
176848b8605Smrg        return qpu_a_alu2(QPU_A_##op, dst, src0, src1);                  \
177848b8605Smrg}
178848b8605Smrg
179848b8605Smrg#define M_ALU2(op)                                                       \
180848b8605Smrgstatic inline uint64_t                                                   \
181848b8605Smrgqpu_m_##op(struct qpu_reg dst, struct qpu_reg src0, struct qpu_reg src1) \
182848b8605Smrg{                                                                        \
183848b8605Smrg        return qpu_m_alu2(QPU_M_##op, dst, src0, src1);                  \
184848b8605Smrg}
185848b8605Smrg
186848b8605Smrg#define A_ALU1(op)                                                       \
187848b8605Smrgstatic inline uint64_t                                                   \
188848b8605Smrgqpu_a_##op(struct qpu_reg dst, struct qpu_reg src0)                      \
189848b8605Smrg{                                                                        \
190848b8605Smrg        return qpu_a_alu2(QPU_A_##op, dst, src0, src0);                  \
191848b8605Smrg}
192848b8605Smrg
193848b8605Smrg/*A_ALU2(NOP) */
194848b8605SmrgA_ALU2(FADD)
195848b8605SmrgA_ALU2(FSUB)
196848b8605SmrgA_ALU2(FMIN)
197848b8605SmrgA_ALU2(FMAX)
198848b8605SmrgA_ALU2(FMINABS)
199848b8605SmrgA_ALU2(FMAXABS)
200848b8605SmrgA_ALU1(FTOI)
201848b8605SmrgA_ALU1(ITOF)
202848b8605SmrgA_ALU2(ADD)
203848b8605SmrgA_ALU2(SUB)
204848b8605SmrgA_ALU2(SHR)
205848b8605SmrgA_ALU2(ASR)
206848b8605SmrgA_ALU2(ROR)
207848b8605SmrgA_ALU2(SHL)
208848b8605SmrgA_ALU2(MIN)
209848b8605SmrgA_ALU2(MAX)
210848b8605SmrgA_ALU2(AND)
211848b8605SmrgA_ALU2(OR)
212848b8605SmrgA_ALU2(XOR)
213848b8605SmrgA_ALU1(NOT)
214848b8605SmrgA_ALU1(CLZ)
215848b8605SmrgA_ALU2(V8ADDS)
216848b8605SmrgA_ALU2(V8SUBS)
217848b8605Smrg
218848b8605Smrg/* M_ALU2(NOP) */
219848b8605SmrgM_ALU2(FMUL)
220848b8605SmrgM_ALU2(MUL24)
221848b8605SmrgM_ALU2(V8MULD)
222848b8605SmrgM_ALU2(V8MIN)
223848b8605SmrgM_ALU2(V8MAX)
224848b8605SmrgM_ALU2(V8ADDS)
225848b8605SmrgM_ALU2(V8SUBS)
226848b8605Smrg
227848b8605Smrgvoid
228848b8605Smrgvc4_qpu_disasm(const uint64_t *instructions, int num_instructions);
229848b8605Smrg
230b8e80941Smrgvoid
231b8e80941Smrgvc4_qpu_disasm_pack_mul(FILE *out, uint32_t pack);
232b8e80941Smrg
233b8e80941Smrgvoid
234b8e80941Smrgvc4_qpu_disasm_pack_a(FILE *out, uint32_t pack);
235b8e80941Smrg
236b8e80941Smrgvoid
237b8e80941Smrgvc4_qpu_disasm_unpack(FILE *out, uint32_t pack);
238b8e80941Smrg
239848b8605Smrgvoid
240848b8605Smrgvc4_qpu_validate(uint64_t *insts, uint32_t num_inst);
241848b8605Smrg
242b8e80941Smrgvoid
243b8e80941Smrgvc4_qpu_disasm_cond(FILE *out, uint32_t cond);
244b8e80941Smrg
245b8e80941Smrgvoid
246b8e80941Smrgvc4_qpu_disasm_cond_branch(FILE *out, uint32_t cond);
247b8e80941Smrg
248848b8605Smrg#endif /* VC4_QPU_H */
249