1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * This file is subject to the terms and conditions of the GNU General Public
3*4882a593Smuzhiyun * License. See the file "COPYING" in the main directory of this archive
4*4882a593Smuzhiyun * for more details.
5*4882a593Smuzhiyun *
6*4882a593Smuzhiyun * A small micro-assembler. It is intentionally kept simple, does only
7*4882a593Smuzhiyun * support a subset of instructions, and does not try to hide pipeline
8*4882a593Smuzhiyun * effects like branch delay slots.
9*4882a593Smuzhiyun *
10*4882a593Smuzhiyun * Copyright (C) 2004, 2005, 2006, 2008 Thiemo Seufer
11*4882a593Smuzhiyun * Copyright (C) 2005, 2007 Maciej W. Rozycki
12*4882a593Smuzhiyun * Copyright (C) 2006 Ralf Baechle (ralf@linux-mips.org)
13*4882a593Smuzhiyun * Copyright (C) 2012, 2013 MIPS Technologies, Inc. All rights reserved.
14*4882a593Smuzhiyun */
15*4882a593Smuzhiyun
16*4882a593Smuzhiyun #include <linux/kernel.h>
17*4882a593Smuzhiyun #include <linux/types.h>
18*4882a593Smuzhiyun
19*4882a593Smuzhiyun #include <asm/inst.h>
20*4882a593Smuzhiyun #include <asm/elf.h>
21*4882a593Smuzhiyun #include <asm/bugs.h>
22*4882a593Smuzhiyun #include <asm/uasm.h>
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun #define RS_MASK 0x1f
25*4882a593Smuzhiyun #define RS_SH 16
26*4882a593Smuzhiyun #define RT_MASK 0x1f
27*4882a593Smuzhiyun #define RT_SH 21
28*4882a593Smuzhiyun #define SCIMM_MASK 0x3ff
29*4882a593Smuzhiyun #define SCIMM_SH 16
30*4882a593Smuzhiyun
31*4882a593Smuzhiyun /* This macro sets the non-variable bits of an instruction. */
32*4882a593Smuzhiyun #define M(a, b, c, d, e, f) \
33*4882a593Smuzhiyun ((a) << OP_SH \
34*4882a593Smuzhiyun | (b) << RT_SH \
35*4882a593Smuzhiyun | (c) << RS_SH \
36*4882a593Smuzhiyun | (d) << RD_SH \
37*4882a593Smuzhiyun | (e) << RE_SH \
38*4882a593Smuzhiyun | (f) << FUNC_SH)
39*4882a593Smuzhiyun
40*4882a593Smuzhiyun #include "uasm.c"
41*4882a593Smuzhiyun
42*4882a593Smuzhiyun static const struct insn insn_table_MM[insn_invalid] = {
43*4882a593Smuzhiyun [insn_addu] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_addu32_op), RT | RS | RD},
44*4882a593Smuzhiyun [insn_addiu] = {M(mm_addiu32_op, 0, 0, 0, 0, 0), RT | RS | SIMM},
45*4882a593Smuzhiyun [insn_and] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_and_op), RT | RS | RD},
46*4882a593Smuzhiyun [insn_andi] = {M(mm_andi32_op, 0, 0, 0, 0, 0), RT | RS | UIMM},
47*4882a593Smuzhiyun [insn_beq] = {M(mm_beq32_op, 0, 0, 0, 0, 0), RS | RT | BIMM},
48*4882a593Smuzhiyun [insn_beql] = {0, 0},
49*4882a593Smuzhiyun [insn_bgez] = {M(mm_pool32i_op, mm_bgez_op, 0, 0, 0, 0), RS | BIMM},
50*4882a593Smuzhiyun [insn_bgezl] = {0, 0},
51*4882a593Smuzhiyun [insn_bltz] = {M(mm_pool32i_op, mm_bltz_op, 0, 0, 0, 0), RS | BIMM},
52*4882a593Smuzhiyun [insn_bltzl] = {0, 0},
53*4882a593Smuzhiyun [insn_bne] = {M(mm_bne32_op, 0, 0, 0, 0, 0), RT | RS | BIMM},
54*4882a593Smuzhiyun [insn_cache] = {M(mm_pool32b_op, 0, 0, mm_cache_func, 0, 0), RT | RS | SIMM},
55*4882a593Smuzhiyun [insn_cfc1] = {M(mm_pool32f_op, 0, 0, 0, mm_cfc1_op, mm_32f_73_op), RT | RS},
56*4882a593Smuzhiyun [insn_cfcmsa] = {M(mm_pool32s_op, 0, msa_cfc_op, 0, 0, mm_32s_elm_op), RD | RE},
57*4882a593Smuzhiyun [insn_ctc1] = {M(mm_pool32f_op, 0, 0, 0, mm_ctc1_op, mm_32f_73_op), RT | RS},
58*4882a593Smuzhiyun [insn_ctcmsa] = {M(mm_pool32s_op, 0, msa_ctc_op, 0, 0, mm_32s_elm_op), RD | RE},
59*4882a593Smuzhiyun [insn_daddu] = {0, 0},
60*4882a593Smuzhiyun [insn_daddiu] = {0, 0},
61*4882a593Smuzhiyun [insn_di] = {M(mm_pool32a_op, 0, 0, 0, mm_di_op, mm_pool32axf_op), RS},
62*4882a593Smuzhiyun [insn_divu] = {M(mm_pool32a_op, 0, 0, 0, mm_divu_op, mm_pool32axf_op), RT | RS},
63*4882a593Smuzhiyun [insn_dmfc0] = {0, 0},
64*4882a593Smuzhiyun [insn_dmtc0] = {0, 0},
65*4882a593Smuzhiyun [insn_dsll] = {0, 0},
66*4882a593Smuzhiyun [insn_dsll32] = {0, 0},
67*4882a593Smuzhiyun [insn_dsra] = {0, 0},
68*4882a593Smuzhiyun [insn_dsrl] = {0, 0},
69*4882a593Smuzhiyun [insn_dsrl32] = {0, 0},
70*4882a593Smuzhiyun [insn_drotr] = {0, 0},
71*4882a593Smuzhiyun [insn_drotr32] = {0, 0},
72*4882a593Smuzhiyun [insn_dsubu] = {0, 0},
73*4882a593Smuzhiyun [insn_eret] = {M(mm_pool32a_op, 0, 0, 0, mm_eret_op, mm_pool32axf_op), 0},
74*4882a593Smuzhiyun [insn_ins] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_ins_op), RT | RS | RD | RE},
75*4882a593Smuzhiyun [insn_ext] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_ext_op), RT | RS | RD | RE},
76*4882a593Smuzhiyun [insn_j] = {M(mm_j32_op, 0, 0, 0, 0, 0), JIMM},
77*4882a593Smuzhiyun [insn_jal] = {M(mm_jal32_op, 0, 0, 0, 0, 0), JIMM},
78*4882a593Smuzhiyun [insn_jalr] = {M(mm_pool32a_op, 0, 0, 0, mm_jalr_op, mm_pool32axf_op), RT | RS},
79*4882a593Smuzhiyun [insn_jr] = {M(mm_pool32a_op, 0, 0, 0, mm_jalr_op, mm_pool32axf_op), RS},
80*4882a593Smuzhiyun [insn_lb] = {M(mm_lb32_op, 0, 0, 0, 0, 0), RT | RS | SIMM},
81*4882a593Smuzhiyun [insn_ld] = {0, 0},
82*4882a593Smuzhiyun [insn_lh] = {M(mm_lh32_op, 0, 0, 0, 0, 0), RT | RS | SIMM},
83*4882a593Smuzhiyun [insn_ll] = {M(mm_pool32c_op, 0, 0, (mm_ll_func << 1), 0, 0), RS | RT | SIMM},
84*4882a593Smuzhiyun [insn_lld] = {0, 0},
85*4882a593Smuzhiyun [insn_lui] = {M(mm_pool32i_op, mm_lui_op, 0, 0, 0, 0), RS | SIMM},
86*4882a593Smuzhiyun [insn_lw] = {M(mm_lw32_op, 0, 0, 0, 0, 0), RT | RS | SIMM},
87*4882a593Smuzhiyun [insn_mfc0] = {M(mm_pool32a_op, 0, 0, 0, mm_mfc0_op, mm_pool32axf_op), RT | RS | RD},
88*4882a593Smuzhiyun [insn_mfhi] = {M(mm_pool32a_op, 0, 0, 0, mm_mfhi32_op, mm_pool32axf_op), RS},
89*4882a593Smuzhiyun [insn_mflo] = {M(mm_pool32a_op, 0, 0, 0, mm_mflo32_op, mm_pool32axf_op), RS},
90*4882a593Smuzhiyun [insn_mtc0] = {M(mm_pool32a_op, 0, 0, 0, mm_mtc0_op, mm_pool32axf_op), RT | RS | RD},
91*4882a593Smuzhiyun [insn_mthi] = {M(mm_pool32a_op, 0, 0, 0, mm_mthi32_op, mm_pool32axf_op), RS},
92*4882a593Smuzhiyun [insn_mtlo] = {M(mm_pool32a_op, 0, 0, 0, mm_mtlo32_op, mm_pool32axf_op), RS},
93*4882a593Smuzhiyun [insn_mul] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_mul_op), RT | RS | RD},
94*4882a593Smuzhiyun [insn_or] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_or32_op), RT | RS | RD},
95*4882a593Smuzhiyun [insn_ori] = {M(mm_ori32_op, 0, 0, 0, 0, 0), RT | RS | UIMM},
96*4882a593Smuzhiyun [insn_pref] = {M(mm_pool32c_op, 0, 0, (mm_pref_func << 1), 0, 0), RT | RS | SIMM},
97*4882a593Smuzhiyun [insn_rfe] = {0, 0},
98*4882a593Smuzhiyun [insn_sc] = {M(mm_pool32c_op, 0, 0, (mm_sc_func << 1), 0, 0), RT | RS | SIMM},
99*4882a593Smuzhiyun [insn_scd] = {0, 0},
100*4882a593Smuzhiyun [insn_sd] = {0, 0},
101*4882a593Smuzhiyun [insn_sll] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_sll32_op), RT | RS | RD},
102*4882a593Smuzhiyun [insn_sllv] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_sllv32_op), RT | RS | RD},
103*4882a593Smuzhiyun [insn_slt] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_slt_op), RT | RS | RD},
104*4882a593Smuzhiyun [insn_sltiu] = {M(mm_sltiu32_op, 0, 0, 0, 0, 0), RT | RS | SIMM},
105*4882a593Smuzhiyun [insn_sltu] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_sltu_op), RT | RS | RD},
106*4882a593Smuzhiyun [insn_sra] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_sra_op), RT | RS | RD},
107*4882a593Smuzhiyun [insn_srav] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_srav_op), RT | RS | RD},
108*4882a593Smuzhiyun [insn_srl] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_srl32_op), RT | RS | RD},
109*4882a593Smuzhiyun [insn_srlv] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_srlv32_op), RT | RS | RD},
110*4882a593Smuzhiyun [insn_rotr] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_rotr_op), RT | RS | RD},
111*4882a593Smuzhiyun [insn_subu] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_subu32_op), RT | RS | RD},
112*4882a593Smuzhiyun [insn_sw] = {M(mm_sw32_op, 0, 0, 0, 0, 0), RT | RS | SIMM},
113*4882a593Smuzhiyun [insn_sync] = {M(mm_pool32a_op, 0, 0, 0, mm_sync_op, mm_pool32axf_op), RS},
114*4882a593Smuzhiyun [insn_tlbp] = {M(mm_pool32a_op, 0, 0, 0, mm_tlbp_op, mm_pool32axf_op), 0},
115*4882a593Smuzhiyun [insn_tlbr] = {M(mm_pool32a_op, 0, 0, 0, mm_tlbr_op, mm_pool32axf_op), 0},
116*4882a593Smuzhiyun [insn_tlbwi] = {M(mm_pool32a_op, 0, 0, 0, mm_tlbwi_op, mm_pool32axf_op), 0},
117*4882a593Smuzhiyun [insn_tlbwr] = {M(mm_pool32a_op, 0, 0, 0, mm_tlbwr_op, mm_pool32axf_op), 0},
118*4882a593Smuzhiyun [insn_wait] = {M(mm_pool32a_op, 0, 0, 0, mm_wait_op, mm_pool32axf_op), SCIMM},
119*4882a593Smuzhiyun [insn_wsbh] = {M(mm_pool32a_op, 0, 0, 0, mm_wsbh_op, mm_pool32axf_op), RT | RS},
120*4882a593Smuzhiyun [insn_xor] = {M(mm_pool32a_op, 0, 0, 0, 0, mm_xor32_op), RT | RS | RD},
121*4882a593Smuzhiyun [insn_xori] = {M(mm_xori32_op, 0, 0, 0, 0, 0), RT | RS | UIMM},
122*4882a593Smuzhiyun [insn_dins] = {0, 0},
123*4882a593Smuzhiyun [insn_dinsm] = {0, 0},
124*4882a593Smuzhiyun [insn_syscall] = {M(mm_pool32a_op, 0, 0, 0, mm_syscall_op, mm_pool32axf_op), SCIMM},
125*4882a593Smuzhiyun [insn_bbit0] = {0, 0},
126*4882a593Smuzhiyun [insn_bbit1] = {0, 0},
127*4882a593Smuzhiyun [insn_lwx] = {0, 0},
128*4882a593Smuzhiyun [insn_ldx] = {0, 0},
129*4882a593Smuzhiyun };
130*4882a593Smuzhiyun
131*4882a593Smuzhiyun #undef M
132*4882a593Smuzhiyun
build_bimm(s32 arg)133*4882a593Smuzhiyun static inline u32 build_bimm(s32 arg)
134*4882a593Smuzhiyun {
135*4882a593Smuzhiyun WARN(arg > 0xffff || arg < -0x10000,
136*4882a593Smuzhiyun KERN_WARNING "Micro-assembler field overflow\n");
137*4882a593Smuzhiyun
138*4882a593Smuzhiyun WARN(arg & 0x3, KERN_WARNING "Invalid micro-assembler branch target\n");
139*4882a593Smuzhiyun
140*4882a593Smuzhiyun return ((arg < 0) ? (1 << 15) : 0) | ((arg >> 1) & 0x7fff);
141*4882a593Smuzhiyun }
142*4882a593Smuzhiyun
build_jimm(u32 arg)143*4882a593Smuzhiyun static inline u32 build_jimm(u32 arg)
144*4882a593Smuzhiyun {
145*4882a593Smuzhiyun
146*4882a593Smuzhiyun WARN(arg & ~((JIMM_MASK << 2) | 1),
147*4882a593Smuzhiyun KERN_WARNING "Micro-assembler field overflow\n");
148*4882a593Smuzhiyun
149*4882a593Smuzhiyun return (arg >> 1) & JIMM_MASK;
150*4882a593Smuzhiyun }
151*4882a593Smuzhiyun
152*4882a593Smuzhiyun /*
153*4882a593Smuzhiyun * The order of opcode arguments is implicitly left to right,
154*4882a593Smuzhiyun * starting with RS and ending with FUNC or IMM.
155*4882a593Smuzhiyun */
build_insn(u32 ** buf,enum opcode opc,...)156*4882a593Smuzhiyun static void build_insn(u32 **buf, enum opcode opc, ...)
157*4882a593Smuzhiyun {
158*4882a593Smuzhiyun const struct insn *ip;
159*4882a593Smuzhiyun va_list ap;
160*4882a593Smuzhiyun u32 op;
161*4882a593Smuzhiyun
162*4882a593Smuzhiyun if (opc < 0 || opc >= insn_invalid ||
163*4882a593Smuzhiyun (opc == insn_daddiu && r4k_daddiu_bug()) ||
164*4882a593Smuzhiyun (insn_table_MM[opc].match == 0 && insn_table_MM[opc].fields == 0))
165*4882a593Smuzhiyun panic("Unsupported Micro-assembler instruction %d", opc);
166*4882a593Smuzhiyun
167*4882a593Smuzhiyun ip = &insn_table_MM[opc];
168*4882a593Smuzhiyun
169*4882a593Smuzhiyun op = ip->match;
170*4882a593Smuzhiyun va_start(ap, opc);
171*4882a593Smuzhiyun if (ip->fields & RS) {
172*4882a593Smuzhiyun if (opc == insn_mfc0 || opc == insn_mtc0 ||
173*4882a593Smuzhiyun opc == insn_cfc1 || opc == insn_ctc1)
174*4882a593Smuzhiyun op |= build_rt(va_arg(ap, u32));
175*4882a593Smuzhiyun else
176*4882a593Smuzhiyun op |= build_rs(va_arg(ap, u32));
177*4882a593Smuzhiyun }
178*4882a593Smuzhiyun if (ip->fields & RT) {
179*4882a593Smuzhiyun if (opc == insn_mfc0 || opc == insn_mtc0 ||
180*4882a593Smuzhiyun opc == insn_cfc1 || opc == insn_ctc1)
181*4882a593Smuzhiyun op |= build_rs(va_arg(ap, u32));
182*4882a593Smuzhiyun else
183*4882a593Smuzhiyun op |= build_rt(va_arg(ap, u32));
184*4882a593Smuzhiyun }
185*4882a593Smuzhiyun if (ip->fields & RD)
186*4882a593Smuzhiyun op |= build_rd(va_arg(ap, u32));
187*4882a593Smuzhiyun if (ip->fields & RE)
188*4882a593Smuzhiyun op |= build_re(va_arg(ap, u32));
189*4882a593Smuzhiyun if (ip->fields & SIMM)
190*4882a593Smuzhiyun op |= build_simm(va_arg(ap, s32));
191*4882a593Smuzhiyun if (ip->fields & UIMM)
192*4882a593Smuzhiyun op |= build_uimm(va_arg(ap, u32));
193*4882a593Smuzhiyun if (ip->fields & BIMM)
194*4882a593Smuzhiyun op |= build_bimm(va_arg(ap, s32));
195*4882a593Smuzhiyun if (ip->fields & JIMM)
196*4882a593Smuzhiyun op |= build_jimm(va_arg(ap, u32));
197*4882a593Smuzhiyun if (ip->fields & FUNC)
198*4882a593Smuzhiyun op |= build_func(va_arg(ap, u32));
199*4882a593Smuzhiyun if (ip->fields & SET)
200*4882a593Smuzhiyun op |= build_set(va_arg(ap, u32));
201*4882a593Smuzhiyun if (ip->fields & SCIMM)
202*4882a593Smuzhiyun op |= build_scimm(va_arg(ap, u32));
203*4882a593Smuzhiyun va_end(ap);
204*4882a593Smuzhiyun
205*4882a593Smuzhiyun #ifdef CONFIG_CPU_LITTLE_ENDIAN
206*4882a593Smuzhiyun **buf = ((op & 0xffff) << 16) | (op >> 16);
207*4882a593Smuzhiyun #else
208*4882a593Smuzhiyun **buf = op;
209*4882a593Smuzhiyun #endif
210*4882a593Smuzhiyun (*buf)++;
211*4882a593Smuzhiyun }
212*4882a593Smuzhiyun
213*4882a593Smuzhiyun static inline void
__resolve_relocs(struct uasm_reloc * rel,struct uasm_label * lab)214*4882a593Smuzhiyun __resolve_relocs(struct uasm_reloc *rel, struct uasm_label *lab)
215*4882a593Smuzhiyun {
216*4882a593Smuzhiyun long laddr = (long)lab->addr;
217*4882a593Smuzhiyun long raddr = (long)rel->addr;
218*4882a593Smuzhiyun
219*4882a593Smuzhiyun switch (rel->type) {
220*4882a593Smuzhiyun case R_MIPS_PC16:
221*4882a593Smuzhiyun #ifdef CONFIG_CPU_LITTLE_ENDIAN
222*4882a593Smuzhiyun *rel->addr |= (build_bimm(laddr - (raddr + 4)) << 16);
223*4882a593Smuzhiyun #else
224*4882a593Smuzhiyun *rel->addr |= build_bimm(laddr - (raddr + 4));
225*4882a593Smuzhiyun #endif
226*4882a593Smuzhiyun break;
227*4882a593Smuzhiyun
228*4882a593Smuzhiyun default:
229*4882a593Smuzhiyun panic("Unsupported Micro-assembler relocation %d",
230*4882a593Smuzhiyun rel->type);
231*4882a593Smuzhiyun }
232*4882a593Smuzhiyun }
233