xref: /OK3568_Linux_fs/kernel/arch/mips/mm/uasm-micromips.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun  * This file is subject to the terms and conditions of the GNU General Public
3*4882a593Smuzhiyun  * License.  See the file "COPYING" in the main directory of this archive
4*4882a593Smuzhiyun  * for more details.
5*4882a593Smuzhiyun  *
6*4882a593Smuzhiyun  * A small micro-assembler. It is intentionally kept simple, does only
7*4882a593Smuzhiyun  * support a subset of instructions, and does not try to hide pipeline
8*4882a593Smuzhiyun  * effects like branch delay slots.
9*4882a593Smuzhiyun  *
10*4882a593Smuzhiyun  * Copyright (C) 2004, 2005, 2006, 2008	 Thiemo Seufer
11*4882a593Smuzhiyun  * Copyright (C) 2005, 2007  Maciej W. Rozycki
12*4882a593Smuzhiyun  * Copyright (C) 2006  Ralf Baechle (ralf@linux-mips.org)
13*4882a593Smuzhiyun  * Copyright (C) 2012, 2013   MIPS Technologies, Inc.  All rights reserved.
14*4882a593Smuzhiyun  */
15*4882a593Smuzhiyun 
16*4882a593Smuzhiyun #include <linux/kernel.h>
17*4882a593Smuzhiyun #include <linux/types.h>
18*4882a593Smuzhiyun 
19*4882a593Smuzhiyun #include <asm/inst.h>
20*4882a593Smuzhiyun #include <asm/elf.h>
21*4882a593Smuzhiyun #include <asm/bugs.h>
22*4882a593Smuzhiyun #include <asm/uasm.h>
23*4882a593Smuzhiyun 
24*4882a593Smuzhiyun #define RS_MASK		0x1f
25*4882a593Smuzhiyun #define RS_SH		16
26*4882a593Smuzhiyun #define RT_MASK		0x1f
27*4882a593Smuzhiyun #define RT_SH		21
28*4882a593Smuzhiyun #define SCIMM_MASK	0x3ff
29*4882a593Smuzhiyun #define SCIMM_SH	16
30*4882a593Smuzhiyun 
31*4882a593Smuzhiyun /* This macro sets the non-variable bits of an instruction. */
32*4882a593Smuzhiyun #define M(a, b, c, d, e, f)					\
33*4882a593Smuzhiyun 	((a) << OP_SH						\
34*4882a593Smuzhiyun 	 | (b) << RT_SH						\
35*4882a593Smuzhiyun 	 | (c) << RS_SH						\
36*4882a593Smuzhiyun 	 | (d) << RD_SH						\
37*4882a593Smuzhiyun 	 | (e) << RE_SH						\
38*4882a593Smuzhiyun 	 | (f) << FUNC_SH)
39*4882a593Smuzhiyun 
40*4882a593Smuzhiyun #include "uasm.c"
41*4882a593Smuzhiyun 
42*4882a593Smuzhiyun static const struct insn insn_table_MM[insn_invalid] = {
43*4882a593Smuzhiyun 	[insn_addu]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_addu32_op), RT | RS | RD},
44*4882a593Smuzhiyun 	[insn_addiu]	= {M(mm_addiu32_op, 0, 0, 0, 0, 0), RT | RS | SIMM},
45*4882a593Smuzhiyun 	[insn_and]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_and_op), RT | RS | RD},
46*4882a593Smuzhiyun 	[insn_andi]	= {M(mm_andi32_op, 0, 0, 0, 0, 0), RT | RS | UIMM},
47*4882a593Smuzhiyun 	[insn_beq]	= {M(mm_beq32_op, 0, 0, 0, 0, 0), RS | RT | BIMM},
48*4882a593Smuzhiyun 	[insn_beql]	= {0, 0},
49*4882a593Smuzhiyun 	[insn_bgez]	= {M(mm_pool32i_op, mm_bgez_op, 0, 0, 0, 0), RS | BIMM},
50*4882a593Smuzhiyun 	[insn_bgezl]	= {0, 0},
51*4882a593Smuzhiyun 	[insn_bltz]	= {M(mm_pool32i_op, mm_bltz_op, 0, 0, 0, 0), RS | BIMM},
52*4882a593Smuzhiyun 	[insn_bltzl]	= {0, 0},
53*4882a593Smuzhiyun 	[insn_bne]	= {M(mm_bne32_op, 0, 0, 0, 0, 0), RT | RS | BIMM},
54*4882a593Smuzhiyun 	[insn_cache]	= {M(mm_pool32b_op, 0, 0, mm_cache_func, 0, 0), RT | RS | SIMM},
55*4882a593Smuzhiyun 	[insn_cfc1]	= {M(mm_pool32f_op, 0, 0, 0, mm_cfc1_op, mm_32f_73_op), RT | RS},
56*4882a593Smuzhiyun 	[insn_cfcmsa]	= {M(mm_pool32s_op, 0, msa_cfc_op, 0, 0, mm_32s_elm_op), RD | RE},
57*4882a593Smuzhiyun 	[insn_ctc1]	= {M(mm_pool32f_op, 0, 0, 0, mm_ctc1_op, mm_32f_73_op), RT | RS},
58*4882a593Smuzhiyun 	[insn_ctcmsa]	= {M(mm_pool32s_op, 0, msa_ctc_op, 0, 0, mm_32s_elm_op), RD | RE},
59*4882a593Smuzhiyun 	[insn_daddu]	= {0, 0},
60*4882a593Smuzhiyun 	[insn_daddiu]	= {0, 0},
61*4882a593Smuzhiyun 	[insn_di]	= {M(mm_pool32a_op, 0, 0, 0, mm_di_op, mm_pool32axf_op), RS},
62*4882a593Smuzhiyun 	[insn_divu]	= {M(mm_pool32a_op, 0, 0, 0, mm_divu_op, mm_pool32axf_op), RT | RS},
63*4882a593Smuzhiyun 	[insn_dmfc0]	= {0, 0},
64*4882a593Smuzhiyun 	[insn_dmtc0]	= {0, 0},
65*4882a593Smuzhiyun 	[insn_dsll]	= {0, 0},
66*4882a593Smuzhiyun 	[insn_dsll32]	= {0, 0},
67*4882a593Smuzhiyun 	[insn_dsra]	= {0, 0},
68*4882a593Smuzhiyun 	[insn_dsrl]	= {0, 0},
69*4882a593Smuzhiyun 	[insn_dsrl32]	= {0, 0},
70*4882a593Smuzhiyun 	[insn_drotr]	= {0, 0},
71*4882a593Smuzhiyun 	[insn_drotr32]	= {0, 0},
72*4882a593Smuzhiyun 	[insn_dsubu]	= {0, 0},
73*4882a593Smuzhiyun 	[insn_eret]	= {M(mm_pool32a_op, 0, 0, 0, mm_eret_op, mm_pool32axf_op), 0},
74*4882a593Smuzhiyun 	[insn_ins]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_ins_op), RT | RS | RD | RE},
75*4882a593Smuzhiyun 	[insn_ext]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_ext_op), RT | RS | RD | RE},
76*4882a593Smuzhiyun 	[insn_j]	= {M(mm_j32_op, 0, 0, 0, 0, 0), JIMM},
77*4882a593Smuzhiyun 	[insn_jal]	= {M(mm_jal32_op, 0, 0, 0, 0, 0), JIMM},
78*4882a593Smuzhiyun 	[insn_jalr]	= {M(mm_pool32a_op, 0, 0, 0, mm_jalr_op, mm_pool32axf_op), RT | RS},
79*4882a593Smuzhiyun 	[insn_jr]	= {M(mm_pool32a_op, 0, 0, 0, mm_jalr_op, mm_pool32axf_op), RS},
80*4882a593Smuzhiyun 	[insn_lb]	= {M(mm_lb32_op, 0, 0, 0, 0, 0), RT | RS | SIMM},
81*4882a593Smuzhiyun 	[insn_ld]	= {0, 0},
82*4882a593Smuzhiyun 	[insn_lh]	= {M(mm_lh32_op, 0, 0, 0, 0, 0), RT | RS | SIMM},
83*4882a593Smuzhiyun 	[insn_ll]	= {M(mm_pool32c_op, 0, 0, (mm_ll_func << 1), 0, 0), RS | RT | SIMM},
84*4882a593Smuzhiyun 	[insn_lld]	= {0, 0},
85*4882a593Smuzhiyun 	[insn_lui]	= {M(mm_pool32i_op, mm_lui_op, 0, 0, 0, 0), RS | SIMM},
86*4882a593Smuzhiyun 	[insn_lw]	= {M(mm_lw32_op, 0, 0, 0, 0, 0), RT | RS | SIMM},
87*4882a593Smuzhiyun 	[insn_mfc0]	= {M(mm_pool32a_op, 0, 0, 0, mm_mfc0_op, mm_pool32axf_op), RT | RS | RD},
88*4882a593Smuzhiyun 	[insn_mfhi]	= {M(mm_pool32a_op, 0, 0, 0, mm_mfhi32_op, mm_pool32axf_op), RS},
89*4882a593Smuzhiyun 	[insn_mflo]	= {M(mm_pool32a_op, 0, 0, 0, mm_mflo32_op, mm_pool32axf_op), RS},
90*4882a593Smuzhiyun 	[insn_mtc0]	= {M(mm_pool32a_op, 0, 0, 0, mm_mtc0_op, mm_pool32axf_op), RT | RS | RD},
91*4882a593Smuzhiyun 	[insn_mthi]	= {M(mm_pool32a_op, 0, 0, 0, mm_mthi32_op, mm_pool32axf_op), RS},
92*4882a593Smuzhiyun 	[insn_mtlo]	= {M(mm_pool32a_op, 0, 0, 0, mm_mtlo32_op, mm_pool32axf_op), RS},
93*4882a593Smuzhiyun 	[insn_mul]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_mul_op), RT | RS | RD},
94*4882a593Smuzhiyun 	[insn_or]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_or32_op), RT | RS | RD},
95*4882a593Smuzhiyun 	[insn_ori]	= {M(mm_ori32_op, 0, 0, 0, 0, 0), RT | RS | UIMM},
96*4882a593Smuzhiyun 	[insn_pref]	= {M(mm_pool32c_op, 0, 0, (mm_pref_func << 1), 0, 0), RT | RS | SIMM},
97*4882a593Smuzhiyun 	[insn_rfe]	= {0, 0},
98*4882a593Smuzhiyun 	[insn_sc]	= {M(mm_pool32c_op, 0, 0, (mm_sc_func << 1), 0, 0), RT | RS | SIMM},
99*4882a593Smuzhiyun 	[insn_scd]	= {0, 0},
100*4882a593Smuzhiyun 	[insn_sd]	= {0, 0},
101*4882a593Smuzhiyun 	[insn_sll]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_sll32_op), RT | RS | RD},
102*4882a593Smuzhiyun 	[insn_sllv]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_sllv32_op), RT | RS | RD},
103*4882a593Smuzhiyun 	[insn_slt]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_slt_op), RT | RS | RD},
104*4882a593Smuzhiyun 	[insn_sltiu]	= {M(mm_sltiu32_op, 0, 0, 0, 0, 0), RT | RS | SIMM},
105*4882a593Smuzhiyun 	[insn_sltu]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_sltu_op), RT | RS | RD},
106*4882a593Smuzhiyun 	[insn_sra]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_sra_op), RT | RS | RD},
107*4882a593Smuzhiyun 	[insn_srav]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_srav_op), RT | RS | RD},
108*4882a593Smuzhiyun 	[insn_srl]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_srl32_op), RT | RS | RD},
109*4882a593Smuzhiyun 	[insn_srlv]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_srlv32_op), RT | RS | RD},
110*4882a593Smuzhiyun 	[insn_rotr]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_rotr_op), RT | RS | RD},
111*4882a593Smuzhiyun 	[insn_subu]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_subu32_op), RT | RS | RD},
112*4882a593Smuzhiyun 	[insn_sw]	= {M(mm_sw32_op, 0, 0, 0, 0, 0), RT | RS | SIMM},
113*4882a593Smuzhiyun 	[insn_sync]	= {M(mm_pool32a_op, 0, 0, 0, mm_sync_op, mm_pool32axf_op), RS},
114*4882a593Smuzhiyun 	[insn_tlbp]	= {M(mm_pool32a_op, 0, 0, 0, mm_tlbp_op, mm_pool32axf_op), 0},
115*4882a593Smuzhiyun 	[insn_tlbr]	= {M(mm_pool32a_op, 0, 0, 0, mm_tlbr_op, mm_pool32axf_op), 0},
116*4882a593Smuzhiyun 	[insn_tlbwi]	= {M(mm_pool32a_op, 0, 0, 0, mm_tlbwi_op, mm_pool32axf_op), 0},
117*4882a593Smuzhiyun 	[insn_tlbwr]	= {M(mm_pool32a_op, 0, 0, 0, mm_tlbwr_op, mm_pool32axf_op), 0},
118*4882a593Smuzhiyun 	[insn_wait]	= {M(mm_pool32a_op, 0, 0, 0, mm_wait_op, mm_pool32axf_op), SCIMM},
119*4882a593Smuzhiyun 	[insn_wsbh]	= {M(mm_pool32a_op, 0, 0, 0, mm_wsbh_op, mm_pool32axf_op), RT | RS},
120*4882a593Smuzhiyun 	[insn_xor]	= {M(mm_pool32a_op, 0, 0, 0, 0, mm_xor32_op), RT | RS | RD},
121*4882a593Smuzhiyun 	[insn_xori]	= {M(mm_xori32_op, 0, 0, 0, 0, 0), RT | RS | UIMM},
122*4882a593Smuzhiyun 	[insn_dins]	= {0, 0},
123*4882a593Smuzhiyun 	[insn_dinsm]	= {0, 0},
124*4882a593Smuzhiyun 	[insn_syscall]	= {M(mm_pool32a_op, 0, 0, 0, mm_syscall_op, mm_pool32axf_op), SCIMM},
125*4882a593Smuzhiyun 	[insn_bbit0]	= {0, 0},
126*4882a593Smuzhiyun 	[insn_bbit1]	= {0, 0},
127*4882a593Smuzhiyun 	[insn_lwx]	= {0, 0},
128*4882a593Smuzhiyun 	[insn_ldx]	= {0, 0},
129*4882a593Smuzhiyun };
130*4882a593Smuzhiyun 
131*4882a593Smuzhiyun #undef M
132*4882a593Smuzhiyun 
build_bimm(s32 arg)133*4882a593Smuzhiyun static inline u32 build_bimm(s32 arg)
134*4882a593Smuzhiyun {
135*4882a593Smuzhiyun 	WARN(arg > 0xffff || arg < -0x10000,
136*4882a593Smuzhiyun 	     KERN_WARNING "Micro-assembler field overflow\n");
137*4882a593Smuzhiyun 
138*4882a593Smuzhiyun 	WARN(arg & 0x3, KERN_WARNING "Invalid micro-assembler branch target\n");
139*4882a593Smuzhiyun 
140*4882a593Smuzhiyun 	return ((arg < 0) ? (1 << 15) : 0) | ((arg >> 1) & 0x7fff);
141*4882a593Smuzhiyun }
142*4882a593Smuzhiyun 
build_jimm(u32 arg)143*4882a593Smuzhiyun static inline u32 build_jimm(u32 arg)
144*4882a593Smuzhiyun {
145*4882a593Smuzhiyun 
146*4882a593Smuzhiyun 	WARN(arg & ~((JIMM_MASK << 2) | 1),
147*4882a593Smuzhiyun 	     KERN_WARNING "Micro-assembler field overflow\n");
148*4882a593Smuzhiyun 
149*4882a593Smuzhiyun 	return (arg >> 1) & JIMM_MASK;
150*4882a593Smuzhiyun }
151*4882a593Smuzhiyun 
152*4882a593Smuzhiyun /*
153*4882a593Smuzhiyun  * The order of opcode arguments is implicitly left to right,
154*4882a593Smuzhiyun  * starting with RS and ending with FUNC or IMM.
155*4882a593Smuzhiyun  */
build_insn(u32 ** buf,enum opcode opc,...)156*4882a593Smuzhiyun static void build_insn(u32 **buf, enum opcode opc, ...)
157*4882a593Smuzhiyun {
158*4882a593Smuzhiyun 	const struct insn *ip;
159*4882a593Smuzhiyun 	va_list ap;
160*4882a593Smuzhiyun 	u32 op;
161*4882a593Smuzhiyun 
162*4882a593Smuzhiyun 	if (opc < 0 || opc >= insn_invalid ||
163*4882a593Smuzhiyun 	    (opc == insn_daddiu && r4k_daddiu_bug()) ||
164*4882a593Smuzhiyun 	    (insn_table_MM[opc].match == 0 && insn_table_MM[opc].fields == 0))
165*4882a593Smuzhiyun 		panic("Unsupported Micro-assembler instruction %d", opc);
166*4882a593Smuzhiyun 
167*4882a593Smuzhiyun 	ip = &insn_table_MM[opc];
168*4882a593Smuzhiyun 
169*4882a593Smuzhiyun 	op = ip->match;
170*4882a593Smuzhiyun 	va_start(ap, opc);
171*4882a593Smuzhiyun 	if (ip->fields & RS) {
172*4882a593Smuzhiyun 		if (opc == insn_mfc0 || opc == insn_mtc0 ||
173*4882a593Smuzhiyun 		    opc == insn_cfc1 || opc == insn_ctc1)
174*4882a593Smuzhiyun 			op |= build_rt(va_arg(ap, u32));
175*4882a593Smuzhiyun 		else
176*4882a593Smuzhiyun 			op |= build_rs(va_arg(ap, u32));
177*4882a593Smuzhiyun 	}
178*4882a593Smuzhiyun 	if (ip->fields & RT) {
179*4882a593Smuzhiyun 		if (opc == insn_mfc0 || opc == insn_mtc0 ||
180*4882a593Smuzhiyun 		    opc == insn_cfc1 || opc == insn_ctc1)
181*4882a593Smuzhiyun 			op |= build_rs(va_arg(ap, u32));
182*4882a593Smuzhiyun 		else
183*4882a593Smuzhiyun 			op |= build_rt(va_arg(ap, u32));
184*4882a593Smuzhiyun 	}
185*4882a593Smuzhiyun 	if (ip->fields & RD)
186*4882a593Smuzhiyun 		op |= build_rd(va_arg(ap, u32));
187*4882a593Smuzhiyun 	if (ip->fields & RE)
188*4882a593Smuzhiyun 		op |= build_re(va_arg(ap, u32));
189*4882a593Smuzhiyun 	if (ip->fields & SIMM)
190*4882a593Smuzhiyun 		op |= build_simm(va_arg(ap, s32));
191*4882a593Smuzhiyun 	if (ip->fields & UIMM)
192*4882a593Smuzhiyun 		op |= build_uimm(va_arg(ap, u32));
193*4882a593Smuzhiyun 	if (ip->fields & BIMM)
194*4882a593Smuzhiyun 		op |= build_bimm(va_arg(ap, s32));
195*4882a593Smuzhiyun 	if (ip->fields & JIMM)
196*4882a593Smuzhiyun 		op |= build_jimm(va_arg(ap, u32));
197*4882a593Smuzhiyun 	if (ip->fields & FUNC)
198*4882a593Smuzhiyun 		op |= build_func(va_arg(ap, u32));
199*4882a593Smuzhiyun 	if (ip->fields & SET)
200*4882a593Smuzhiyun 		op |= build_set(va_arg(ap, u32));
201*4882a593Smuzhiyun 	if (ip->fields & SCIMM)
202*4882a593Smuzhiyun 		op |= build_scimm(va_arg(ap, u32));
203*4882a593Smuzhiyun 	va_end(ap);
204*4882a593Smuzhiyun 
205*4882a593Smuzhiyun #ifdef CONFIG_CPU_LITTLE_ENDIAN
206*4882a593Smuzhiyun 	**buf = ((op & 0xffff) << 16) | (op >> 16);
207*4882a593Smuzhiyun #else
208*4882a593Smuzhiyun 	**buf = op;
209*4882a593Smuzhiyun #endif
210*4882a593Smuzhiyun 	(*buf)++;
211*4882a593Smuzhiyun }
212*4882a593Smuzhiyun 
213*4882a593Smuzhiyun static inline void
__resolve_relocs(struct uasm_reloc * rel,struct uasm_label * lab)214*4882a593Smuzhiyun __resolve_relocs(struct uasm_reloc *rel, struct uasm_label *lab)
215*4882a593Smuzhiyun {
216*4882a593Smuzhiyun 	long laddr = (long)lab->addr;
217*4882a593Smuzhiyun 	long raddr = (long)rel->addr;
218*4882a593Smuzhiyun 
219*4882a593Smuzhiyun 	switch (rel->type) {
220*4882a593Smuzhiyun 	case R_MIPS_PC16:
221*4882a593Smuzhiyun #ifdef CONFIG_CPU_LITTLE_ENDIAN
222*4882a593Smuzhiyun 		*rel->addr |= (build_bimm(laddr - (raddr + 4)) << 16);
223*4882a593Smuzhiyun #else
224*4882a593Smuzhiyun 		*rel->addr |= build_bimm(laddr - (raddr + 4));
225*4882a593Smuzhiyun #endif
226*4882a593Smuzhiyun 		break;
227*4882a593Smuzhiyun 
228*4882a593Smuzhiyun 	default:
229*4882a593Smuzhiyun 		panic("Unsupported Micro-assembler relocation %d",
230*4882a593Smuzhiyun 		      rel->type);
231*4882a593Smuzhiyun 	}
232*4882a593Smuzhiyun }
233