1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /* align.c - handle alignment exceptions for the Power PC.
5 * Copyright (c) 1998-1999 TiVo, Inc.
6 * PowerPC 403GCX modifications.
8 * PowerPC 403GCX/405GP modifications.
9 * Copyright (c) 2001-2002 PPC64 team, IBM Corp
10 * 64-bit and Power4 support
11 * Copyright (c) 2005 Benjamin Herrenschmidt, IBM Corp
13 * Merge ppc32 and ppc64 implementations
16 #include <linux/kernel.h>
18 #include <asm/processor.h>
19 #include <linux/uaccess.h>
20 #include <asm/cache.h>
21 #include <asm/cputable.h>
22 #include <asm/emulated_ops.h>
23 #include <asm/switch_to.h>
24 #include <asm/disassemble.h>
25 #include <asm/cpu_has_feature.h>
26 #include <asm/sstep.h>
35 #define INVALID { 0, 0 }
37 /* Bits in the flags field */
38 #define LD 0 /* load */
39 #define ST 1 /* store */
40 #define SE 2 /* sign-extend value, or FP ld/st as word */
41 #define SW 0x20 /* byte swap */
42 #define E4 0x40 /* SPE endianness is word */
43 #define E8 0x80 /* SPE endianness is double word */
47 static struct aligninfo spe_aligninfo[32] = {
48 { 8, LD+E8 }, /* 0 00 00: evldd[x] */
49 { 8, LD+E4 }, /* 0 00 01: evldw[x] */
50 { 8, LD }, /* 0 00 10: evldh[x] */
51 INVALID, /* 0 00 11 */
52 { 2, LD }, /* 0 01 00: evlhhesplat[x] */
53 INVALID, /* 0 01 01 */
54 { 2, LD }, /* 0 01 10: evlhhousplat[x] */
55 { 2, LD+SE }, /* 0 01 11: evlhhossplat[x] */
56 { 4, LD }, /* 0 10 00: evlwhe[x] */
57 INVALID, /* 0 10 01 */
58 { 4, LD }, /* 0 10 10: evlwhou[x] */
59 { 4, LD+SE }, /* 0 10 11: evlwhos[x] */
60 { 4, LD+E4 }, /* 0 11 00: evlwwsplat[x] */
61 INVALID, /* 0 11 01 */
62 { 4, LD }, /* 0 11 10: evlwhsplat[x] */
63 INVALID, /* 0 11 11 */
65 { 8, ST+E8 }, /* 1 00 00: evstdd[x] */
66 { 8, ST+E4 }, /* 1 00 01: evstdw[x] */
67 { 8, ST }, /* 1 00 10: evstdh[x] */
68 INVALID, /* 1 00 11 */
69 INVALID, /* 1 01 00 */
70 INVALID, /* 1 01 01 */
71 INVALID, /* 1 01 10 */
72 INVALID, /* 1 01 11 */
73 { 4, ST }, /* 1 10 00: evstwhe[x] */
74 INVALID, /* 1 10 01 */
75 { 4, ST }, /* 1 10 10: evstwho[x] */
76 INVALID, /* 1 10 11 */
77 { 4, ST+E4 }, /* 1 11 00: evstwwe[x] */
78 INVALID, /* 1 11 01 */
79 { 4, ST+E4 }, /* 1 11 10: evstwwo[x] */
80 INVALID, /* 1 11 11 */
86 #define EVLHHESPLAT 0x04
87 #define EVLHHOUSPLAT 0x06
88 #define EVLHHOSSPLAT 0x07
92 #define EVLWWSPLAT 0x0C
93 #define EVLWHSPLAT 0x0E
103 * Emulate SPE loads and stores.
104 * Only Book-E has these instructions, and it does true little-endian,
105 * so we don't need the address swizzling.
107 static int emulate_spe(struct pt_regs *regs, unsigned int reg,
108 struct ppc_inst ppc_instr)
117 unsigned char __user *p, *addr;
118 unsigned long *evr = ¤t->thread.evr[reg];
119 unsigned int nb, flags, instr;
121 instr = ppc_inst_val(ppc_instr);
122 instr = (instr >> 1) & 0x1f;
124 /* DAR has the operand effective address */
125 addr = (unsigned char __user *)regs->dar;
127 nb = spe_aligninfo[instr].len;
128 flags = spe_aligninfo[instr].flags;
130 /* Verify the address of the operand */
131 if (unlikely(user_mode(regs) &&
132 !access_ok(addr, nb)))
136 if (unlikely(!user_mode(regs)))
139 flush_spe_to_thread(current);
141 /* If we are loading, get the data from user space, else
142 * get it from register values
151 data.w[1] = regs->gpr[reg];
154 data.h[2] = *evr >> 16;
155 data.h[3] = regs->gpr[reg] >> 16;
158 data.h[2] = *evr & 0xffff;
159 data.h[3] = regs->gpr[reg] & 0xffff;
165 data.w[1] = regs->gpr[reg];
171 temp.ll = data.ll = 0;
177 ret |= __get_user_inatomic(temp.v[0], p++);
178 ret |= __get_user_inatomic(temp.v[1], p++);
179 ret |= __get_user_inatomic(temp.v[2], p++);
180 ret |= __get_user_inatomic(temp.v[3], p++);
183 ret |= __get_user_inatomic(temp.v[4], p++);
184 ret |= __get_user_inatomic(temp.v[5], p++);
187 ret |= __get_user_inatomic(temp.v[6], p++);
188 ret |= __get_user_inatomic(temp.v[7], p++);
200 data.h[0] = temp.h[3];
201 data.h[2] = temp.h[3];
205 data.h[1] = temp.h[3];
206 data.h[3] = temp.h[3];
209 data.h[0] = temp.h[2];
210 data.h[2] = temp.h[3];
214 data.h[1] = temp.h[2];
215 data.h[3] = temp.h[3];
218 data.w[0] = temp.w[1];
219 data.w[1] = temp.w[1];
222 data.h[0] = temp.h[2];
223 data.h[1] = temp.h[2];
224 data.h[2] = temp.h[3];
225 data.h[3] = temp.h[3];
233 switch (flags & 0xf0) {
235 data.ll = swab64(data.ll);
238 data.w[0] = swab32(data.w[0]);
239 data.w[1] = swab32(data.w[1]);
241 /* Its half word endian */
243 data.h[0] = swab16(data.h[0]);
244 data.h[1] = swab16(data.h[1]);
245 data.h[2] = swab16(data.h[2]);
246 data.h[3] = swab16(data.h[3]);
252 data.w[0] = (s16)data.h[1];
253 data.w[1] = (s16)data.h[3];
256 /* Store result to memory or update registers */
262 ret |= __put_user_inatomic(data.v[0], p++);
263 ret |= __put_user_inatomic(data.v[1], p++);
264 ret |= __put_user_inatomic(data.v[2], p++);
265 ret |= __put_user_inatomic(data.v[3], p++);
268 ret |= __put_user_inatomic(data.v[4], p++);
269 ret |= __put_user_inatomic(data.v[5], p++);
272 ret |= __put_user_inatomic(data.v[6], p++);
273 ret |= __put_user_inatomic(data.v[7], p++);
279 regs->gpr[reg] = data.w[1];
284 #endif /* CONFIG_SPE */
287 * Called on alignment exception. Attempts to fixup
289 * Return 1 on success
290 * Return 0 if unable to handle the interrupt
291 * Return -EFAULT if data address is bad
292 * Other negative return values indicate that the instruction can't
293 * be emulated, and the process should be given a SIGBUS.
296 int fix_alignment(struct pt_regs *regs)
298 struct ppc_inst instr;
299 struct instruction_op op;
303 * We require a complete register set, if not, then our assembly
306 CHECK_FULL_REGS(regs);
308 if (unlikely(__get_user_instr(instr, (void __user *)regs->nip)))
310 if ((regs->msr & MSR_LE) != (MSR_KERNEL & MSR_LE)) {
311 /* We don't handle PPC little-endian any more... */
312 if (cpu_has_feature(CPU_FTR_PPC_LE))
314 instr = ppc_inst_swab(instr);
318 if (ppc_inst_primary_opcode(instr) == 0x4) {
319 int reg = (ppc_inst_val(instr) >> 21) & 0x1f;
320 PPC_WARN_ALIGNMENT(spe, regs);
321 return emulate_spe(regs, reg, instr);
327 * ISA 3.0 (such as P9) copy, copy_first, paste and paste_last alignment
330 * Send a SIGBUS to the process that caused the fault.
332 * We do not emulate these because paste may contain additional metadata
333 * when pasting to a co-processor. Furthermore, paste_last is the
334 * synchronisation point for preceding copy/paste sequences.
336 if ((ppc_inst_val(instr) & 0xfc0006fe) == (PPC_INST_COPY & 0xfc0006fe))
339 r = analyse_instr(&op, regs, instr);
343 type = GETTYPE(op.type);
344 if (!OP_IS_LOAD_STORE(type)) {
345 if (op.type != CACHEOP + DCBZ)
347 PPC_WARN_ALIGNMENT(dcbz, regs);
348 r = emulate_dcbz(op.ea, regs);
350 if (type == LARX || type == STCX)
352 PPC_WARN_ALIGNMENT(unaligned, regs);
353 r = emulate_loadstore(regs, &op);