nixpkgs/pkgs/os-specific/linux/kernel/mips-fpu-sigill.patch

From bf55ef4e3c2f622ac013f196affbd11b67b59223 Mon Sep 17 00:00:00 2001
From: Mark H Weaver <mhw@netris.org>
Date: Fri, 28 Oct 2011 13:24:37 -0400
Subject: [PATCH 2/4] Fix handling of prefx instruction in mips/math-emu

* The instruction is named prefx, not pfetch, and its function
  field is 0x17, not 0x07.

* Recognize the prefx instruction regardless of what bits happen to be
  in bits 21-25, which is the format field of the floating-point ops,
  but holds the base register of the prefx instruction.
---
 arch/mips/include/asm/inst.h |    4 ++--
 arch/mips/math-emu/cp1emu.c  |   16 +++++++---------
 2 files changed, 9 insertions(+), 11 deletions(-)

diff --git a/arch/mips/include/asm/inst.h b/arch/mips/include/asm/inst.h
index ab84064..3048edc 100644
--- a/arch/mips/include/asm/inst.h
+++ b/arch/mips/include/asm/inst.h
@@ -161,8 +161,8 @@ enum cop1_sdw_func {
  */
 enum cop1x_func {
 	lwxc1_op     =  0x00, ldxc1_op     =  0x01,
-	pfetch_op    =  0x07, swxc1_op     =  0x08,
-	sdxc1_op     =  0x09, madd_s_op    =  0x20,
+	swxc1_op     =  0x08, sdxc1_op     =  0x09,
+	prefx_op     =  0x17, madd_s_op    =  0x20,
 	madd_d_op    =  0x21, madd_e_op    =  0x22,
 	msub_s_op    =  0x28, msub_d_op    =  0x29,
 	msub_e_op    =  0x2a, nmadd_s_op   =  0x30,
diff --git a/arch/mips/math-emu/cp1emu.c b/arch/mips/math-emu/cp1emu.c
index dbf2f93..87ddba1 100644
--- a/arch/mips/math-emu/cp1emu.c
+++ b/arch/mips/math-emu/cp1emu.c
@@ -739,7 +739,7 @@ static int fpux_emu(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
 			break;
 
 		default:
-			return SIGILL;
+			goto SIGILL_unless_prefx_op;
 		}
 		break;
 	}
@@ -809,19 +809,17 @@ static int fpux_emu(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
 			goto copcsr;
 
 		default:
-			return SIGILL;
+			goto SIGILL_unless_prefx_op;
 		}
 		break;
 	}
 
-	case 0x7:		/* 7 */
-		if (MIPSInst_FUNC(ir) != pfetch_op) {
-			return SIGILL;
-		}
-		/* ignore prefx operation */
-		break;
-
 	default:
+	      SIGILL_unless_prefx_op:
+		if (MIPSInst_FUNC(ir) == prefx_op) {
+			/* ignore prefx operation */
+			break;
+		}
 		return SIGILL;
 	}
 
-- 
1.7.5.4

From 97a564e3eddbfb84844b8eccb3bd751c71dfb3eb Mon Sep 17 00:00:00 2001
From: Mark H Weaver <mhw@netris.org>
Date: Fri, 28 Oct 2011 13:35:27 -0400
Subject: [PATCH 3/4] Don't process empty cause flags after simple fp move on
 mips

---
 arch/mips/math-emu/cp1emu.c |    4 ++--
 1 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/arch/mips/math-emu/cp1emu.c b/arch/mips/math-emu/cp1emu.c
index 87ddba1..fefcba2 100644
--- a/arch/mips/math-emu/cp1emu.c
+++ b/arch/mips/math-emu/cp1emu.c
@@ -912,7 +912,7 @@ static int fpu_emu(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
 		case fmov_op:
 			/* an easy one */
 			SPFROMREG(rv.s, MIPSInst_FS(ir));
-			goto copcsr;
+			break;
 
 			/* binary op on handler */
 		      scopbop:
@@ -1099,7 +1099,7 @@ static int fpu_emu(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
 		case fmov_op:
 			/* an easy one */
 			DPFROMREG(rv.d, MIPSInst_FS(ir));
-			goto copcsr;
+			break;
 
 			/* binary op on handler */
 		      dcopbop:{
-- 
1.7.5.4

From 4051727b3007ef3675e7258ed86fa8517f86d929 Mon Sep 17 00:00:00 2001
From: Mark H Weaver <mhw@netris.org>
Date: Fri, 28 Oct 2011 13:39:10 -0400
Subject: [PATCH 4/4] Support Loongson2f floating-point instructions in
 mips/math-emu

* (arch/mips/include/asm/inst.h): Add Loongson2f function field values
  for madd/msub/nmadd/nmsub that use the spec2 opcode, and the
  Loongson2f/MIPS-5 format field value for paired-single
  floating-point operations.

* (arch/mips/math-emu/cp1emu.c): Add support for the Loongson2f
  instructions for madd/msub/nmadd/nmsub, which use the spec2 opcode.
  Also add support for the Loongson2f instructions that use the
  paired-single floating-point format.
---
 arch/mips/include/asm/inst.h |    4 +-
 arch/mips/math-emu/cp1emu.c  |  287 +++++++++++++++++++++++++++++++++++++++++-
 2 files changed, 289 insertions(+), 2 deletions(-)

diff --git a/arch/mips/include/asm/inst.h b/arch/mips/include/asm/inst.h
index 3048edc..0e8ba7c 100644
--- a/arch/mips/include/asm/inst.h
+++ b/arch/mips/include/asm/inst.h
@@ -61,6 +61,8 @@ enum spec_op {
 enum spec2_op {
 	madd_op, maddu_op, mul_op, spec2_3_unused_op,
 	msub_op, msubu_op, /* more unused ops */
+	loongson_madd_op = 0x18, loongson_msub_op,
+	loongson_nmadd_op, loongson_nmsub_op,
 	clz_op = 0x20, clo_op,
 	dclz_op = 0x24, dclo_op,
 	sdbpp_op = 0x3f
@@ -133,7 +135,7 @@ enum cop0_com_func {
  */
 enum cop1_fmt {
 	s_fmt, d_fmt, e_fmt, q_fmt,
-	w_fmt, l_fmt
+	w_fmt, l_fmt, ps_fmt
 };
 
 /*
diff --git a/arch/mips/math-emu/cp1emu.c b/arch/mips/math-emu/cp1emu.c
index fefcba2..166b2a4 100644
--- a/arch/mips/math-emu/cp1emu.c
+++ b/arch/mips/math-emu/cp1emu.c
@@ -7,6 +7,9 @@
  * Kevin D. Kissell, kevink@mips.com and Carsten Langgaard, carstenl@mips.com
  * Copyright (C) 2000  MIPS Technologies, Inc.
  *
+ * Loongson instruction support
+ * Copyright (C) 2011  Mark H Weaver <mhw@netris.org>
+ *
  *  This program is free software; you can distribute it and/or modify it
  *  under the terms of the GNU General Public License (Version 2) as
  *  published by the Free Software Foundation.
@@ -57,6 +60,14 @@
 #endif
 #define __mips 4
 
+#ifdef __loongson_fp
+#undef __loongson_fp
+#endif
+#if __mips >= 4 && __mips != 32
+/* Include support for Loongson floating point instructions */
+#define __loongson_fp 1
+#endif
+
 /* Function which emulates a floating point instruction. */
 
 static int fpu_emu(struct pt_regs *, struct mips_fpu_struct *,
@@ -66,6 +77,10 @@ static int fpu_emu(struct pt_regs *, struct mips_fpu_struct *,
 static int fpux_emu(struct pt_regs *,
 	struct mips_fpu_struct *, mips_instruction, void *__user *);
 #endif
+#ifdef __loongson_fp
+static int loongson_spec2_emu(struct pt_regs *,
+	struct mips_fpu_struct *, mips_instruction, void *__user *);
+#endif
 
 /* Further private data for which no space exists in mips_fpu_struct */
 
@@ -203,6 +218,14 @@ static inline int cop1_64bit(struct pt_regs *xcp)
 #define DPFROMREG(dp, x)	DIFROMREG((dp).bits, x)
 #define DPTOREG(dp, x)	DITOREG((dp).bits, x)
 
+/* Support for Loongson paired single floating-point format */
+#define PSIFROMREG(si1, si2, x) ({ u64 di; DIFROMREG(di, x);		\
+			(si1) = (u32)di; (si2) = (u32)(di >> 32); })
+#define PSITOREG(si1, si2, x) DITOREG((si1) | ((u64)(si2) << 32), x)
+
+#define PSPFROMREG(sp1, sp2, x) PSIFROMREG((sp1).bits, (sp2).bits, x)
+#define PSPTOREG(sp1, sp2, x)	PSITOREG((sp1).bits, (sp2).bits, x)
+
 /*
  * Emulate the single floating point instruction pointed at by EPC.
  * Two instructions if the instruction is in a branch delay slot.
@@ -568,6 +591,15 @@ static int cop1Emulate(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
 		break;
 #endif
 
+#ifdef __loongson_fp
+	case spec2_op:{
+		int sig = loongson_spec2_emu(xcp, ctx, ir, fault_addr);
+		if (sig)
+			return sig;
+		break;
+	}
+#endif
+
 	default:
 		return SIGILL;
 	}
@@ -646,6 +678,172 @@ DEF3OP(msub, dp, ieee754dp_mul, ieee754dp_sub, );
 DEF3OP(nmadd, dp, ieee754dp_mul, ieee754dp_add, ieee754dp_neg);
 DEF3OP(nmsub, dp, ieee754dp_mul, ieee754dp_sub, ieee754dp_neg);
 
+#ifdef __loongson_fp
+static int loongson_spec2_emu(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
+	mips_instruction ir, void *__user *fault_addr)
+{
+	int rfmt;		/* resulting format */
+	unsigned rcsr = 0;	/* resulting csr */
+	union {
+		ieee754dp d;
+		struct {
+			ieee754sp s;
+			ieee754sp s2;
+		};
+	} rv;			/* resulting value */
+
+	/* XXX maybe add a counter for loongson spec2 fp instructions? */
+	/* MIPS_FPU_EMU_INC_STATS(cp1xops); */
+
+	switch (rfmt = (MIPSInst_FFMT(ir) & 0xf)) {
+	case s_fmt:{
+		ieee754sp(*handler) (ieee754sp, ieee754sp, ieee754sp);
+		ieee754sp fd, fs, ft;
+
+		switch (MIPSInst_FUNC(ir)) {
+		case loongson_madd_op:
+			handler = fpemu_sp_madd;
+			goto scoptop;
+		case loongson_msub_op:
+			handler = fpemu_sp_msub;
+			goto scoptop;
+		case loongson_nmadd_op:
+			handler = fpemu_sp_nmadd;
+			goto scoptop;
+		case loongson_nmsub_op:
+			handler = fpemu_sp_nmsub;
+			goto scoptop;
+
+		      scoptop:
+			SPFROMREG(fd, MIPSInst_FD(ir));
+			SPFROMREG(fs, MIPSInst_FS(ir));
+			SPFROMREG(ft, MIPSInst_FT(ir));
+			rv.s = (*handler) (fd, fs, ft);
+
+		      copcsr:
+			if (ieee754_cxtest(IEEE754_INEXACT))
+				rcsr |= FPU_CSR_INE_X | FPU_CSR_INE_S;
+			if (ieee754_cxtest(IEEE754_UNDERFLOW))
+				rcsr |= FPU_CSR_UDF_X | FPU_CSR_UDF_S;
+			if (ieee754_cxtest(IEEE754_OVERFLOW))
+				rcsr |= FPU_CSR_OVF_X | FPU_CSR_OVF_S;
+			if (ieee754_cxtest(IEEE754_INVALID_OPERATION))
+				rcsr |= FPU_CSR_INV_X | FPU_CSR_INV_S;
+
+			break;
+
+		default:
+			return SIGILL;
+		}
+		break;
+	}
+
+	case d_fmt:{
+		ieee754dp(*handler) (ieee754dp, ieee754dp, ieee754dp);
+		ieee754dp fd, fs, ft;
+
+		switch (MIPSInst_FUNC(ir)) {
+		case loongson_madd_op:
+			handler = fpemu_dp_madd;
+			goto dcoptop;
+		case loongson_msub_op:
+			handler = fpemu_dp_msub;
+			goto dcoptop;
+		case loongson_nmadd_op:
+			handler = fpemu_dp_nmadd;
+			goto dcoptop;
+		case loongson_nmsub_op:
+			handler = fpemu_dp_nmsub;
+			goto dcoptop;
+
+		      dcoptop:
+			DPFROMREG(fd, MIPSInst_FD(ir));
+			DPFROMREG(fs, MIPSInst_FS(ir));
+			DPFROMREG(ft, MIPSInst_FT(ir));
+			rv.d = (*handler) (fd, fs, ft);
+			goto copcsr;
+
+		default:
+			return SIGILL;
+		}
+		break;
+	}
+
+	case ps_fmt:{
+		ieee754sp(*handler) (ieee754sp, ieee754sp, ieee754sp);
+		struct _ieee754_csr ieee754_csr_save;
+		ieee754sp fd1, fs1, ft1;
+		ieee754sp fd2, fs2, ft2;
+
+		switch (MIPSInst_FUNC(ir)) {
+		case loongson_madd_op:
+			handler = fpemu_sp_madd;
+			goto pscoptop;
+		case loongson_msub_op:
+			handler = fpemu_sp_msub;
+			goto pscoptop;
+		case loongson_nmadd_op:
+			handler = fpemu_sp_nmadd;
+			goto pscoptop;
+		case loongson_nmsub_op:
+			handler = fpemu_sp_nmsub;
+			goto pscoptop;
+
+		      pscoptop:
+			PSPFROMREG(fd1, fd2, MIPSInst_FD(ir));
+			PSPFROMREG(fs1, fs2, MIPSInst_FS(ir));
+			PSPFROMREG(ft1, ft2, MIPSInst_FT(ir));
+			rv.s = (*handler) (fd1, fs1, ft1);
+			ieee754_csr_save = ieee754_csr;
+			rv.s2 = (*handler) (fd2, fs2, ft2);
+			ieee754_csr.cx |= ieee754_csr_save.cx;
+			ieee754_csr.sx |= ieee754_csr_save.sx;
+			goto copcsr;
+
+		default:
+			return SIGILL;
+		}
+		break;
+	}
+
+	default:
+		return SIGILL;
+	}
+
+	/*
+	 * Update the fpu CSR register for this operation.
+	 * If an exception is required, generate a tidy SIGFPE exception,
+	 * without updating the result register.
+	 * Note: cause exception bits do not accumulate, they are rewritten
+	 * for each op; only the flag/sticky bits accumulate.
+	 */
+	ctx->fcr31 = (ctx->fcr31 & ~FPU_CSR_ALL_X) | rcsr;
+	if ((ctx->fcr31 >> 5) & ctx->fcr31 & FPU_CSR_ALL_E) {
+		/*printk ("SIGFPE: fpu csr = %08x\n",ctx->fcr31); */
+		return SIGFPE;
+	}
+
+	/*
+	 * Now we can safely write the result back to the register file.
+	 */
+	switch (rfmt) {
+	case d_fmt:
+		DPTOREG(rv.d, MIPSInst_FD(ir));
+		break;
+	case s_fmt:
+		SPTOREG(rv.s, MIPSInst_FD(ir));
+		break;
+	case ps_fmt:
+		PSPTOREG(rv.s, rv.s2, MIPSInst_FD(ir));
+		break;
+	default:
+		return SIGILL;
+	}
+
+	return 0;
+}
+#endif
+
 static int fpux_emu(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
 	mips_instruction ir, void *__user *fault_addr)
 {
@@ -840,7 +1038,12 @@ static int fpu_emu(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
 	unsigned cond;
 	union {
 		ieee754dp d;
-		ieee754sp s;
+		struct {
+			ieee754sp s;
+#ifdef __loongson_fp
+			ieee754sp s2; /* for Loongson paired singles */
+#endif
+		};
 		int w;
 #ifdef __mips64
 		s64 l;
@@ -1210,6 +1413,83 @@ static int fpu_emu(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
 		break;
 	}
 
+#ifdef __loongson_fp
+	case ps_fmt:{		/* 6 */
+		/* Support for Loongson paired single fp instructions */
+		union {
+			ieee754sp(*b) (ieee754sp, ieee754sp);
+			ieee754sp(*u) (ieee754sp);
+		} handler;
+
+		switch (MIPSInst_FUNC(ir)) {
+			/* binary ops */
+		case fadd_op:
+			handler.b = ieee754sp_add;
+			goto pscopbop;
+		case fsub_op:
+			handler.b = ieee754sp_sub;
+			goto pscopbop;
+		case fmul_op:
+			handler.b = ieee754sp_mul;
+			goto pscopbop;
+
+			/* unary  ops */
+		case fabs_op:
+			handler.u = ieee754sp_abs;
+			goto pscopuop;
+		case fneg_op:
+			handler.u = ieee754sp_neg;
+			goto pscopuop;
+		case fmov_op:
+			/* an easy one */
+			PSPFROMREG(rv.s, rv.s2, MIPSInst_FS(ir));
+			break;
+
+		      pscopbop: /* paired binary op handler */
+			{
+				struct _ieee754_csr ieee754_csr_save;
+				ieee754sp fs1, ft1;
+				ieee754sp fs2, ft2;
+
+				PSPFROMREG(fs1, fs2, MIPSInst_FS(ir));
+				PSPFROMREG(ft1, ft2, MIPSInst_FT(ir));
+				rv.s  = (*handler.b) (fs1, ft1);
+				ieee754_csr_save = ieee754_csr;
+				rv.s2 = (*handler.b) (fs2, ft2);
+				ieee754_csr.cx |= ieee754_csr_save.cx;
+				ieee754_csr.sx |= ieee754_csr_save.sx;
+				goto copcsr;
+			}
+		      pscopuop: /* paired unary op handler */
+			{
+				struct _ieee754_csr ieee754_csr_save;
+				ieee754sp fs1;
+				ieee754sp fs2;
+
+				PSPFROMREG(fs1, fs2, MIPSInst_FS(ir));
+				rv.s  = (*handler.u) (fs1);
+				ieee754_csr_save = ieee754_csr;
+				rv.s2 = (*handler.u) (fs2);
+				ieee754_csr.cx |= ieee754_csr_save.cx;
+				ieee754_csr.sx |= ieee754_csr_save.sx;
+				goto copcsr;
+			}
+			break;
+
+		default:
+			if (MIPSInst_FUNC(ir) >= fcmp_op) {
+				/* Loongson fp hardware handles all
+				   cases of fp compare insns, so we
+				   shouldn't have to */
+				printk ("Loongson paired-single fp compare"
+					" unimplemented in cp1emu.c\n");
+			}
+			return SIGILL;
+		}
+		break;
+	}
+#endif
+
 	case w_fmt:{
 		ieee754sp fs;
 
@@ -1299,6 +1579,11 @@ static int fpu_emu(struct pt_regs *xcp, struct mips_fpu_struct *ctx,
 		DITOREG(rv.l, MIPSInst_FD(ir));
 		break;
 #endif
+#ifdef __loongson_fp
+	case ps_fmt:
+		PSPTOREG(rv.s, rv.s2, MIPSInst_FD(ir));
+		break;
+#endif
 	default:
 		return SIGILL;
 	}
-- 
1.7.5.4
Adding two kernel patches for mips, that make the life easier on loongson2f (less sigill, less sigbus). Related to bad handling of FPU instructions. I apply them only to linux 3.4, although I think they can apply to many older kernels too. svn path=/nixpkgs/trunk/; revision=34522 2012-06-16 11:49:03 +01:00			`From bf55ef4e3c2f622ac013f196affbd11b67b59223 Mon Sep 17 00:00:00 2001`
			`From: Mark H Weaver <mhw@netris.org>`
			`Date: Fri, 28 Oct 2011 13:24:37 -0400`
			`Subject: [PATCH 2/4] Fix handling of prefx instruction in mips/math-emu`

			`* The instruction is named prefx, not pfetch, and its function`
			`field is 0x17, not 0x07.`

			`* Recognize the prefx instruction regardless of what bits happen to be`
			`in bits 21-25, which is the format field of the floating-point ops,`
			`but holds the base register of the prefx instruction.`
			`---`
			`arch/mips/include/asm/inst.h \| 4 ++--`
			`arch/mips/math-emu/cp1emu.c \| 16 +++++++---------`
			`2 files changed, 9 insertions(+), 11 deletions(-)`

			`diff --git a/arch/mips/include/asm/inst.h b/arch/mips/include/asm/inst.h`
			`index ab84064..3048edc 100644`
			`--- a/arch/mips/include/asm/inst.h`
			`+++ b/arch/mips/include/asm/inst.h`
			`@@ -161,8 +161,8 @@ enum cop1_sdw_func {`
			`*/`
			`enum cop1x_func {`
			`lwxc1_op = 0x00, ldxc1_op = 0x01,`
			`- pfetch_op = 0x07, swxc1_op = 0x08,`
			`- sdxc1_op = 0x09, madd_s_op = 0x20,`
			`+ swxc1_op = 0x08, sdxc1_op = 0x09,`
			`+ prefx_op = 0x17, madd_s_op = 0x20,`
			`madd_d_op = 0x21, madd_e_op = 0x22,`
			`msub_s_op = 0x28, msub_d_op = 0x29,`
			`msub_e_op = 0x2a, nmadd_s_op = 0x30,`
			`diff --git a/arch/mips/math-emu/cp1emu.c b/arch/mips/math-emu/cp1emu.c`
			`index dbf2f93..87ddba1 100644`
			`--- a/arch/mips/math-emu/cp1emu.c`
			`+++ b/arch/mips/math-emu/cp1emu.c`
			`@@ -739,7 +739,7 @@ static int fpux_emu(struct pt_regs xcp, struct mips_fpu_struct ctx,`
			`break;`

			`default:`
			`- return SIGILL;`
			`+ goto SIGILL_unless_prefx_op;`
			`}`
			`break;`
			`}`
			`@@ -809,19 +809,17 @@ static int fpux_emu(struct pt_regs xcp, struct mips_fpu_struct ctx,`
			`goto copcsr;`

			`default:`
			`- return SIGILL;`
			`+ goto SIGILL_unless_prefx_op;`
			`}`
			`break;`
			`}`

			`- case 0x7: /* 7 */`
			`- if (MIPSInst_FUNC(ir) != pfetch_op) {`
			`- return SIGILL;`
			`- }`
			`- /* ignore prefx operation */`
			`- break;`
			`-`
			`default:`
			`+ SIGILL_unless_prefx_op:`
			`+ if (MIPSInst_FUNC(ir) == prefx_op) {`
			`+ /* ignore prefx operation */`
			`+ break;`
			`+ }`
			`return SIGILL;`
			`}`

			`--`
			`1.7.5.4`

			`From 97a564e3eddbfb84844b8eccb3bd751c71dfb3eb Mon Sep 17 00:00:00 2001`
			`From: Mark H Weaver <mhw@netris.org>`
			`Date: Fri, 28 Oct 2011 13:35:27 -0400`
			`Subject: [PATCH 3/4] Don't process empty cause flags after simple fp move on`
			`mips`

			`---`
			`arch/mips/math-emu/cp1emu.c \| 4 ++--`
			`1 files changed, 2 insertions(+), 2 deletions(-)`

			`diff --git a/arch/mips/math-emu/cp1emu.c b/arch/mips/math-emu/cp1emu.c`
			`index 87ddba1..fefcba2 100644`
			`--- a/arch/mips/math-emu/cp1emu.c`
			`+++ b/arch/mips/math-emu/cp1emu.c`
			`@@ -912,7 +912,7 @@ static int fpu_emu(struct pt_regs xcp, struct mips_fpu_struct ctx,`
			`case fmov_op:`
			`/* an easy one */`
			`SPFROMREG(rv.s, MIPSInst_FS(ir));`
			`- goto copcsr;`
			`+ break;`

			`/* binary op on handler */`
			`scopbop:`
			`@@ -1099,7 +1099,7 @@ static int fpu_emu(struct pt_regs xcp, struct mips_fpu_struct ctx,`
			`case fmov_op:`
			`/* an easy one */`
			`DPFROMREG(rv.d, MIPSInst_FS(ir));`
			`- goto copcsr;`
			`+ break;`

			`/* binary op on handler */`
			`dcopbop:{`
			`--`
			`1.7.5.4`

Fixing the mips patch for sigill fpu cases. svn path=/nixpkgs/trunk/; revision=34527 2012-06-16 16:37:04 +01:00			`From 4051727b3007ef3675e7258ed86fa8517f86d929 Mon Sep 17 00:00:00 2001`
			`From: Mark H Weaver <mhw@netris.org>`
			`Date: Fri, 28 Oct 2011 13:39:10 -0400`
			`Subject: [PATCH 4/4] Support Loongson2f floating-point instructions in`
			`mips/math-emu`

			`* (arch/mips/include/asm/inst.h): Add Loongson2f function field values`
			`for madd/msub/nmadd/nmsub that use the spec2 opcode, and the`
			`Loongson2f/MIPS-5 format field value for paired-single`
			`floating-point operations.`

			`* (arch/mips/math-emu/cp1emu.c): Add support for the Loongson2f`
			`instructions for madd/msub/nmadd/nmsub, which use the spec2 opcode.`
			`Also add support for the Loongson2f instructions that use the`
			`paired-single floating-point format.`
			`---`
			`arch/mips/include/asm/inst.h \| 4 +-`
			`arch/mips/math-emu/cp1emu.c \| 287 +++++++++++++++++++++++++++++++++++++++++-`
			`2 files changed, 289 insertions(+), 2 deletions(-)`

			`diff --git a/arch/mips/include/asm/inst.h b/arch/mips/include/asm/inst.h`
			`index 3048edc..0e8ba7c 100644`
			`--- a/arch/mips/include/asm/inst.h`
			`+++ b/arch/mips/include/asm/inst.h`
			`@@ -61,6 +61,8 @@ enum spec_op {`
			`enum spec2_op {`
			`madd_op, maddu_op, mul_op, spec2_3_unused_op,`
			`msub_op, msubu_op, /* more unused ops */`
			`+ loongson_madd_op = 0x18, loongson_msub_op,`
			`+ loongson_nmadd_op, loongson_nmsub_op,`
			`clz_op = 0x20, clo_op,`
			`dclz_op = 0x24, dclo_op,`
			`sdbpp_op = 0x3f`
			`@@ -133,7 +135,7 @@ enum cop0_com_func {`
			`*/`
			`enum cop1_fmt {`
			`s_fmt, d_fmt, e_fmt, q_fmt,`
			`- w_fmt, l_fmt`
			`+ w_fmt, l_fmt, ps_fmt`
			`};`

			`/*`
			`diff --git a/arch/mips/math-emu/cp1emu.c b/arch/mips/math-emu/cp1emu.c`
			`index fefcba2..166b2a4 100644`
			`--- a/arch/mips/math-emu/cp1emu.c`
			`+++ b/arch/mips/math-emu/cp1emu.c`
			`@@ -7,6 +7,9 @@`
			`* Kevin D. Kissell, kevink@mips.com and Carsten Langgaard, carstenl@mips.com`
			`* Copyright (C) 2000 MIPS Technologies, Inc.`
			`*`
			`+ * Loongson instruction support`
			`+ * Copyright (C) 2011 Mark H Weaver <mhw@netris.org>`
			`+ *`
			`* This program is free software; you can distribute it and/or modify it`
			`* under the terms of the GNU General Public License (Version 2) as`
			`* published by the Free Software Foundation.`
			`@@ -57,6 +60,14 @@`
			`#endif`
			`#define __mips 4`

			`+#ifdef __loongson_fp`
			`+#undef __loongson_fp`
			`+#endif`
			`+#if __mips >= 4 && __mips != 32`
			`+/* Include support for Loongson floating point instructions */`
			`+#define __loongson_fp 1`
			`+#endif`
			`+`
			`/* Function which emulates a floating point instruction. */`

			`static int fpu_emu(struct pt_regs , struct mips_fpu_struct ,`
			`@@ -66,6 +77,10 @@ static int fpu_emu(struct pt_regs , struct mips_fpu_struct ,`
			`static int fpux_emu(struct pt_regs *,`
			`struct mips_fpu_struct , mips_instruction, void __user *);`
			`#endif`
			`+#ifdef __loongson_fp`
			`+static int loongson_spec2_emu(struct pt_regs *,`
			`+ struct mips_fpu_struct , mips_instruction, void __user *);`
			`+#endif`

			`/* Further private data for which no space exists in mips_fpu_struct */`

			`@@ -203,6 +218,14 @@ static inline int cop1_64bit(struct pt_regs *xcp)`
			`#define DPFROMREG(dp, x) DIFROMREG((dp).bits, x)`
			`#define DPTOREG(dp, x) DITOREG((dp).bits, x)`

			`+/* Support for Loongson paired single floating-point format */`
			`+#define PSIFROMREG(si1, si2, x) ({ u64 di; DIFROMREG(di, x); \`
			`+ (si1) = (u32)di; (si2) = (u32)(di >> 32); })`
			`+#define PSITOREG(si1, si2, x) DITOREG((si1) \| ((u64)(si2) << 32), x)`
			`+`
			`+#define PSPFROMREG(sp1, sp2, x) PSIFROMREG((sp1).bits, (sp2).bits, x)`
			`+#define PSPTOREG(sp1, sp2, x) PSITOREG((sp1).bits, (sp2).bits, x)`
			`+`
			`/*`
			`* Emulate the single floating point instruction pointed at by EPC.`
			`* Two instructions if the instruction is in a branch delay slot.`
			`@@ -568,6 +591,15 @@ static int cop1Emulate(struct pt_regs xcp, struct mips_fpu_struct ctx,`
			`break;`
			`#endif`

			`+#ifdef __loongson_fp`
			`+ case spec2_op:{`
			`+ int sig = loongson_spec2_emu(xcp, ctx, ir, fault_addr);`
			`+ if (sig)`
			`+ return sig;`
			`+ break;`
			`+ }`
			`+#endif`
			`+`
			`default:`
			`return SIGILL;`
			`}`
			`@@ -646,6 +678,172 @@ DEF3OP(msub, dp, ieee754dp_mul, ieee754dp_sub, );`
			`DEF3OP(nmadd, dp, ieee754dp_mul, ieee754dp_add, ieee754dp_neg);`
			`DEF3OP(nmsub, dp, ieee754dp_mul, ieee754dp_sub, ieee754dp_neg);`

			`+#ifdef __loongson_fp`
			`+static int loongson_spec2_emu(struct pt_regs xcp, struct mips_fpu_struct ctx,`
			`+ mips_instruction ir, void __user fault_addr)`
			`+{`
			`+ int rfmt; /* resulting format */`
			`+ unsigned rcsr = 0; /* resulting csr */`
			`+ union {`
			`+ ieee754dp d;`
			`+ struct {`
			`+ ieee754sp s;`
			`+ ieee754sp s2;`
			`+ };`
			`+ } rv; /* resulting value */`
			`+`
			`+ /* XXX maybe add a counter for loongson spec2 fp instructions? */`
			`+ /* MIPS_FPU_EMU_INC_STATS(cp1xops); */`
			`+`
			`+ switch (rfmt = (MIPSInst_FFMT(ir) & 0xf)) {`
			`+ case s_fmt:{`
			`+ ieee754sp(*handler) (ieee754sp, ieee754sp, ieee754sp);`
			`+ ieee754sp fd, fs, ft;`
			`+`
			`+ switch (MIPSInst_FUNC(ir)) {`
			`+ case loongson_madd_op:`
			`+ handler = fpemu_sp_madd;`
			`+ goto scoptop;`
			`+ case loongson_msub_op:`
			`+ handler = fpemu_sp_msub;`
			`+ goto scoptop;`
			`+ case loongson_nmadd_op:`
			`+ handler = fpemu_sp_nmadd;`
			`+ goto scoptop;`
			`+ case loongson_nmsub_op:`
			`+ handler = fpemu_sp_nmsub;`
			`+ goto scoptop;`
			`+`
			`+ scoptop:`
			`+ SPFROMREG(fd, MIPSInst_FD(ir));`
			`+ SPFROMREG(fs, MIPSInst_FS(ir));`
			`+ SPFROMREG(ft, MIPSInst_FT(ir));`
			`+ rv.s = (*handler) (fd, fs, ft);`
			`+`
			`+ copcsr:`
			`+ if (ieee754_cxtest(IEEE754_INEXACT))`
			`+ rcsr \|= FPU_CSR_INE_X \| FPU_CSR_INE_S;`
			`+ if (ieee754_cxtest(IEEE754_UNDERFLOW))`
			`+ rcsr \|= FPU_CSR_UDF_X \| FPU_CSR_UDF_S;`
			`+ if (ieee754_cxtest(IEEE754_OVERFLOW))`
			`+ rcsr \|= FPU_CSR_OVF_X \| FPU_CSR_OVF_S;`
			`+ if (ieee754_cxtest(IEEE754_INVALID_OPERATION))`
			`+ rcsr \|= FPU_CSR_INV_X \| FPU_CSR_INV_S;`
			`+`
			`+ break;`
			`+`
			`+ default:`
			`+ return SIGILL;`
			`+ }`
			`+ break;`
			`+ }`
			`+`
			`+ case d_fmt:{`
			`+ ieee754dp(*handler) (ieee754dp, ieee754dp, ieee754dp);`
			`+ ieee754dp fd, fs, ft;`
			`+`
			`+ switch (MIPSInst_FUNC(ir)) {`
			`+ case loongson_madd_op:`
			`+ handler = fpemu_dp_madd;`
			`+ goto dcoptop;`
			`+ case loongson_msub_op:`
			`+ handler = fpemu_dp_msub;`
			`+ goto dcoptop;`
			`+ case loongson_nmadd_op:`
			`+ handler = fpemu_dp_nmadd;`
			`+ goto dcoptop;`
			`+ case loongson_nmsub_op:`
			`+ handler = fpemu_dp_nmsub;`
			`+ goto dcoptop;`
			`+`
			`+ dcoptop:`
			`+ DPFROMREG(fd, MIPSInst_FD(ir));`
			`+ DPFROMREG(fs, MIPSInst_FS(ir));`
			`+ DPFROMREG(ft, MIPSInst_FT(ir));`
			`+ rv.d = (*handler) (fd, fs, ft);`
			`+ goto copcsr;`
			`+`
			`+ default:`
			`+ return SIGILL;`
			`+ }`
			`+ break;`
			`+ }`
			`+`
			`+ case ps_fmt:{`
			`+ ieee754sp(*handler) (ieee754sp, ieee754sp, ieee754sp);`
			`+ struct _ieee754_csr ieee754_csr_save;`
			`+ ieee754sp fd1, fs1, ft1;`
			`+ ieee754sp fd2, fs2, ft2;`
			`+`
			`+ switch (MIPSInst_FUNC(ir)) {`
			`+ case loongson_madd_op:`
			`+ handler = fpemu_sp_madd;`
			`+ goto pscoptop;`
			`+ case loongson_msub_op:`
			`+ handler = fpemu_sp_msub;`
			`+ goto pscoptop;`
			`+ case loongson_nmadd_op:`
			`+ handler = fpemu_sp_nmadd;`
			`+ goto pscoptop;`
			`+ case loongson_nmsub_op:`
			`+ handler = fpemu_sp_nmsub;`
			`+ goto pscoptop;`
			`+`
			`+ pscoptop:`
			`+ PSPFROMREG(fd1, fd2, MIPSInst_FD(ir));`
			`+ PSPFROMREG(fs1, fs2, MIPSInst_FS(ir));`
			`+ PSPFROMREG(ft1, ft2, MIPSInst_FT(ir));`
			`+ rv.s = (*handler) (fd1, fs1, ft1);`
			`+ ieee754_csr_save = ieee754_csr;`
			`+ rv.s2 = (*handler) (fd2, fs2, ft2);`
			`+ ieee754_csr.cx \|= ieee754_csr_save.cx;`
			`+ ieee754_csr.sx \|= ieee754_csr_save.sx;`
			`+ goto copcsr;`
			`+`
			`+ default:`
			`+ return SIGILL;`
			`+ }`
			`+ break;`
			`+ }`
			`+`
			`+ default:`
			`+ return SIGILL;`
			`+ }`
			`+`
			`+ /*`
			`+ * Update the fpu CSR register for this operation.`
			`+ * If an exception is required, generate a tidy SIGFPE exception,`
			`+ * without updating the result register.`
			`+ * Note: cause exception bits do not accumulate, they are rewritten`
			`+ * for each op; only the flag/sticky bits accumulate.`
			`+ */`
			`+ ctx->fcr31 = (ctx->fcr31 & ~FPU_CSR_ALL_X) \| rcsr;`
			`+ if ((ctx->fcr31 >> 5) & ctx->fcr31 & FPU_CSR_ALL_E) {`
			`+ /printk ("SIGFPE: fpu csr = %08x\n",ctx->fcr31); /`
			`+ return SIGFPE;`
			`+ }`
			`+`
			`+ /*`
			`+ * Now we can safely write the result back to the register file.`
			`+ */`
			`+ switch (rfmt) {`
			`+ case d_fmt:`
			`+ DPTOREG(rv.d, MIPSInst_FD(ir));`
			`+ break;`
			`+ case s_fmt:`
			`+ SPTOREG(rv.s, MIPSInst_FD(ir));`
			`+ break;`
			`+ case ps_fmt:`
			`+ PSPTOREG(rv.s, rv.s2, MIPSInst_FD(ir));`
			`+ break;`
			`+ default:`
			`+ return SIGILL;`
			`+ }`
			`+`
			`+ return 0;`
			`+}`
			`+#endif`
			`+`
			`static int fpux_emu(struct pt_regs xcp, struct mips_fpu_struct ctx,`
			`mips_instruction ir, void __user fault_addr)`
			`{`
			`@@ -840,7 +1038,12 @@ static int fpu_emu(struct pt_regs xcp, struct mips_fpu_struct ctx,`
			`unsigned cond;`
			`union {`
			`ieee754dp d;`
			`- ieee754sp s;`
			`+ struct {`
			`+ ieee754sp s;`
			`+#ifdef __loongson_fp`
			`+ ieee754sp s2; /* for Loongson paired singles */`
			`+#endif`
			`+ };`
			`int w;`
			`#ifdef __mips64`
			`s64 l;`
			`@@ -1210,6 +1413,83 @@ static int fpu_emu(struct pt_regs xcp, struct mips_fpu_struct ctx,`
			`break;`
			`}`

			`+#ifdef __loongson_fp`
			`+ case ps_fmt:{ /* 6 */`
			`+ /* Support for Loongson paired single fp instructions */`
			`+ union {`
			`+ ieee754sp(*b) (ieee754sp, ieee754sp);`
			`+ ieee754sp(*u) (ieee754sp);`
			`+ } handler;`
			`+`
			`+ switch (MIPSInst_FUNC(ir)) {`
			`+ /* binary ops */`
			`+ case fadd_op:`
			`+ handler.b = ieee754sp_add;`
			`+ goto pscopbop;`
			`+ case fsub_op:`
			`+ handler.b = ieee754sp_sub;`
			`+ goto pscopbop;`
			`+ case fmul_op:`
			`+ handler.b = ieee754sp_mul;`
			`+ goto pscopbop;`
			`+`
			`+ /* unary ops */`
			`+ case fabs_op:`
			`+ handler.u = ieee754sp_abs;`
			`+ goto pscopuop;`
			`+ case fneg_op:`
			`+ handler.u = ieee754sp_neg;`
			`+ goto pscopuop;`
			`+ case fmov_op:`
			`+ /* an easy one */`
			`+ PSPFROMREG(rv.s, rv.s2, MIPSInst_FS(ir));`
			`+ break;`
			`+`
			`+ pscopbop: /* paired binary op handler */`
			`+ {`
			`+ struct _ieee754_csr ieee754_csr_save;`
			`+ ieee754sp fs1, ft1;`
			`+ ieee754sp fs2, ft2;`
			`+`
			`+ PSPFROMREG(fs1, fs2, MIPSInst_FS(ir));`
			`+ PSPFROMREG(ft1, ft2, MIPSInst_FT(ir));`
			`+ rv.s = (*handler.b) (fs1, ft1);`
			`+ ieee754_csr_save = ieee754_csr;`
			`+ rv.s2 = (*handler.b) (fs2, ft2);`
			`+ ieee754_csr.cx \|= ieee754_csr_save.cx;`
			`+ ieee754_csr.sx \|= ieee754_csr_save.sx;`
			`+ goto copcsr;`
			`+ }`
			`+ pscopuop: /* paired unary op handler */`
			`+ {`
			`+ struct _ieee754_csr ieee754_csr_save;`
			`+ ieee754sp fs1;`
			`+ ieee754sp fs2;`
			`+`
			`+ PSPFROMREG(fs1, fs2, MIPSInst_FS(ir));`
			`+ rv.s = (*handler.u) (fs1);`
			`+ ieee754_csr_save = ieee754_csr;`
			`+ rv.s2 = (*handler.u) (fs2);`
			`+ ieee754_csr.cx \|= ieee754_csr_save.cx;`
			`+ ieee754_csr.sx \|= ieee754_csr_save.sx;`
			`+ goto copcsr;`
			`+ }`
			`+ break;`
			`+`
			`+ default:`
			`+ if (MIPSInst_FUNC(ir) >= fcmp_op) {`
			`+ /* Loongson fp hardware handles all`
			`+ cases of fp compare insns, so we`
			`+ shouldn't have to */`
			`+ printk ("Loongson paired-single fp compare"`
			`+ " unimplemented in cp1emu.c\n");`
			`+ }`
			`+ return SIGILL;`
			`+ }`
			`+ break;`
			`+ }`
			`+#endif`
			`+`
			`case w_fmt:{`
			`ieee754sp fs;`

			`@@ -1299,6 +1579,11 @@ static int fpu_emu(struct pt_regs xcp, struct mips_fpu_struct ctx,`
			`DITOREG(rv.l, MIPSInst_FD(ir));`
			`break;`
			`#endif`
			`+#ifdef __loongson_fp`
			`+ case ps_fmt:`
			`+ PSPTOREG(rv.s, rv.s2, MIPSInst_FD(ir));`
			`+ break;`
			`+#endif`
			`default:`
			`return SIGILL;`
			`}`
			`--`
			`1.7.5.4`