From c35fad0f2bc16fffe25dfe3b86f0df508d6d0b87 Mon Sep 17 00:00:00 2001
From: Dino Li <Dino.Li@ite.com.tw>
Date: Fri, 26 May 2017 10:11:25 +0800
Subject: chip: it83xx: add support for floating point unit

Because the N8 CPU doesn't have a floating point unit,
we implemented an extra floating point engine
(single-precision addition, subtraction, multiplication,
and division) in the it8320 to improve the performance of
floating point operations.

To keep the CPU's instructions compatible, we use a register (DLMB)
to switch the mode of the ALU (Arithmetic Logic Unit). For example:
the instruction 'ADD45' adds the contents of two registers and then
writes the result to the source register.
But if we switch the ALU to floating point operation mode,
this instruction does a floating-point addition instead.

For the other floating point operations that we don't support so far,
we still have to use the soft float library routines of nds32.

Signed-off-by: Dino Li <dino.li@ite.com.tw>

BRANCH=none
BUG=none
TEST=add the following console command and test different
scenarios by changing the variables a and b.

/* Scale a float by 1000 and truncate to int so it can be printed with %d. */
#define PRINTF_FLOAT(x)  ((int)((x) * 1000.0f))
/*
 * Console command "fpu": performs one single-precision add, subtract,
 * multiply and divide on a and b and prints each result (times 1000).
 * Each printed label is the name of the routine this patch provides for
 * that operator. argc/argv are unused. Always returns EC_SUCCESS.
 */
static int it83xx_fpu_test(int argc, char **argv)
{
	/*
	 * NOTE(review): volatile presumably keeps the compiler from folding
	 * the arithmetic at build time, so the runtime routines are really
	 * exercised -- confirm.
	 */
	volatile float a = 1.23f;
	volatile float b = 4.56f;
	volatile float c;

	c = a + b;
	ccprintf("__addsf3: (%d)\n", PRINTF_FLOAT(c));
	c = a - b;
	ccprintf("__subsf3: (%d)\n", PRINTF_FLOAT(c));
	c = a * b;
	ccprintf("__mulsf3: (%d)\n", PRINTF_FLOAT(c));
	c = a / b;
	ccprintf("__divsf3: (%d)\n", PRINTF_FLOAT(c));

	return EC_SUCCESS;
}
/* Register the test as console command "fpu" (empty argument/help text). */
DECLARE_CONSOLE_COMMAND(fpu, it83xx_fpu_test, "", "");

Change-Id: I4fc1c08d8c2376156bec9f098491187675c4a88f
Reviewed-on: https://chromium-review.googlesource.com/427640
Commit-Ready: Dino Li <Dino.Li@ite.com.tw>
Tested-by: Dino Li <Dino.Li@ite.com.tw>
Reviewed-by: Vincent Palatin <vpalatin@chromium.org>
---
 chip/it83xx/build.mk     |  1 +
 chip/it83xx/it83xx_fpu.S | 81 ++++++++++++++++++++++++++++++++++++++++++++++++
 2 files changed, 82 insertions(+)
 create mode 100644 chip/it83xx/it83xx_fpu.S

(limited to 'chip/it83xx')

diff --git a/chip/it83xx/build.mk b/chip/it83xx/build.mk
index 47820aba34..97f41ce287 100644
--- a/chip/it83xx/build.mk
+++ b/chip/it83xx/build.mk
@@ -18,6 +18,7 @@ chip-y=hwtimer.o uart.o gpio.o system.o jtag.o clock.o irq.o intc.o
 chip-$(CONFIG_WATCHDOG)+=watchdog.o
 chip-$(CONFIG_FANS)+=fan.o pwm.o
 chip-$(CONFIG_FLASH_PHYSICAL)+=flash.o
+chip-$(CONFIG_FPU)+=it83xx_fpu.o
 chip-$(CONFIG_PWM)+=pwm.o
 chip-$(CONFIG_ADC)+=adc.o
 chip-$(CONFIG_EC2I)+=ec2i.o
diff --git a/chip/it83xx/it83xx_fpu.S b/chip/it83xx/it83xx_fpu.S
new file mode 100644
index 0000000000..d98ba0fa67
--- /dev/null
+++ b/chip/it83xx/it83xx_fpu.S
@@ -0,0 +1,81 @@
+/* Copyright 2017 The Chromium OS Authors. All rights reserved.
+ * Use of this source code is governed by a BSD-style license that can be
+ * found in the LICENSE file.
+ */
+
+/*
+ * DLMB register = 0x80189:
+ * Disable all interrupts and switch the CPU's
+ * ALU (Arithmetic Logic Unit) to floating point operation mode
+ * (IEEE standard 754 floating point).
+ *
+ * DLMB register = 0x80009:
+ * Restore interrupts and ALU.
+ */
+	.text
+	.align	2
+	.global	__addsf3
+	.type	__addsf3, @function
+__addsf3:	/* single-precision add: r0 = r0 + r1; uses r2/r3 as scratch */
+	sethi  $r2, 0x80        /* r2 = 0x80000 */
+	addi   $r3, $r2, 0x189  /* r3 = 0x80189 (interrupts off, FP mode) */
+	addi45 $r2, 0x9         /* r2 = 0x80009 (restore value) */
+	mtsr   $r3, $dlmb       /* dlmb = 0x80189 */
+	dsb                     /* data serialization barrier after mtsr */
+	/* Floating-point addition single-precision (ALU is in FP mode here) */
+	add45  $r0, $r1
+	mtsr   $r2, $dlmb       /* dlmb = 0x80009 */
+	dsb                     /* data serialization barrier after mtsr */
+	ret5   $lp              /* return to caller, result in r0 */
+	.size	__addsf3, .-__addsf3
+
+	.text
+	.align	2
+	.global	__subsf3
+	.type	__subsf3, @function
+__subsf3:	/* single-precision subtract: r0 = r0 - r1; uses r2/r3 as scratch */
+	sethi  $r2, 0x80        /* r2 = 0x80000 */
+	addi   $r3, $r2, 0x189  /* r3 = 0x80189 (interrupts off, FP mode) */
+	addi45 $r2, 0x9         /* r2 = 0x80009 (restore value) */
+	mtsr   $r3, $dlmb       /* dlmb = 0x80189 */
+	dsb                     /* data serialization barrier after mtsr */
+	/* Floating-point subtraction single-precision (ALU is in FP mode here) */
+	sub45  $r0, $r1
+	mtsr   $r2, $dlmb       /* dlmb = 0x80009 */
+	dsb                     /* data serialization barrier after mtsr */
+	ret5   $lp              /* return to caller, result in r0 */
+	.size	__subsf3, .-__subsf3
+
+	.text
+	.align	2
+	.global	__mulsf3
+	.type	__mulsf3, @function
+__mulsf3:	/* single-precision multiply: r0 = r0 * r1; uses r2/r3 as scratch */
+	sethi  $r2, 0x80        /* r2 = 0x80000 */
+	addi   $r3, $r2, 0x189  /* r3 = 0x80189 (interrupts off, FP mode) */
+	addi45 $r2, 0x9         /* r2 = 0x80009 (restore value) */
+	mtsr   $r3, $dlmb       /* dlmb = 0x80189 */
+	dsb                     /* data serialization barrier after mtsr */
+	/* Floating-point multiplication single-precision (ALU is in FP mode here) */
+	mul33  $r0, $r1
+	mtsr   $r2, $dlmb       /* dlmb = 0x80009 */
+	dsb                     /* data serialization barrier after mtsr */
+	ret5   $lp              /* return to caller, result in r0 */
+	.size	__mulsf3, .-__mulsf3
+
+	.text
+	.align	2
+	.global	__divsf3
+	.type	__divsf3, @function
+__divsf3:	/* single-precision divide: r0 = r0 / r1; uses r2/r3 as scratch */
+	sethi  $r2, 0x80        /* r2 = 0x80000 */
+	addi   $r3, $r2, 0x189  /* r3 = 0x80189 (interrupts off, FP mode) */
+	addi45 $r2, 0x9         /* r2 = 0x80009 (restore value) */
+	mtsr   $r3, $dlmb       /* dlmb = 0x80189 */
+	dsb                     /* data serialization barrier after mtsr */
+	/* Floating-point division single-precision (ALU is in FP mode here) */
+	divsr  $r0,$r0,$r0,$r1  /* NOTE(review): first two operands both r0 -- confirm FP-mode result lands in r0 */
+	mtsr   $r2, $dlmb       /* dlmb = 0x80009 */
+	dsb                     /* data serialization barrier after mtsr */
+	ret5   $lp              /* return to caller, result in r0 */
+	.size	__divsf3, .-__divsf3
-- 
cgit v1.2.1