Module Name: src
Committed By: matt
Date: Mon Dec 10 04:58:54 UTC 2012
Modified Files:
src/sys/arch/arm/conf: files.arm
Added Files:
src/sys/arch/arm/vfp: pmap_vfp.S
Log Message:
Add code to use VFP (or NEON) instructions to zero or copy a page via
pmap_zero_page and pmap_copy_page (not hooked into vfp_init yet).
Requires FPU_VFP.
To generate a diff of this commit:
cvs rdiff -u -r1.113 -r1.114 src/sys/arch/arm/conf/files.arm
cvs rdiff -u -r0 -r1.1 src/sys/arch/arm/vfp/pmap_vfp.S
Please note that diffs are not public domain; they are subject to the
copyright notices on the relevant files.
Modified files:
Index: src/sys/arch/arm/conf/files.arm
diff -u src/sys/arch/arm/conf/files.arm:1.113 src/sys/arch/arm/conf/files.arm:1.114
--- src/sys/arch/arm/conf/files.arm:1.113 Wed Dec 5 19:05:47 2012
+++ src/sys/arch/arm/conf/files.arm Mon Dec 10 04:58:54 2012
@@ -1,4 +1,4 @@
-# $NetBSD: files.arm,v 1.113 2012/12/05 19:05:47 matt Exp $
+# $NetBSD: files.arm,v 1.114 2012/12/10 04:58:54 matt Exp $
# temporary define to allow easy moving to ../arch/arm/arm32
defflag ARM32
@@ -52,6 +52,7 @@ obsolete defflag ARMFPE
# VFP support
file arch/arm/vfp/vfp_init.c arm32
+file arch/arm/vfp/pmap_vfp.S arm32 & fpu_vfp
# PMAP_DEBUG (heavily abused option)
defflag PMAP_DEBUG
Added files:
Index: src/sys/arch/arm/vfp/pmap_vfp.S
diff -u /dev/null src/sys/arch/arm/vfp/pmap_vfp.S:1.1
--- /dev/null Mon Dec 10 04:58:54 2012
+++ src/sys/arch/arm/vfp/pmap_vfp.S Mon Dec 10 04:58:54 2012
@@ -0,0 +1,101 @@
+/*-
+ * Copyright (c) 2012 The NetBSD Foundation, Inc.
+ * All rights reserved.
+ *
+ * This code is derived from software contributed to The NetBSD Foundation
+ * by Matt Thomas of 3am Software Foundry.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
+ * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
+ * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
+ * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
+ * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+ * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+ * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
+ * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
+ * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
+ * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
+ * POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include "opt_cputypes.h"
+
+#include <machine/asm.h>
+#include "assym.h"
+
+/*
+ * pmap_zero_page_vfp: zero one page with VFP/NEON register stores.
+ *
+ * In:	r0 = address of the page to zero.
+ *	     NOTE(review): assumed mapped and page-aligned -- confirm
+ *	     against the caller.
+ * Out:	nothing.  r0 is left pointing just past the page.
+ * Clobbers: r0, r2, r3, flags (and ip when CPU_CORTEX == 0).
+ *	     d0-d7 and FPEXC are saved on entry and restored on exit.
+ *
+ * Each vstmia stores 64 bytes and the loop is unrolled four times, so
+ * 256 bytes are written per iteration.  64 is chosen over 32 since
+ * 64 is the cache line size of the Cortex-A8.
+ */
+ENTRY(pmap_zero_page_vfp)
+	mrc	p10, 7, r3, c8, c0, 0	@ r3 = caller's FPEXC (vmrs r3, fpexc)
+	orr	r2, r3, #VFP_FPEXC_EN
+	mcr	p10, 7, r2, c8, c0, 0	@ make sure the VFP is enabled
+	vpush	{d0-d7}			@ preserve the registers we overwrite
+#if (CPU_CORTEX == 0)
+	/* VFP only: build a zero in d0 from a core register, then fan out. */
+	mov	ip, #0
+	vmov	s0, ip
+	vmov	s1, ip
+	vmov.f64 d1, d0
+	vmov.f64 d2, d0
+	vmov.f64 d3, d0
+	vmov.f64 d4, d0
+	vmov.f64 d5, d0
+	vmov.f64 d6, d0
+	vmov.f64 d7, d0
+#else
+	/* q0-q3 alias d0-d7; x ^ x == 0 regardless of the old contents. */
+	veor	q0, q0, q0
+	veor	q1, q1, q1
+	veor	q2, q2, q2
+	veor	q3, q3, q3
+#endif
+	add	r2, r0, #PAGE_SIZE	@ r2 = end of page (may wrap to 0)
+1:	vstmia	r0!, {d0-d7}		@ 4 x 64 = 256 bytes per pass
+	vstmia	r0!, {d0-d7}
+	vstmia	r0!, {d0-d7}
+	vstmia	r0!, {d0-d7}
+	cmp	r0, r2
+	/*
+	 * Test for equality, not signed less-than: addresses are unsigned,
+	 * and a signed compare stops early when the page ends at
+	 * 0x80000000.  r0 advances by 256 and r2 = start + PAGE_SIZE, so
+	 * (assuming PAGE_SIZE is a multiple of 256) r0 hits r2 exactly.
+	 */
+	bne	1b
+	vpop	{d0-d7}			@ restore the saved registers
+	mcr	p10, 7, r3, c8, c0, 0	@ restore caller's FPEXC
+	bx	lr
+END(pmap_zero_page_vfp)
+
+/*
+ * pmap_copy_page_vfp: copy one page with VFP register loads/stores.
+ *
+ * In:	r0 = source page address, r1 = destination page address.
+ *	     NOTE(review): both assumed mapped and page-aligned -- confirm
+ *	     against the caller.
+ * Out:	nothing.  r0 and r1 are left pointing just past their pages.
+ * Clobbers: r0, r1, r2, r3, ip, flags.
+ *	     d0-d7 and FPEXC are saved on entry and restored on exit.
+ *
+ * Data moves through d0-d7 64 bytes at a time, two moves (128 bytes)
+ * per loop pass.  64 is chosen over 32 since 64 is the cache line size
+ * of the Cortex-A8.  While one 128-byte chunk is copied the next one
+ * is preloaded; the final chunk is copied without preloading so that
+ * no pld is issued for addresses beyond the source page.
+ */
+ENTRY(pmap_copy_page_vfp)
+	pld	[r0]			@ preload the first 128 bytes
+	pld	[r0, #32]
+	pld	[r0, #64]
+	pld	[r0, #96]
+	mrc	p10, 7, r3, c8, c0, 0	@ r3 = caller's FPEXC (vmrs r3, fpexc)
+	orr	r2, r3, #VFP_FPEXC_EN
+	mcr	p10, 7, r2, c8, c0, 0	@ make sure the VFP is enabled
+	vpush	{d0-d7}			@ preserve the registers we overwrite
+	/*
+	 * ip = number of 128-byte chunks that have a following chunk to
+	 * preload.  A counter is used instead of a signed address compare,
+	 * which misbehaves when the page ends at 0x80000000 (and an
+	 * unsigned one would misbehave for the topmost page).
+	 * Assumes PAGE_SIZE is a multiple of 128.
+	 */
+	mov	ip, #PAGE_SIZE/128-1
+1:	pld	[r0, #128]		@ preload the next 128
+	pld	[r0, #160]
+	pld	[r0, #192]
+	pld	[r0, #224]
+2:	vldmia	r0!, {d0-d7}		@ read 0-63
+	vstmia	r1!, {d0-d7}		@ write 0-63
+	vldmia	r0!, {d0-d7}		@ read 64-127
+	vstmia	r1!, {d0-d7}		@ write 64-127
+	subs	ip, ip, #1
+	bgt	1b			@ >0: chunks with a successor remain
+	beq	2b			@ =0: last chunk, skip the preload
+					@ <0: whole page copied
+	vpop	{d0-d7}			@ restore the saved registers
+	mcr	p10, 7, r3, c8, c0, 0	@ restore caller's FPEXC
+	bx	lr
+END(pmap_copy_page_vfp)