-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
sparc64: Add SPARC-T4 optimized memcpy.
                              Before            After
                              --------------    --------------
bw_tcp:                       1288.53 MB/sec    1637.77 MB/sec
bw_pipe:                      1517.18 MB/sec    2107.61 MB/sec
bw_unix:                      1838.38 MB/sec    2640.91 MB/sec
make -s -j128 allmodconfig    5min 49sec        5min 31sec

Signed-off-by: David S. Miller <davem@davemloft.net>
- Loading branch information
David S. Miller
committed
Sep 27, 2012
1 parent
da20116
commit ae2c6ca
Showing
8 changed files
with
546 additions
and
2 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,30 @@ | ||
/* NG4copy_from_user.S: Niagara-4 optimized copy from userspace. | ||
* | ||
* Copyright (C) 2012 David S. Miller (davem@davemloft.net) | ||
*/ | ||
|
||
/* EX_LD(x): emit the instruction x under local label 98, then add an entry
 * to the __ex_table section that pairs the address of that label with
 * __retl_one_asi, and finally switch back to .text.
 * NOTE(review): __retl_one_asi is defined outside this file; presumably it
 * is the fixup reached when x faults -- confirm against its definition.
 */
#define EX_LD(x) \ | ||
98: x; \ | ||
.section __ex_table,"a";\ | ||
.align 4; \ | ||
.word 98b, __retl_one_asi;\ | ||
.text; \ | ||
.align 4; | ||
|
||
/* Fallback value for ASI_AIUS; only takes effect when nothing processed
 * earlier has already defined the symbol.
 */
#ifndef ASI_AIUS | ||
#define ASI_AIUS 0x11 | ||
#endif | ||
|
||
/* Macros defined ahead of the NG4memcpy.S include at the end of this file:
 *   FUNC_NAME    - expands to the symbol name NG4copy_from_user.
 *   LOAD         - pastes an 'a' suffix onto the load mnemonic 'type' and
 *                  addresses [addr] through the %asi register.
 *   EX_RETVAL(x) - ignores x and expands to the constant 0.
 * NOTE(review): how NG4memcpy.S consumes these is not visible here.
 */
#define FUNC_NAME NG4copy_from_user | ||
#define LOAD(type,addr,dest) type##a [addr] %asi, dest | ||
#define EX_RETVAL(x) 0 | ||
|
||
/* PREAMBLE (only defined when __KERNEL__ is set): read %asi into %g1 and
 * branch to ___copy_in_user when it is not ASI_AIUS; the trailing nop
 * fills the branch delay slot.  Clobbers %g1 and the integer condition
 * codes.
 * NOTE(review): ___copy_in_user is defined elsewhere and where PREAMBLE is
 * expanded is decided by the included NG4memcpy.S -- confirm there.
 */
#ifdef __KERNEL__ | ||
#define PREAMBLE \ | ||
rd %asi, %g1; \ | ||
cmp %g1, ASI_AIUS; \ | ||
bne,pn %icc, ___copy_in_user; \ | ||
nop | ||
#endif | ||
|
||
#include "NG4memcpy.S" |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,57 @@ | ||
/* NG4copy_page.S: Niagara-4 optimized copy page. | ||
* | ||
* Copyright (C) 2012 David S. Miller (davem@davemloft.net) | ||
*/ | ||
|
||
#include <asm/asi.h> | ||
#include <asm/page.h> | ||
|
||
/* Place the following code in .text with the alignment requested by
 * .align 32.
 */
.text | ||
.align 32 | ||
|
||
/* Declare %g2 and %g3 as scratch registers to the assembler; the copy
 * loop in this file uses both as temporaries.
 */
.register %g2, #scratch | ||
.register %g3, #scratch | ||
|
||
/*
 * NG4copy_user_page: copy PAGE_SIZE bytes from the source to the
 * destination in 0x40-byte chunks.
 *
 * In:    %o0 = dest, %o1 = src, %o2 = vaddr (never read; %o2 is reused as
 *        a data temporary by the first load of the loop).
 * Out:   nothing is returned in a register by this code.
 * Clobb: %o0-%o5, %g1, %g2, %g3, %g7 and the integer condition codes.
 *
 * The loop only exits when the counter in %g7 reaches exactly zero, so it
 * expects PAGE_SIZE to be a non-zero multiple of 0x40.
 * NOTE(review): ASI_BLK_INIT_QUAD_LDD_P comes from a header outside this
 * file; presumably it selects block-initializing stores -- confirm.
 */
.globl NG4copy_user_page | ||
NG4copy_user_page: /* %o0=dest, %o1=src, %o2=vaddr */ | ||
/* Prime the prefetcher with the first eight 0x40-spaced source addresses;
 * the byte counter setup is interleaved between them.
 */
prefetch [%o1 + 0x000], #n_reads_strong | ||
prefetch [%o1 + 0x040], #n_reads_strong | ||
prefetch [%o1 + 0x080], #n_reads_strong | ||
prefetch [%o1 + 0x0c0], #n_reads_strong | ||
/* %g7 = number of bytes still to copy. */
set PAGE_SIZE, %g7 | ||
prefetch [%o1 + 0x100], #n_reads_strong | ||
prefetch [%o1 + 0x140], #n_reads_strong | ||
prefetch [%o1 + 0x180], #n_reads_strong | ||
prefetch [%o1 + 0x1c0], #n_reads_strong | ||
/* Main loop: each pass loads eight 8-byte words from src and stores them
 * to dest, with the loads and stores interleaved.
 */
1: | ||
ldx [%o1 + 0x00], %o2 | ||
/* Count this 0x40-byte chunk now; the condition codes set here are the
 * ones tested by the bne at the bottom of the loop (nothing in between
 * writes them).
 */
subcc %g7, 0x40, %g7 | ||
ldx [%o1 + 0x08], %o3 | ||
ldx [%o1 + 0x10], %o4 | ||
ldx [%o1 + 0x18], %o5 | ||
ldx [%o1 + 0x20], %g1 | ||
/* Every store goes to [%o0] and is followed by a dest += 8 step. */
stxa %o2, [%o0] ASI_BLK_INIT_QUAD_LDD_P | ||
add %o0, 0x08, %o0 | ||
ldx [%o1 + 0x28], %g2 | ||
stxa %o3, [%o0] ASI_BLK_INIT_QUAD_LDD_P | ||
add %o0, 0x08, %o0 | ||
ldx [%o1 + 0x30], %g3 | ||
stxa %o4, [%o0] ASI_BLK_INIT_QUAD_LDD_P | ||
add %o0, 0x08, %o0 | ||
/* %o2 was already stored above, so it is free to hold the eighth word. */
ldx [%o1 + 0x38], %o2 | ||
/* All eight loads are done: advance src to the next chunk. */
add %o1, 0x40, %o1 | ||
stxa %o5, [%o0] ASI_BLK_INIT_QUAD_LDD_P | ||
add %o0, 0x08, %o0 | ||
stxa %g1, [%o0] ASI_BLK_INIT_QUAD_LDD_P | ||
add %o0, 0x08, %o0 | ||
stxa %g2, [%o0] ASI_BLK_INIT_QUAD_LDD_P | ||
add %o0, 0x08, %o0 | ||
stxa %g3, [%o0] ASI_BLK_INIT_QUAD_LDD_P | ||
add %o0, 0x08, %o0 | ||
stxa %o2, [%o0] ASI_BLK_INIT_QUAD_LDD_P | ||
add %o0, 0x08, %o0 | ||
/* Loop while the counter is non-zero.  The prefetch sits in the branch
 * delay slot and targets 0x200 bytes past the already-advanced src.
 */
bne,pt %icc, 1b | ||
prefetch [%o1 + 0x200], #n_reads_strong | ||
/* Return to the caller; the membar in the delay slot orders the stores
 * above before any later loads and stores.
 */
retl | ||
membar #StoreLoad | #StoreStore | ||
.size NG4copy_user_page,.-NG4copy_user_page |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,39 @@ | ||
/* NG4copy_to_user.S: Niagara-4 optimized copy to userspace. | ||
* | ||
* Copyright (C) 2012 David S. Miller (davem@davemloft.net) | ||
*/ | ||
|
||
/* EX_ST(x): emit the instruction x under local label 98, then add an entry
 * to the __ex_table section that pairs the address of that label with
 * __retl_one_asi, and finally switch back to .text.
 * NOTE(review): __retl_one_asi is defined outside this file; presumably it
 * is the fixup reached when x faults -- confirm against its definition.
 */
#define EX_ST(x) \ | ||
98: x; \ | ||
.section __ex_table,"a";\ | ||
.align 4; \ | ||
.word 98b, __retl_one_asi;\ | ||
.text; \ | ||
.align 4; | ||
|
||
/* Fallback values for the two ASI numbers this file uses; each one only
 * takes effect when nothing processed earlier has already defined it.
 */
#ifndef ASI_AIUS | ||
#define ASI_AIUS 0x11 | ||
#endif | ||
|
||
#ifndef ASI_BLK_INIT_QUAD_LDD_AIUS | ||
#define ASI_BLK_INIT_QUAD_LDD_AIUS 0x23 | ||
#endif | ||
|
||
/* Macros defined ahead of the NG4memcpy.S include at the end of this file:
 *   FUNC_NAME    - expands to the symbol name NG4copy_to_user.
 *   STORE        - pastes an 'a' suffix onto the store mnemonic 'type' and
 *                  addresses [addr] through the %asi register.
 *   STORE_ASI    - expands to ASI_BLK_INIT_QUAD_LDD_AIUS.
 *   EX_RETVAL(x) - ignores x and expands to the constant 0.
 * NOTE(review): how NG4memcpy.S consumes these is not visible here.
 */
#define FUNC_NAME NG4copy_to_user | ||
#define STORE(type,src,addr) type##a src, [addr] %asi | ||
#define STORE_ASI ASI_BLK_INIT_QUAD_LDD_AIUS | ||
#define EX_RETVAL(x) 0 | ||
|
||
#ifdef __KERNEL__ | ||
/* Writing to %asi is _expensive_ so we hardcode it. | ||
* Reading %asi to check for KERNEL_DS is comparatively | ||
* cheap. | ||
*
* PREAMBLE reads %asi into %g1 and branches to ___copy_in_user when it
* is not ASI_AIUS; the trailing nop fills the branch delay slot.
* Clobbers %g1 and the integer condition codes.
* NOTE(review): ___copy_in_user is defined elsewhere and where PREAMBLE
* is expanded is decided by the included NG4memcpy.S -- confirm there.
*/ | ||
#define PREAMBLE \ | ||
rd %asi, %g1; \ | ||
cmp %g1, ASI_AIUS; \ | ||
bne,pn %icc, ___copy_in_user; \ | ||
nop | ||
#endif | ||
|
||
#include "NG4memcpy.S" |
Oops, something went wrong.