|
@@ -0,0 +1,95 @@
|
|
|
|
+/* NGpage.S: Niagara optimize clear and copy page.
|
|
|
|
+ *
|
|
|
|
+ * Copyright (C) 2006 (davem@davemloft.net)
|
|
|
|
+ */
|
|
|
|
+
|
|
|
|
+#include <asm/asi.h>
|
|
|
|
+#include <asm/page.h>
|
|
|
|
+
|
|
|
|
+ .text
|
|
|
|
+ .align 32
|
|
|
|
+
|
|
|
|
+ /* This is heavily simplified from the sun4u variants
|
|
|
|
+ * because Niagara does not have any D-cache aliasing issues
|
|
|
|
+ * and also we don't need to use the FPU in order to implement
|
|
|
|
+ * an optimal page copy/clear.
|
|
|
|
+ */
|
|
|
|
+
|
|
|
|
+NGcopy_user_page: /* %o0=dest, %o1=src, %o2=vaddr */
|
|
|
|
+ prefetch [%o1 + 0x00], #one_read
|
|
|
|
+ mov 8, %g1
|
|
|
|
+ mov 16, %g2
|
|
|
|
+ mov 24, %g3
|
|
|
|
+ set PAGE_SIZE, %g7
|
|
|
|
+
|
|
|
|
+1: ldda [%o1 + %g0] ASI_BLK_INIT_QUAD_LDD_P, %o2
|
|
|
|
+ ldda [%o1 + %g2] ASI_BLK_INIT_QUAD_LDD_P, %o4
|
|
|
|
+ prefetch [%o1 + 0x40], #one_read
|
|
|
|
+ add %o1, 32, %o1
|
|
|
|
+ stxa %o2, [%o0 + %g0] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ stxa %o3, [%o0 + %g1] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ ldda [%o1 + %g0] ASI_BLK_INIT_QUAD_LDD_P, %o2
|
|
|
|
+ stxa %o4, [%o0 + %g2] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ stxa %o5, [%o0 + %g3] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ ldda [%o1 + %g2] ASI_BLK_INIT_QUAD_LDD_P, %o4
|
|
|
|
+ add %o1, 32, %o1
|
|
|
|
+ add %o0, 32, %o0
|
|
|
|
+ stxa %o2, [%o0 + %g0] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ stxa %o3, [%o0 + %g1] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ stxa %o4, [%o0 + %g2] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ stxa %o5, [%o0 + %g3] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ subcc %g7, 64, %g7
|
|
|
|
+ bne,pt %xcc, 1b
|
|
|
|
+ add %o0, 32, %o0
|
|
|
|
+ retl
|
|
|
|
+ nop
|
|
|
|
+
|
|
|
|
+NGclear_page: /* %o0=dest */
|
|
|
|
+NGclear_user_page: /* %o0=dest, %o1=vaddr */
|
|
|
|
+ mov 8, %g1
|
|
|
|
+ mov 16, %g2
|
|
|
|
+ mov 24, %g3
|
|
|
|
+ set PAGE_SIZE, %g7
|
|
|
|
+
|
|
|
|
+1: stxa %g0, [%o0 + %g0] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ stxa %g0, [%o0 + %g1] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ stxa %g0, [%o0 + %g2] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ stxa %g0, [%o0 + %g3] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ add %o0, 32, %o0
|
|
|
|
+ stxa %g0, [%o0 + %g0] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ stxa %g0, [%o0 + %g1] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ stxa %g0, [%o0 + %g2] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ stxa %g0, [%o0 + %g3] ASI_BLK_INIT_QUAD_LDD_P
|
|
|
|
+ subcc %g7, 64, %g7
|
|
|
|
+ bne,pt %xcc, 1b
|
|
|
|
+ add %o0, 32, %o0
|
|
|
|
+ retl
|
|
|
|
+ nop
|
|
|
|
+
|
|
|
|
+#define BRANCH_ALWAYS 0x10680000
|
|
|
|
+#define NOP 0x01000000
|
|
|
|
+#define NG_DO_PATCH(OLD, NEW) \
|
|
|
|
+ sethi %hi(NEW), %g1; \
|
|
|
|
+ or %g1, %lo(NEW), %g1; \
|
|
|
|
+ sethi %hi(OLD), %g2; \
|
|
|
|
+ or %g2, %lo(OLD), %g2; \
|
|
|
|
+ sub %g1, %g2, %g1; \
|
|
|
|
+ sethi %hi(BRANCH_ALWAYS), %g3; \
|
|
|
|
+ srl %g1, 2, %g1; \
|
|
|
|
+ or %g3, %lo(BRANCH_ALWAYS), %g3; \
|
|
|
|
+ or %g3, %g1, %g3; \
|
|
|
|
+ stw %g3, [%g2]; \
|
|
|
|
+ sethi %hi(NOP), %g3; \
|
|
|
|
+ or %g3, %lo(NOP), %g3; \
|
|
|
|
+ stw %g3, [%g2 + 0x4]; \
|
|
|
|
+ flush %g2;
|
|
|
|
+
|
|
|
|
+ .globl niagara_patch_pageops
|
|
|
|
+ .type niagara_patch_pageops,#function
|
|
|
|
+niagara_patch_pageops:
|
|
|
|
+ NG_DO_PATCH(copy_user_page, NGcopy_user_page)
|
|
|
|
+ NG_DO_PATCH(_clear_page, NGclear_page)
|
|
|
|
+ NG_DO_PATCH(clear_user_page, NGclear_user_page)
|
|
|
|
+ retl
|
|
|
|
+ nop
|
|
|
|
+ .size niagara_patch_pageops,.-niagara_patch_pageops
|