/* NGpage.S: Niagara optimized clear and copy page.
 *
 * Copyright (C) 2006 (davem@davemloft.net)
 */
| |
| #include <asm/asi.h> |
| #include <asm/page.h> |
| |
| .text |
| .align 32 |
| |
| /* This is heavily simplified from the sun4u variants |
| * because Niagara does not have any D-cache aliasing issues |
| * and also we don't need to use the FPU in order to implement |
| * an optimal page copy/clear. |
| */ |
| |
| NGcopy_user_page: /* %o0=dest, %o1=src, %o2=vaddr */ |
| prefetch [%o1 + 0x00], #one_read |
| mov 8, %g1 |
| mov 16, %g2 |
| mov 24, %g3 |
| set PAGE_SIZE, %g7 |
| |
| 1: ldda [%o1 + %g0] ASI_BLK_INIT_QUAD_LDD_P, %o2 |
| ldda [%o1 + %g2] ASI_BLK_INIT_QUAD_LDD_P, %o4 |
| prefetch [%o1 + 0x40], #one_read |
| add %o1, 32, %o1 |
| stxa %o2, [%o0 + %g0] ASI_BLK_INIT_QUAD_LDD_P |
| stxa %o3, [%o0 + %g1] ASI_BLK_INIT_QUAD_LDD_P |
| ldda [%o1 + %g0] ASI_BLK_INIT_QUAD_LDD_P, %o2 |
| stxa %o4, [%o0 + %g2] ASI_BLK_INIT_QUAD_LDD_P |
| stxa %o5, [%o0 + %g3] ASI_BLK_INIT_QUAD_LDD_P |
| ldda [%o1 + %g2] ASI_BLK_INIT_QUAD_LDD_P, %o4 |
| add %o1, 32, %o1 |
| add %o0, 32, %o0 |
| stxa %o2, [%o0 + %g0] ASI_BLK_INIT_QUAD_LDD_P |
| stxa %o3, [%o0 + %g1] ASI_BLK_INIT_QUAD_LDD_P |
| stxa %o4, [%o0 + %g2] ASI_BLK_INIT_QUAD_LDD_P |
| stxa %o5, [%o0 + %g3] ASI_BLK_INIT_QUAD_LDD_P |
| subcc %g7, 64, %g7 |
| bne,pt %xcc, 1b |
| add %o0, 32, %o0 |
| membar #Sync |
| retl |
| nop |
| |
| .globl NGclear_page, NGclear_user_page |
| NGclear_page: /* %o0=dest */ |
| NGclear_user_page: /* %o0=dest, %o1=vaddr */ |
| mov 8, %g1 |
| mov 16, %g2 |
| mov 24, %g3 |
| set PAGE_SIZE, %g7 |
| |
| 1: stxa %g0, [%o0 + %g0] ASI_BLK_INIT_QUAD_LDD_P |
| stxa %g0, [%o0 + %g1] ASI_BLK_INIT_QUAD_LDD_P |
| stxa %g0, [%o0 + %g2] ASI_BLK_INIT_QUAD_LDD_P |
| stxa %g0, [%o0 + %g3] ASI_BLK_INIT_QUAD_LDD_P |
| add %o0, 32, %o0 |
| stxa %g0, [%o0 + %g0] ASI_BLK_INIT_QUAD_LDD_P |
| stxa %g0, [%o0 + %g1] ASI_BLK_INIT_QUAD_LDD_P |
| stxa %g0, [%o0 + %g2] ASI_BLK_INIT_QUAD_LDD_P |
| stxa %g0, [%o0 + %g3] ASI_BLK_INIT_QUAD_LDD_P |
| subcc %g7, 64, %g7 |
| bne,pt %xcc, 1b |
| add %o0, 32, %o0 |
| membar #Sync |
| retl |
| nop |
| |
/* Instruction words written by NG_DO_PATCH (SPARC V9 encodings):
 *   BRANCH_ALWAYS  "ba,pt %xcc, <disp19>" with the 19-bit displacement
 *                  field (bits 18..0) left as zero.
 *   NOP            the canonical nop, "sethi 0, %g0".
 */
#define BRANCH_ALWAYS	0x10680000
#define NOP		0x01000000

/* NG_DO_PATCH(OLD, NEW): overwrite the first two instruction words at OLD
 * with "branch to NEW" followed by a nop for the branch delay slot.
 *
 * Steps:
 *   - %g1 = NEW - OLD, the byte displacement of the branch.
 *   - sll 11 / srl 13 keep bits 20..2 of that displacement and place them
 *     in bits 18..0, i.e. the 19-bit word displacement field.
 *   - the displacement is OR'ed into BRANCH_ALWAYS and stored at OLD;
 *     NOP is stored at OLD + 4.
 *   - flush is issued once, on OLD.
 *
 * Clobbers: %g1, %g2, %g3.
 *
 * Limits: displacement bits above bit 20 are discarded without any check,
 * so NEW must lie within the reach of a signed 19-bit word displacement
 * (+/- 1MB) of OLD.
 *
 * NOTE(review): %hi/%lo build only a 32-bit value, so OLD and NEW are
 * assumed to be reachable with 32-bit addresses, and the single flush is
 * assumed to cover both patched words - confirm both for this kernel.
 */
#define NG_DO_PATCH(OLD, NEW)	\
	sethi	%hi(NEW), %g1; \
	or	%g1, %lo(NEW), %g1; \
	sethi	%hi(OLD), %g2; \
	or	%g2, %lo(OLD), %g2; \
	sub	%g1, %g2, %g1; \
	sethi	%hi(BRANCH_ALWAYS), %g3; \
	sll	%g1, 11, %g1; \
	srl	%g1, 11 + 2, %g1; \
	or	%g3, %lo(BRANCH_ALWAYS), %g3; \
	or	%g3, %g1, %g3; \
	stw	%g3, [%g2]; \
	sethi	%hi(NOP), %g3; \
	or	%g3, %lo(NOP), %g3; \
	stw	%g3, [%g2 + 0x4]; \
	flush	%g2;

| .globl niagara_patch_pageops |
| .type niagara_patch_pageops,#function |
| niagara_patch_pageops: |
| NG_DO_PATCH(copy_user_page, NGcopy_user_page) |
| NG_DO_PATCH(_clear_page, NGclear_page) |
| NG_DO_PATCH(clear_user_page, NGclear_user_page) |
| retl |
| nop |
| .size niagara_patch_pageops,.-niagara_patch_pageops |