diff options
author | Miod Vallat <miod@cvs.openbsd.org> | 2006-11-10 19:20:30 +0000 |
---|---|---|
committer | Miod Vallat <miod@cvs.openbsd.org> | 2006-11-10 19:20:30 +0000 |
commit | 73fc99852df1360e5751a7ca64964ac6c2c1d2fa (patch) | |
tree | 20081e1c93b7b1f042e4e02929d417623fe71c27 | |
parent | b32df8f435769c1c1761a730e9305c69fa7f7e19 (diff) |
Avoid an unnecessary branch for byte-by-byte copyin() and copyout().
-rw-r--r-- | sys/arch/m88k/m88k/subr.S | 51 |
1 files changed, 26 insertions, 25 deletions
diff --git a/sys/arch/m88k/m88k/subr.S b/sys/arch/m88k/m88k/subr.S index 0ef756ac903..2d966e1cdbf 100644 --- a/sys/arch/m88k/m88k/subr.S +++ b/sys/arch/m88k/m88k/subr.S @@ -1,4 +1,4 @@ -/* $OpenBSD: subr.S,v 1.11 2006/01/02 19:46:12 miod Exp $ */ +/* $OpenBSD: subr.S,v 1.12 2006/11/10 19:20:29 miod Exp $ */ /* * Mach Operating System * Copyright (c) 1993-1992 Carnegie Mellon University @@ -200,14 +200,12 @@ ENTRY(copyin) or r5, r5, lo16(_ASM_LABEL(Lciflt)) st r5, r6, PCB_ONFAULT /* pcb_onfault = Lciflt */ -#if 0 - bcnd ne0, LEN, 1f /* XXX optimize len = 0 case */ - or r2, r0, 0 - br _ASM_LABEL(Lcidone) -1: bcnd lt0, LEN, _ASM_LABEL(Lciflt) /* EFAULT if len < 0 */ -#endif - - /* If it's a small length (less than 8), then do byte-by-byte */ + /* + * If it's a small length (less than 8), then do byte-by-byte. + * Despite not being optimal if len is 4, and from and to + * are word-aligned, this is still faster than doing more tests + * to save an hyperthetical fraction of cycle. + */ cmp r9, LEN, 8 bb1 lt, r9, _ASM_LABEL(copyin_byte_only) @@ -230,8 +228,11 @@ ASLOCAL(copyin_right_aligned_to_halfword) bb1 1, LEN, _ASM_LABEL(copyin_right_align_to_word) ASLOCAL(copyin_right_aligned_to_word) - /* At this point, both SRC and DEST are aligned to a word */ - /* boundary, and LEN is an even multiple of 4. */ + /* + * At this point, both SRC and DEST are aligned to a word + * boundary, and LEN is a multiple of 4. We want it an even + * multiple of 4. + */ bb1.n 2, LEN, _ASM_LABEL(copyin_right_align_to_doubleword) or r7, r0, 4 @@ -259,8 +260,6 @@ ASLOCAL(copyin_right_aligned_to_doubleword) br.n _ASM_LABEL(Lcidone) or r2, r0, r0 /* successful return */ - /***************************************************/ - ASLOCAL(copyin_left_align_to_halfword) #ifdef ERRATA__XXX_USR NOP @@ -353,8 +352,8 @@ ASLOCAL(copyin_byte_only) bcnd.n ne0, LEN, 1b st.b r5, DEST, LEN 2: - br.n _ASM_LABEL(Lcidone) - or r2, r0, r0 /* successful return */ + or r2, r0, r0 /* successful return */ + /* FALLTHROUGH */ ASLOCAL(Lcidone) ldcr r5, CPU @@ -369,6 +368,7 @@ ASLOCAL(Lciflt) #undef SRC #undef DEST #undef LEN + /*######################################################################*/ /*######################################################################*/ @@ -465,13 +465,13 @@ ENTRY(copyout) or.u r5, r0, hi16(_ASM_LABEL(Lcoflt)) or r5, r5, lo16(_ASM_LABEL(Lcoflt)) st r5, r6, PCB_ONFAULT /* pcb_onfault = Lcoflt */ -#if 0 - bcnd ne0, LEN, 1f /* XXX optimize len = 0 case */ - or r2, r0, 0 - br _ASM_LABEL(Lcodone) -1: bcnd lt0, LEN, _ASM_LABEL(Lcoflt) /* EFAULT if len < 0 */ -#endif - /* If it's a small length (less than 8), then do byte-by-byte */ + + /* + * If it's a small length (less than 8), then do byte-by-byte. + * Despite not being optimal if len is 4, and from and to + * are word-aligned, this is still faster than doing more tests + * to save an hyperthetical fraction of cycle. + */ cmp r9, LEN, 8 bb1 lt, r9, _ASM_LABEL(copyout_byte_only) @@ -496,7 +496,8 @@ ASLOCAL(copyout_right_aligned_to_word) /* * At this point, both SRC and DEST are aligned to a word - * boundary, and LEN is an even multiple of 4. + * boundary, and LEN is a multiple of 4. We want it an even + * multiple of 4. */ bb1.n 2, LEN, _ASM_LABEL(copyout_right_align_to_doubleword) or r7, r0, 4 @@ -627,8 +628,8 @@ ASLOCAL(copyout_byte_only) #endif 2: - br.n _ASM_LABEL(Lcodone) - or r2, r0, r0 /* successful return */ + or r2, r0, r0 /* successful return */ + /* FALLTHROUGH */ ASLOCAL(Lcodone) ldcr r5, CPU |