strncat.s revision 9a70fc3be3b1e966bf78825cdb8d509963a6f0a1
/*
* CDDL HEADER START
*
* The contents of this file are subject to the terms of the
* Common Development and Distribution License (the "License").
* You may not use this file except in compliance with the License.
*
* You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
* or http://www.opensolaris.org/os/licensing.
* See the License for the specific language governing permissions
* and limitations under the License.
*
* When distributing Covered Code, include this CDDL HEADER in each
* file and include the License file at usr/src/OPENSOLARIS.LICENSE.
* If applicable, add the following below this CDDL HEADER, with the
* fields enclosed by brackets "[]" replaced with your own identifying
* information: Portions Copyright [yyyy] [name of copyright owner]
*
* CDDL HEADER END
*/
/*
* Copyright 2004 Sun Microsystems, Inc. All rights reserved.
* Use is subject to license terms.
*/
.file "strncat.s"
/
/ strncat(s1, s2, n)
/
/ Concatenates s2 on the end of s1. s1's space must be large enough.
/ At most n characters are moved.
/ Returns s1.
/
/ Fast assembly language version of the following C-program strncat
/ which represents the `standard' for the C-library.
/
/ char *
/ strncat(char *s1, const char *s2, size_t n)
/ {
/ char *os1 = s1;
/
/ n++;
/ while (*s1++)
/ ;
/ --s1;
/ while (*s1++ = *s2++)
/ if (--n == 0) {
/ s1[-1] = '\0';
/ break;
/ }
/ return (os1);
/ }
/
/ In this assembly language version, the following expression is used
/ to check if a 32-bit word data contains a null byte or not:
/ (((A & 0x7f7f7f7f) + 0x7f7f7f7f) | A) & 0x80808080
/ If the above expression geneates a value other than 0x80808080,
/ that means the 32-bit word data contains a null byte.
/
/ The above has been extended for 64-bit support.
/
#include "SYS.h"
ENTRY(strncat) /* (char *, char *, size_t) */
movq %rdi, %rax / save return value
movabsq $0x7f7f7f7f7f7f7f7f, %r8 / %r8 = 0x7f...
movq %r8, %r9
notq %r9 / %r9 = 0x80...
testq $7, %rdi / if %rdi not quadword aligned
jnz .L1 / goto .L1
.align 4
.L2:
movq (%rdi), %r11 / move 1 quadword from (%rdi) to %r11
movq %r8, %rcx
andq %r11, %rcx / %rcx = %r11 & 0x7f7f7f7f
addq $8, %rdi / next quadword
addq %r8, %rcx / %rcx += 0x7f7f7f7f
orq %r11, %rcx / %rcx |= %r11
andq %r9, %rcx / %rcx &= 0x80808080
cmpq %r9, %rcx / if no null byte in this quadword
je .L2 / goto .L2
subq $8, %rdi / post-incremented
.L1:
cmpb $0, (%rdi) / if a byte in (%rdi) is null
je .L3 / goto .L3
incq %rdi / next byte
testq $7, %rdi / if %rdi not quadword aligned
jnz .L1 / goto .L1
jmp .L2 / goto .L2 (%rdi quadword aligned)
.align 4
.L3:
/ %rdi points to a null byte in destination string
testq $7, %rsi / if %rsi not quadword aligned
jnz .L4 / goto .L4
cmpq $8, %rdx / if number of bytes < 8
jb .L7 / goto .L7
.align 4
.L5:
movq (%rsi), %r11 / move 1 quadword from (%rsi) to %r11
movq %r8, %rcx
andq %r11, %rcx / %rcx = %r11 & 0x7f7f7f7f
addq $8, %rsi / next quadword
addq %r8, %rcx / %rcx += 0x7f7f7f7f
orq %r11, %rcx / %rcx |= %r11
andq %r9, %rcx / %rcx &= 0x80808080
cmpq %r9, %rcx / if null byte in this quadword
jne .L6 / goto .L6
movq %r11, (%rdi) / copy this quadword to (%rdi)
subq $8, %rdx / decrement number of bytes by 8
addq $8, %rdi / next quadword
cmpq $8, %rdx / if number of bytes >= 8
jae .L5 / goto .L5
jmp .L7 / goto .L7
.L6:
subq $8, %rsi / post-incremented
.align 4
.L7:
/ number of bytes < 8 or a null byte found in the quadword
cmpq $0, %rdx / if number of bytes == 0
jz .L8 / goto .L8 (finished)
movb (%rsi), %r11b / %r11b = a byte in (%rsi)
decq %rdx / decrement number of bytes by 1
movb %r11b, (%rdi) / copy %r11b to (%rdi)
incq %rsi / next byte
incq %rdi / next byte
cmpb $0, %r11b / compare %r11b with a null byte
je .L9 / if %r11b is a null, goto .L9
jmp .L7 / goto .L7
.align 4
.L4:
/ %rsi not aligned
cmpq $0, %rdx / if number of bytes == 0
jz .L8 / goto .L8 (finished)
movb (%rsi), %r11b / %r11b = a byte in (%rsi)
decq %rdx / decrement number of bytes by 1
movb %r11b, (%rdi) / copy %r11b to (%rdi)
incq %rdi / next byte
incq %rsi / next byte
cmpb $0, %r11b / compare %r11b with a null byte
je .L9 / if %r11b is a null, goto .L9
jmp .L4 / goto .L4
.align 4
.L8:
movb $0, (%rdi) / null termination
.L9:
ret
SET_SIZE(strncat)