1/******************************************************************************* 2 * 3 * Copyright (c) 1993 Intel Corporation 4 * 5 * Intel hereby grants you permission to copy, modify, and distribute this 6 * software and its documentation. Intel grants this permission provided 7 * that the above copyright notice appears in all copies and that both the 8 * copyright notice and this permission notice appear in supporting 9 * documentation. In addition, Intel grants this permission provided that 10 * you prominently mark as "not part of the original" any modifications 11 * made to this software or documentation, and that the name of Intel 12 * Corporation not be used in advertising or publicity pertaining to 13 * distribution of the software or the documentation without specific, 14 * written prior permission. 15 * 16 * Intel Corporation provides this AS IS, WITHOUT ANY WARRANTY, EXPRESS OR 17 * IMPLIED, INCLUDING, WITHOUT LIMITATION, ANY WARRANTY OF MERCHANTABILITY 18 * OR FITNESS FOR A PARTICULAR PURPOSE. Intel makes no guarantee or 19 * representations regarding the use of, or the results of the use of, 20 * the software and documentation in terms of correctness, accuracy, 21 * reliability, currentness, or otherwise; and you rely on the software, 22 * documentation and results solely at your own risk. 23 * 24 * IN NO EVENT SHALL INTEL BE LIABLE FOR ANY LOSS OF USE, LOSS OF BUSINESS, 25 * LOSS OF PROFITS, INDIRECT, INCIDENTAL, SPECIAL OR CONSEQUENTIAL DAMAGES 26 * OF ANY KIND. IN NO EVENT SHALL INTEL'S TOTAL LIABILITY EXCEED THE SUM 27 * PAID TO INTEL FOR THE PRODUCT LICENSED HEREUNDER. 
28 * 29 ******************************************************************************/ 30 31 .file "strcmp.s" 32#ifdef __PIC 33 .pic 34#endif 35#ifdef __PID 36 .pid 37#endif 38/* 39 * (c) copyright 1988,1993 Intel Corp., all rights reserved 40 */ 41/* 42 procedure strcmp (optimized assembler version for the 80960K Series) 43 44 result = strcmp (src1_addr, src2_addr) 45 46 compare the null terminated string pointed to by src1_addr to 47 the string pointed to by src2_addr. Return 0 iff the strings 48 are equal, -1 if src1_addr is lexicographically less than src2_addr, 49 and 1 if it is lexicographically greater. 50 51 Undefined behavior will occur if the end of either source string 52 (i.e. the terminating null byte) is in the last two words of the 53 program's allocated memory space. This is so because strcmp fetches 54 ahead. Disallowing the fetch ahead would impose a severe performance 55 penalty. 56 57 Strategy: 58 59 Fetch the source strings by words and compare the words until either 60 differing words are found or the null byte is encountered. In either 61 case, move through the word until either the differing byte is found, 62 in which case return -1 or 1 appropriately; or the null byte is 63 encountered, in which case, return zero (equality). 64 65 Tactics: 66 67 1) Do NOT try to fetch the words in a word aligned manner because, 68 in my judgement, the performance degradation experienced due to 69 non-aligned accesses does NOT outweigh the time and complexity added 70 by the preamble and convoluted body that would be necessary to assure 71 alignment. This is supported by the intuition that many source 72 strings will be word aligned to begin with. 
*/

/*
 * strcmp: two entry points sharing one body.
 *
 *   _strcmp    loads the address of .Lrett into g14 and falls through
 *              into __strcmp, so the closing "bx (g7)" lands on the
 *              "ret" at .Lrett.
 *   __strcmp   uses whatever return address is already in g14; the
 *              closing "bx (g7)" branches straight back to it.
 *
 * In:      g0 = src1_addr, g1 = src2_addr
 * Out:     g0 = 0 if the strings are equal, -1 if the first differing
 *               byte of src1 is below that of src2, 1 if it is above
 *               (bytes are compared with ordinal compares)
 * Written: g0-g7; g14 is zero on exit
 *
 * Register roles inside the body:
 *   g2 = current src1 word        g3 = current src2 word
 *   g4 = byte mask (0xff, shifted left 8 bits per byte examined)
 *   g5 = fetched-ahead src1 word, then the masked src1 byte
 *   g6 = masked src2 byte         g7 = saved return address
 *
 * Changes that are not part of the original source: the local labels
 * .diff/.neg now carry the .L prefix used by the other local labels,
 * the unreferenced .Lexit label is gone, and the commentary is new.
 * The instruction sequence is unchanged.
 */

	.globl	_strcmp
	.globl	__strcmp
	.leafproc	_strcmp,__strcmp
	.align	2

_strcmp:
#ifndef __PIC
	lda	.Lrett,g14
#else
	lda	.Lrett-(.+8)(ip),g14
#endif
__strcmp:
	ld	(g0), g5	# fetch first word of source_1
	mov	g14,g7		# preserve return address
	ldconst	0,g14		# conform to register conventions
	ldconst	0xff,g4		# byte extraction mask

/* Word loop: runs while the src1 word has no null byte and equals the src2 word. */
.Lwloop:
	addo	4,g0,g0		# post-increment source_1 byte ptr
	ld	(g1), g3	# fetch word of source_2
	scanbyte 0,g5		# does word have a null byte?
	mov	g5,g2		# save a copy of the source_1 word
	be	.Lcloop		# branch if null byte encountered
	cmpo	g2,g3		# are the source words the same?
	addo	4,g1,g1		# post-increment source_2 byte ptr
	ld	(g0), g5	# fetch ahead next word of source_1
	be	.Lwloop		# fall thru if words are unequal

/*
 * Byte loop: walk g2/g3 one byte at a time, least significant byte
 * first, until the bytes differ or a matching null byte is reached.
 */
.Lcloop:
	and	g4,g2,g5	# extract and compare individual bytes
	and	g4,g3,g6
	cmpobne	g5,g6,.Ldiff	# if they differ, go return 1 or -1
	cmpo	0,g6		# they are the same.  Are they null?
	shlo	8,g4,g4		# position mask for next extraction
	bne	.Lcloop		# loop if null not encountered

	mov	0,g0		# return equality
	bx	(g7)
.Lrett:
	ret			# return path for the _strcmp entry

/* Condition code here is still the one set by the cmpobne above. */
.Ldiff:
	bl	.Lneg		# source_1 byte is the smaller one
	mov	1,g0		# source_1 byte is the larger one
	bx	(g7)

.Lneg:
	subi	1,0,g0		# g0 = 0 - 1 = -1
	bx	(g7)