Home | History | Annotate | Line # | Download | only in libopts
streqvcmp.c revision 1.8
      1 /*	$NetBSD: streqvcmp.c,v 1.8 2024/08/18 20:47:25 christos Exp $	*/
      2 
      3 
      4 /**
      5  * \file streqvcmp.c
      6  *
      7  *  String Equivalence Comparison
      8  *
      9  *  These routines allow any character to be mapped to any other
     10  *  character before comparison.  In processing long option names,
     11  *  the characters "-", "_" and "^" all need to be equivalent
     12  *  (because they are treated so by different development environments).
     13  *
     14  * @addtogroup autoopts
     15  * @{
     16  */
     17 /*
     18  *  This file is part of AutoOpts, a companion to AutoGen.
     19  *  AutoOpts is free software.
     20  *  AutoOpts is Copyright (C) 1992-2018 by Bruce Korb - all rights reserved
     21  *
     22  *  AutoOpts is available under any one of two licenses.  The license
     23  *  in use must be one of these two and the choice is under the control
     24  *  of the user of the license.
     25  *
     26  *   The GNU Lesser General Public License, version 3 or later
     27  *      See the files "COPYING.lgplv3" and "COPYING.gplv3"
     28  *
     29  *   The Modified Berkeley Software Distribution License
     30  *      See the file "COPYING.mbsd"
     31  *
     32  *  These files have the following sha256 sums:
     33  *
     34  *  8584710e9b04216a394078dc156b781d0b47e1729104d666658aecef8ee32e95  COPYING.gplv3
     35  *  4379e7444a0e2ce2b12dd6f5a52a27a4d02d39d247901d3285c88cf0d37f477b  COPYING.lgplv3
     36  *  13aa749a5b0a454917a944ed8fffc530b784f5ead522b1aacaf4ec8aa55a6239  COPYING.mbsd
     37  *
     38  * This array is designed for mapping upper and lower case letters
     39  * together for a case independent comparison.  The mappings are
     40  * based upon ASCII character sequences.
     41  */
     42   static unsigned char charmap[] = {
     43     NUL,  0x01, 0x02, 0x03,  0x04, 0x05, 0x06, '\a',
     44     '\b', '\t', NL,   '\v',  '\f', '\r', 0x0E, 0x0F,
     45     0x10, 0x11, 0x12, 0x13,  0x14, 0x15, 0x16, 0x17,
     46     0x18, 0x19, 0x1A, 0x1B,  0x1C, 0x1D, 0x1E, 0x1F,
     47 
     48     ' ',  '!',  '"',  '#',   '$',  '%',  '&',  '\'',
     49     '(',  ')',  '*',  '+',   ',',  '-',  '.',  '/',
     50     '0',  '1',  '2',  '3',   '4',  '5',  '6',  '7',
     51     '8',  '9',  ':',  ';',   '<',  '=',  '>',  '?',
     52 
     53     '@',  'a',  'b',  'c',   'd',  'e',  'f',  'g',
     54     'h',  'i',  'j',  'k',   'l',  'm',  'n',  'o',
     55     'p',  'q',  'r',  's',   't',  'u',  'v',  'w',
     56     'x',  'y',  'z',  '[',   '\\', ']',  '^',  '_',
     57     '`',  'a',  'b',  'c',   'd',  'e',  'f',  'g',
     58     'h',  'i',  'j',  'k',   'l',  'm',  'n',  'o',
     59     'p',  'q',  'r',  's',   't',  'u',  'v',  'w',
     60     'x',  'y',  'z',  '{',   '|',  '}',  '~',  0x7f,
     61 
     62     0x80, 0x81, 0x82, 0x83,  0x84, 0x85, 0x86, 0x87,
     63     0x88, 0x89, 0x8A, 0x8B,  0x8C, 0x8D, 0x8E, 0x8F,
     64     0x90, 0x91, 0x92, 0x93,  0x94, 0x95, 0x96, 0x97,
     65     0x98, 0x99, 0x9A, 0x9B,  0x9C, 0x9D, 0x9E, 0x9F,
     66     0xA0, 0xA1, 0xA2, 0xA3,  0xA4, 0xA5, 0xA6, 0xA7,
     67     0xA8, 0xA9, 0xAA, 0xAB,  0xAC, 0xAD, 0xAE, 0xAF,
     68     0xB0, 0xB1, 0xB2, 0xB3,  0xB4, 0xB5, 0xB6, 0xB7,
     69     0xB8, 0xB9, 0xBA, 0xBB,  0xBC, 0xBD, 0xBE, 0xBF,
     70 
     71     0xC0, 0xC1, 0xC2, 0xC3,  0xC4, 0xC5, 0xC6, 0xC7,
     72     0xC8, 0xC9, 0xCA, 0xCB,  0xCC, 0xCD, 0xCE, 0xCF,
     73     0xD0, 0xD1, 0xD2, 0xD3,  0xD4, 0xD5, 0xD6, 0xD7,
     74     0xD8, 0xD9, 0xDA, 0xDB,  0xDC, 0xDD, 0xDE, 0xDF,
     75     0xE0, 0xE1, 0xE2, 0xE3,  0xE4, 0xE5, 0xE6, 0xE7,
     76     0xE8, 0xE9, 0xEA, 0xEB,  0xEC, 0xED, 0xEE, 0xEF,
     77     0xF0, 0xF1, 0xF2, 0xF3,  0xF4, 0xF5, 0xF6, 0xF7,
     78     0xF8, 0xF9, 0xFA, 0xFB,  0xFC, 0xFD, 0xFE, 0xFF,
     79 };
     80 
     81 
     82 /*=export_func strneqvcmp
     83  *
     84  * what: compare two strings with an equivalence mapping
     85  *
     86  * arg:  + char const * + str1 + first string +
     87  * arg:  + char const * + str2 + second string +
     88  * arg:  + int          + ct   + compare length +
     89  *
     90  * ret_type:  int
     91  * ret_desc:  the difference between two differing characters
     92  *
     93  * doc:
     94  *
     95  * Using a character mapping, two strings are compared for "equivalence".
     96  * Each input character is mapped to a comparison character and the
     97  * mapped-to characters are compared for the two NUL terminated input strings.
     98  * The comparison is limited to @code{ct} bytes.
     99  * This function name is mapped to option_strneqvcmp so as to not conflict
    100  * with the POSIX name space.
    101  *
    102  * err:  none checked.  Caller responsible for seg faults.
    103 =*/
    104 int
    105 strneqvcmp(char const * s1, char const * s2, int ct)
    106 {
    107     for (; ct > 0; --ct) {
    108         unsigned char u1 = (unsigned char) *s1++;
    109         unsigned char u2 = (unsigned char) *s2++;
    110         int dif;
    111         if (u1 == u2) {
    112             if (u1 == NUL)
    113                 return 0;
    114             continue;
    115         }
    116 
    117         dif = charmap[ u1 ] - charmap[ u2 ];
    118 
    119         if (dif != 0)
    120             return dif;
    121 
    122         if (u1 == NUL)
    123             return 0;
    124     }
    125 
    126     return 0;
    127 }
    128 
    129 
    130 /*=export_func streqvcmp
    131  *
    132  * what: compare two strings with an equivalence mapping
    133  *
    134  * arg:  + char const * + str1 + first string +
    135  * arg:  + char const * + str2 + second string +
    136  *
    137  * ret_type:  int
    138  * ret_desc:  the difference between two differing characters
    139  *
    140  * doc:
    141  *
    142  * Using a character mapping, two strings are compared for "equivalence".
    143  * Each input character is mapped to a comparison character and the
    144  * mapped-to characters are compared for the two NUL terminated input strings.
    145  * This function name is mapped to option_streqvcmp so as to not conflict
    146  * with the POSIX name space.
    147  *
    148  * err:  none checked.  Caller responsible for seg faults.
    149 =*/
    150 int
    151 streqvcmp(char const * s1, char const * s2)
    152 {
    153     for (;;) {
    154         unsigned char u1 = (unsigned char) *s1++;
    155         unsigned char u2 = (unsigned char) *s2++;
    156         int dif;
    157         if (u1 == u2) {
    158             if (u1 == NUL)
    159                 return 0;
    160             continue;
    161         }
    162 
    163         dif = charmap[ u1 ] - charmap[ u2 ];
    164 
    165         if (dif != 0)
    166             return dif;
    167 
    168         if (u1 == NUL)
    169             return 0;
    170     }
    171 }
    172 
    173 
    174 /*=export_func streqvmap
    175  *
    176  * what: Set the character mappings for the streqv functions
    177  *
    178  * arg:  + char + from + Input character +
    179  * arg:  + char + to   + Mapped-to character +
    180  * arg:  + int  + ct   + compare length +
    181  *
    182  * doc:
    183  *
    184  * Set the character mapping.  If the count (@code{ct}) is set to zero, then
    185  * the map is cleared by setting all entries in the map to their index
    186  * value.  Otherwise, the "@code{From}" character is mapped to the "@code{To}"
    187  * character.  If @code{ct} is greater than 1, then @code{From} and @code{To}
    188  * are incremented and the process repeated until @code{ct} entries have been
    189  * set. For example,
    190  * @example
    191  *    streqvmap('a', 'A', 26);
    192  * @end example
    193  * @noindent
    194  * will alter the mapping so that all English lower case letters
    195  * will map to upper case.
    196  *
    197  * This function name is mapped to option_streqvmap so as to not conflict
    198  * with the POSIX name space.
    199  *
    200  * err:  none.
    201 =*/
    202 void
    203 streqvmap(char from, char to, int ct)
    204 {
    205     if (ct == 0) {
    206         ct = sizeof(charmap) - 1;
    207         do  {
    208             charmap[ct] = (unsigned char)ct;
    209         } while (--ct >= 0);
    210     }
    211 
    212     else {
    213         unsigned int i_to   = (int)to   & 0xFF;
    214         unsigned int i_from = (int)from & 0xFF;
    215 
    216         do  {
    217             charmap[i_from] = (unsigned char)i_to;
    218             i_from++;
    219             i_to++;
    220             if ((i_from >= sizeof(charmap)) || (i_to >= sizeof(charmap)))
    221                 break;
    222         } while (--ct > 0);
    223     }
    224 }
    225 
    226 
    227 /*=export_func strequate
    228  *
    229  * what: map a list of characters to the same value
    230  *
    231  * arg:  + char const * + ch_list + characters to equivalence +
    232  *
    233  * doc:
    234  *
    235  * Each character in the input string get mapped to the first character
    236  * in the string.
    237  * This function name is mapped to option_strequate so as to not conflict
    238  * with the POSIX name space.
    239  *
    240  * err:  none.
    241 =*/
    242 void
    243 strequate(char const * s)
    244 {
    245     if ((s != NULL) && (*s != NUL)) {
    246         unsigned char equiv = (unsigned char)*s;
    247         while (*s != NUL)
    248             charmap[(unsigned char)*(s++)] = equiv;
    249     }
    250 }
    251 
    252 
    253 /*=export_func strtransform
    254  *
    255  * what: convert a string into its mapped-to value
    256  *
    257  * arg:  + char *       + dest + output string +
    258  * arg:  + char const * + src  + input string +
    259  *
    260  * doc:
    261  *
    262  * Each character in the input string is mapped and the mapped-to
    263  * character is put into the output.
    264  * This function name is mapped to option_strtransform so as to not conflict
    265  * with the POSIX name space.
    266  *
    267  * The source and destination may be the same.
    268  *
    269  * err:  none.
    270 =*/
    271 void
    272 strtransform(char * d, char const * s)
    273 {
    274     do  {
    275         *(d++) = (char)charmap[(unsigned char)*s];
    276     } while (*(s++) != NUL);
    277 }
    278 
    279 /** @}
    280  *
    281  * Local Variables:
    282  * mode: C
    283  * c-file-style: "stroustrup"
    284  * indent-tabs-mode: nil
    285  * End:
    286  * end of autoopts/streqvcmp.c */
    287