1041394f3SDevin Teske /*- 2041394f3SDevin Teske * Copyright (c) 2001-2014 Devin Teske <dteske@FreeBSD.org> 3041394f3SDevin Teske * All rights reserved. 4041394f3SDevin Teske * 5041394f3SDevin Teske * Redistribution and use in source and binary forms, with or without 6041394f3SDevin Teske * modification, are permitted provided that the following conditions 7041394f3SDevin Teske * are met: 8041394f3SDevin Teske * 1. Redistributions of source code must retain the above copyright 9041394f3SDevin Teske * notice, this list of conditions and the following disclaimer. 10041394f3SDevin Teske * 2. Redistributions in binary form must reproduce the above copyright 11041394f3SDevin Teske * notice, this list of conditions and the following disclaimer in the 12041394f3SDevin Teske * documentation and/or other materials provided with the distribution. 13041394f3SDevin Teske * 14041394f3SDevin Teske * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 15041394f3SDevin Teske * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 16041394f3SDevin Teske * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 17041394f3SDevin Teske * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 18041394f3SDevin Teske * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 19041394f3SDevin Teske * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 20041394f3SDevin Teske * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 21041394f3SDevin Teske * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 22041394f3SDevin Teske * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 23041394f3SDevin Teske * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 24041394f3SDevin Teske * SUCH DAMAGE. 
25041394f3SDevin Teske */ 26041394f3SDevin Teske 27041394f3SDevin Teske #include <ctype.h> 28041394f3SDevin Teske #include <errno.h> 29*c3c06f94SFaraz Vahedi #include <stdint.h> 30041394f3SDevin Teske #include <stdlib.h> 31041394f3SDevin Teske #include <string.h> 32041394f3SDevin Teske 33041394f3SDevin Teske #include "string_m.h" 34041394f3SDevin Teske 35041394f3SDevin Teske /* 36041394f3SDevin Teske * Counts the number of occurrences of one string that appear in the source 37041394f3SDevin Teske * string. Return value is the total count. 38041394f3SDevin Teske * 39041394f3SDevin Teske * An example use would be if you need to know how large a block of memory 40041394f3SDevin Teske * needs to be for a replaceall() series. 41041394f3SDevin Teske */ 42041394f3SDevin Teske unsigned int 43041394f3SDevin Teske strcount(const char *source, const char *find) 44041394f3SDevin Teske { 45041394f3SDevin Teske const char *p = source; 46041394f3SDevin Teske size_t flen; 47041394f3SDevin Teske unsigned int n = 0; 48041394f3SDevin Teske 49041394f3SDevin Teske /* Both parameters are required */ 50041394f3SDevin Teske if (source == NULL || find == NULL) 51041394f3SDevin Teske return (0); 52041394f3SDevin Teske 53041394f3SDevin Teske /* Cache the length of find element */ 54041394f3SDevin Teske flen = strlen(find); 55041394f3SDevin Teske if (strlen(source) == 0 || flen == 0) 56041394f3SDevin Teske return (0); 57041394f3SDevin Teske 58041394f3SDevin Teske /* Loop until the end of the string */ 59041394f3SDevin Teske while (*p != '\0') { 60041394f3SDevin Teske if (strncmp(p, find, flen) == 0) { /* found an instance */ 61041394f3SDevin Teske p += flen; 62041394f3SDevin Teske n++; 63041394f3SDevin Teske } else 64041394f3SDevin Teske p++; 65041394f3SDevin Teske } 66041394f3SDevin Teske 67041394f3SDevin Teske return (n); 68041394f3SDevin Teske } 69041394f3SDevin Teske 70041394f3SDevin Teske /* 71041394f3SDevin Teske * Replaces all occurrences of `find' in `source' with `replace'. 
/*
 * Replaces all occurrences of `find' in `source' with `replace', in place.
 *
 * You should not pass a string constant as the first parameter, it needs to be
 * a pointer to writable memory. The block of memory that `source' points to
 * must be large enough to hold the result: when `replace' is longer than
 * `find', the result is longer than the original string. Use strcount() to
 * determine the number of occurrences and hence how much larger the block
 * needs to be. If `source' is too small the buffer is overrun.
 *
 * A NULL `replace' is treated as the empty string (occurrences are removed).
 *
 * errno is reset to zero on entry. The return value is the length (in bytes)
 * of the resulting string. A NULL `source' yields 0; a NULL or empty `find',
 * or one longer than `source', leaves `source' untouched and yields its
 * length. If the temporary working copy cannot be allocated, -1 is returned
 * and errno is left as set by malloc(3).
 */
int
replaceall(char *source, const char *find, const char *replace)
{
	const char *in;		/* read cursor: source or its saved copy */
	char *out;		/* write cursor into source */
	char *copy = NULL;	/* saved original, only when the text grows */
	size_t flen;
	size_t rlen;
	size_t slen;

	errno = 0; /* reset global error number */

	/* Check that we have non-null parameters */
	if (source == NULL)
		return (0);
	if (find == NULL)
		return ((int)strlen(source));

	/* Cache the length of the strings */
	slen = strlen(source);
	flen = strlen(find);
	rlen = replace != NULL ? strlen(replace) : 0;

	/* Cases where no replacements need to be made */
	if (slen == 0 || flen == 0 || slen < flen)
		return ((int)slen);

	/*
	 * When the text grows the write cursor overtakes the read cursor, so
	 * read from a private copy. Otherwise the write cursor can never pass
	 * the read cursor and the work is done directly in `source'.
	 */
	if (rlen > flen) {
		copy = malloc(slen + 1);
		if (copy == NULL) /* could not allocate memory */
			return (-1);
		memcpy(copy, source, slen + 1);
		in = copy;
	} else
		in = source;

	/* Reconstruct the string with the replacements */
	out = source;
	while (*in != '\0') {
		if (strncmp(in, find, flen) == 0) {
			/* found an occurrence */
			if (rlen > 0)
				memcpy(out, replace, rlen);
			out += rlen;
			in += flen;
		} else
			*out++ = *in++; /* copy character and increment */
	}

	/* Terminate the string */
	*out = '\0';

	/* Release the working copy (no-op when none was made) */
	free(copy);

	/* The write cursor sits on the terminator: its offset is the length */
	return ((int)(out - source));
}
/*
 * Expands escape sequences in the buffer pointed to by `source', in place.
 * This function steps through each character, and converts escape sequences
 * such as "\n", "\r", "\t" and others into their respective meanings.
 *
 * You should not pass a string constant or literal to this function or the
 * program will likely segmentation fault when it tries to modify the data.
 * A NULL `source' is ignored.
 *
 * The string length will either shorten or stay the same depending on whether
 * any escape sequences were converted but the amount of memory allocated does
 * not change.
 *
 * Interpreted sequences are:
 *
 *	\0NNN	character with octal value NNN (0 to 3 digits)
 *	\N	character with octal value N (0 thru 7)
 *	\a	alert (BEL)
 *	\b	backspace
 *	\f	form feed
 *	\n	new line
 *	\r	carriage return
 *	\t	horizontal tab
 *	\v	vertical tab
 *	\xNN	byte with hexadecimal value NN (1 to 2 digits)
 *
 * All other sequences are unescaped (ie. '\"' and '\#'). An `x' escape that
 * is not followed by a hexadecimal digit is dropped together with its
 * backslash and the character after it is copied as-is. A lone backslash at
 * the very end of the string is dropped.
 */
void
strexpand(char *source)
{
	const char *chr;	/* read cursor */
	char *pos;		/* write cursor, never ahead of chr */
	char d[4];		/* digits of a numeric escape, NUL-terminated */
	size_t n;		/* number of digits collected in d[] */

	if (source == NULL)
		return;

	/* Initialize position elements */
	pos = source;
	chr = source;

	/*
	 * Loop until the *read* cursor hits the end of the string. The write
	 * cursor lags behind once an escape has been collapsed, so testing it
	 * instead would walk the read cursor past the terminating NUL.
	 */
	while (*chr != '\0') {
		if (*chr != '\\') {
			*pos++ = *chr++; /* plain character: copy as-is */
			continue;
		}

		/* Replace the backslash with the correct character */
		switch (*++chr) {
		case 'a': *pos = '\a'; break; /* bell/alert (BEL) */
		case 'b': *pos = '\b'; break; /* backspace */
		case 'f': *pos = '\f'; break; /* form feed */
		case 'n': *pos = '\n'; break; /* new line */
		case 'r': *pos = '\r'; break; /* carriage return */
		case 't': *pos = '\t'; break; /* horizontal tab */
		case 'v': *pos = '\v'; break; /* vertical tab */
		case 'x': /* hex value (1 to 2 digits)(\xNN) */
			/* the cast keeps isxdigit() defined for bytes >= 0x80 */
			for (n = 0;
			    n < 2 && isxdigit((unsigned char)chr[1]); n++)
				d[n] = *++chr;
			d[n] = '\0';

			if (n > 0)
				*pos = (char)(uint8_t)strtoul(d, NULL, 16);
			else
				*pos = *++chr; /* no digits: take next char */
			break;
		case '0': /* octal value (0 to 3 digits)(\0NNN) */
			for (n = 0;
			    n < 3 && chr[1] >= '0' && chr[1] <= '7'; n++)
				d[n] = *++chr;
			d[n] = '\0';

			/* an empty d[] converts to 0, i.e. a NUL byte */
			*pos = (char)(uint8_t)strtoul(d, NULL, 8);
			break;
		default: /* single octal (\1..7) or unknown sequence */
			if (*chr >= '1' && *chr <= '7')
				*pos = (char)(*chr - '0');
			else
				*pos = *chr;
			break;
		}

		/*
		 * The escape ran into the terminator (trailing "\" or "\x");
		 * stop here rather than stepping the read cursor beyond it.
		 */
		if (*chr == '\0')
			break;

		/* Increment to next offset, possible next escape sequence */
		pos++;
		chr++;
	}

	/* Terminate the (possibly shortened) string */
	*pos = '\0';
}
/*
 * Expand only the escaped newlines in a buffer pointed to by `source'. This
 * function steps through each character, and converts the "\n" sequence into
 * a literal newline and the "\\n" sequence into "\n". More generally, when a
 * run of backslashes is followed by `n', the last backslash of the run is
 * replaced: by a newline if the run has odd length, by `n' if it is even.
 * Everything else is copied unchanged.
 *
 * You should not pass a string constant or literal to this function or the
 * program will likely segmentation fault when it tries to modify the data.
 * A NULL `source' is ignored.
 *
 * The string length will either shorten or stay the same depending on whether
 * any escaped newlines were converted but the amount of memory allocated does
 * not change.
 */
void
strexpandnl(char *source)
{
	size_t backslash = 0;	/* length of the current backslash run */
	const char *rd;		/* read cursor */
	char *wr;		/* write cursor, never ahead of rd */

	if (source == NULL)
		return;

	wr = source;
	for (rd = source; *rd != '\0'; rd++) {
		if (*rd == '\\') {
			backslash++;
			*wr++ = *rd;
		} else if (*rd == 'n' && backslash > 0) {
			/* overwrite the backslash written just before */
			wr[-1] = (backslash & 1) == 1 ? '\n' : 'n';
			backslash = 0;
		} else {
			backslash = 0;
			*wr++ = *rd;
		}
	}
	*wr = '\0';
}

/*
 * Convert a string to lower case, in place. You should not pass a string
 * constant to this function. Only pass pointers to writable memory with null
 * terminated string data. A NULL `source' is ignored.
 */
void
strtolower(char *source)
{
	char *p;

	if (source == NULL)
		return;

	/* tolower() is only defined for unsigned char values (and EOF) */
	for (p = source; *p != '\0'; p++)
		*p = (char)tolower((unsigned char)*p);
}