Subversion Repositories HelenOS

Rev

Rev 4279 | Rev 4281 | Go to most recent revision | Blame | Compare with Previous | Last modification | View Log | Download | RSS feed

  1. /*
  2.  * Copyright (c) 2005 Martin Decky
  3.  * Copyright (c) 2008 Jiri Svoboda
  4.  * All rights reserved.
  5.  *
  6.  * Redistribution and use in source and binary forms, with or without
  7.  * modification, are permitted provided that the following conditions
  8.  * are met:
  9.  *
  10.  * - Redistributions of source code must retain the above copyright
  11.  *   notice, this list of conditions and the following disclaimer.
  12.  * - Redistributions in binary form must reproduce the above copyright
  13.  *   notice, this list of conditions and the following disclaimer in the
  14.  *   documentation and/or other materials provided with the distribution.
  15.  * - The name of the author may not be used to endorse or promote products
  16.  *   derived from this software without specific prior written permission.
  17.  *
  18.  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
  19.  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  20.  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
  21.  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
  22.  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  23.  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  24.  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  25.  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  26.  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
  27.  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  28.  */
  29.  
  30. /** @addtogroup libc
  31.  * @{
  32.  */
  33. /** @file
  34.  */
  35.  
  36. #include <string.h>
  37. #include <stdlib.h>
  38. #include <limits.h>
  39. #include <ctype.h>
  40. #include <malloc.h>
  41. #include <errno.h>
  42. #include <align.h>
  43. #include <mem.h>
  44. #include <string.h>
  45.  
  46. /** Byte mask consisting of lowest @n bits (out of 8) */
  47. #define LO_MASK_8(n)  ((uint8_t) ((1 << (n)) - 1))
  48.  
  49. /** Byte mask consisting of lowest @n bits (out of 32) */
  50. #define LO_MASK_32(n)  ((uint32_t) ((1 << (n)) - 1))
  51.  
  52. /** Byte mask consisting of highest @n bits (out of 8) */
  53. #define HI_MASK_8(n)  (~LO_MASK_8(8 - (n)))
  54.  
  55. /** Number of data bits in a UTF-8 continuation byte */
  56. #define CONT_BITS  6
  57.  
  58. /** Decode a single character from a string.
  59.  *
  60.  * Decode a single character from a string of size @a size. Decoding starts
  61.  * at @a offset and this offset is moved to the beginning of the next
  62.  * character. In case of decoding error, offset generally advances at least
  63.  * by one. However, offset is never moved beyond size.
  64.  *
  65.  * @param str    String (not necessarily NULL-terminated).
  66.  * @param offset Byte offset in string where to start decoding.
  67.  * @param size   Size of the string (in bytes).
  68.  *
  69.  * @return Value of decoded character, U_SPECIAL on decoding error or
  70.  *         NULL if attempt to decode beyond @a size.
  71.  *
  72.  */
  73. wchar_t str_decode(const char *str, size_t *offset, size_t size)
  74. {
  75.     if (*offset + 1 > size)
  76.         return 0;
  77.    
  78.     /* First byte read from string */
  79.     uint8_t b0 = (uint8_t) str[(*offset)++];
  80.    
  81.     /* Determine code length */
  82.    
  83.     unsigned int b0_bits;  /* Data bits in first byte */
  84.     unsigned int cbytes;   /* Number of continuation bytes */
  85.    
  86.     if ((b0 & 0x80) == 0) {
  87.         /* 0xxxxxxx (Plain ASCII) */
  88.         b0_bits = 7;
  89.         cbytes = 0;
  90.     } else if ((b0 & 0xe0) == 0xc0) {
  91.         /* 110xxxxx 10xxxxxx */
  92.         b0_bits = 5;
  93.         cbytes = 1;
  94.     } else if ((b0 & 0xf0) == 0xe0) {
  95.         /* 1110xxxx 10xxxxxx 10xxxxxx */
  96.         b0_bits = 4;
  97.         cbytes = 2;
  98.     } else if ((b0 & 0xf8) == 0xf0) {
  99.         /* 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx */
  100.         b0_bits = 3;
  101.         cbytes = 3;
  102.     } else {
  103.         /* 10xxxxxx -- unexpected continuation byte */
  104.         return U_SPECIAL;
  105.     }
  106.    
  107.     if (*offset + cbytes > size)
  108.         return U_SPECIAL;
  109.    
  110.     wchar_t ch = b0 & LO_MASK_8(b0_bits);
  111.    
  112.     /* Decode continuation bytes */
  113.     while (cbytes > 0) {
  114.         uint8_t b = (uint8_t) str[(*offset)++];
  115.        
  116.         /* Must be 10xxxxxx */
  117.         if ((b & 0xc0) != 0x80)
  118.             return U_SPECIAL;
  119.        
  120.         /* Shift data bits to ch */
  121.         ch = (ch << CONT_BITS) | (wchar_t) (b & LO_MASK_8(CONT_BITS));
  122.         cbytes--;
  123.     }
  124.    
  125.     return ch;
  126. }
  127.  
  128. /** Encode a single character to string representation.
  129.  *
  130.  * Encode a single character to string representation (i.e. UTF-8) and store
  131.  * it into a buffer at @a offset. Encoding starts at @a offset and this offset
  132.  * is moved to the position where the next character can be written to.
  133.  *
  134.  * @param ch     Input character.
  135.  * @param str    Output buffer.
  136.  * @param offset Byte offset where to start writing.
  137.  * @param size   Size of the output buffer (in bytes).
  138.  *
  139.  * @return EOK if the character was encoded successfully, EOVERFLOW if there
  140.  *     was not enough space in the output buffer or EINVAL if the character
  141.  *     code was invalid.
  142.  */
  143. int chr_encode(const wchar_t ch, char *str, size_t *offset, size_t size)
  144. {
  145.     if (*offset >= size)
  146.         return EOVERFLOW;
  147.    
  148.     if (!chr_check(ch))
  149.         return EINVAL;
  150.    
  151.     /* Unsigned version of ch (bit operations should only be done
  152.        on unsigned types). */
  153.     uint32_t cc = (uint32_t) ch;
  154.    
  155.     /* Determine how many continuation bytes are needed */
  156.    
  157.     unsigned int b0_bits;  /* Data bits in first byte */
  158.     unsigned int cbytes;   /* Number of continuation bytes */
  159.    
  160.     if ((cc & ~LO_MASK_32(7)) == 0) {
  161.         b0_bits = 7;
  162.         cbytes = 0;
  163.     } else if ((cc & ~LO_MASK_32(11)) == 0) {
  164.         b0_bits = 5;
  165.         cbytes = 1;
  166.     } else if ((cc & ~LO_MASK_32(16)) == 0) {
  167.         b0_bits = 4;
  168.         cbytes = 2;
  169.     } else if ((cc & ~LO_MASK_32(21)) == 0) {
  170.         b0_bits = 3;
  171.         cbytes = 3;
  172.     } else {
  173.         /* Codes longer than 21 bits are not supported */
  174.         return EINVAL;
  175.     }
  176.    
  177.     /* Check for available space in buffer */
  178.     if (*offset + cbytes >= size)
  179.         return EOVERFLOW;
  180.    
  181.     /* Encode continuation bytes */
  182.     unsigned int i;
  183.     for (i = cbytes; i > 0; i--) {
  184.         str[*offset + i] = 0x80 | (cc & LO_MASK_32(CONT_BITS));
  185.         cc = cc >> CONT_BITS;
  186.     }
  187.    
  188.     /* Encode first byte */
  189.     str[*offset] = (cc & LO_MASK_32(b0_bits)) | HI_MASK_8(8 - b0_bits - 1);
  190.    
  191.     /* Advance offset */
  192.     *offset += cbytes + 1;
  193.    
  194.     return EOK;
  195. }
  196.  
  197. /** Get size of string.
  198.  *
  199.  * Get the number of bytes which are used by the string @a str (excluding the
  200.  * NULL-terminator).
  201.  *
  202.  * @param str String to consider.
  203.  *
  204.  * @return Number of bytes used by the string
  205.  *
  206.  */
  207. size_t str_size(const char *str)
  208. {
  209.     size_t size = 0;
  210.    
  211.     while (*str++ != 0)
  212.         size++;
  213.    
  214.     return size;
  215. }
  216.  
  217. /** Get size of wide string.
  218.  *
  219.  * Get the number of bytes which are used by the wide string @a str (excluding the
  220.  * NULL-terminator).
  221.  *
  222.  * @param str Wide string to consider.
  223.  *
  224.  * @return Number of bytes used by the wide string
  225.  *
  226.  */
  227. size_t wstr_size(const wchar_t *str)
  228. {
  229.     return (wstr_length(str) * sizeof(wchar_t));
  230. }
  231.  
  232. /** Get size of string with length limit.
  233.  *
  234.  * Get the number of bytes which are used by up to @a max_len first
  235.  * characters in the string @a str. If @a max_len is greater than
  236.  * the length of @a str, the entire string is measured (excluding the
  237.  * NULL-terminator).
  238.  *
  239.  * @param str     String to consider.
  240.  * @param max_len Maximum number of characters to measure.
  241.  *
  242.  * @return Number of bytes used by the characters.
  243.  *
  244.  */
  245. size_t str_lsize(const char *str, count_t max_len)
  246. {
  247.     count_t len = 0;
  248.     size_t offset = 0;
  249.    
  250.     while (len < max_len) {
  251.         if (str_decode(str, &offset, STR_NO_LIMIT) == 0)
  252.             break;
  253.        
  254.         len++;
  255.     }
  256.    
  257.     return offset;
  258. }
  259.  
  260. /** Get size of wide string with length limit.
  261.  *
  262.  * Get the number of bytes which are used by up to @a max_len first
  263.  * wide characters in the wide string @a str. If @a max_len is greater than
  264.  * the length of @a str, the entire wide string is measured (excluding the
  265.  * NULL-terminator).
  266.  *
  267.  * @param str     Wide string to consider.
  268.  * @param max_len Maximum number of wide characters to measure.
  269.  *
  270.  * @return Number of bytes used by the wide characters.
  271.  *
  272.  */
  273. size_t wstr_lsize(const wchar_t *str, count_t max_len)
  274. {
  275.     return (wstr_nlength(str, max_len * sizeof(wchar_t)) * sizeof(wchar_t));
  276. }
  277.  
  278. /** Get number of characters in a string.
  279.  *
  280.  * @param str NULL-terminated string.
  281.  *
  282.  * @return Number of characters in string.
  283.  *
  284.  */
  285. count_t str_length(const char *str)
  286. {
  287.     count_t len = 0;
  288.     size_t offset = 0;
  289.    
  290.     while (str_decode(str, &offset, STR_NO_LIMIT) != 0)
  291.         len++;
  292.    
  293.     return len;
  294. }
  295.  
  296. /** Get number of characters in a wide string.
  297.  *
  298.  * @param str NULL-terminated wide string.
  299.  *
  300.  * @return Number of characters in @a str.
  301.  *
  302.  */
  303. count_t wstr_length(const wchar_t *wstr)
  304. {
  305.     count_t len = 0;
  306.    
  307.     while (*wstr++ != 0)
  308.         len++;
  309.    
  310.     return len;
  311. }
  312.  
  313. /** Get number of characters in a string with size limit.
  314.  *
  315.  * @param str  NULL-terminated string.
  316.  * @param size Maximum number of bytes to consider.
  317.  *
  318.  * @return Number of characters in string.
  319.  *
  320.  */
  321. count_t str_nlength(const char *str, size_t size)
  322. {
  323.     count_t len = 0;
  324.     size_t offset = 0;
  325.    
  326.     while (str_decode(str, &offset, size) != 0)
  327.         len++;
  328.    
  329.     return len;
  330. }
  331.  
  332. /** Get number of characters in a string with size limit.
  333.  *
  334.  * @param str  NULL-terminated string.
  335.  * @param size Maximum number of bytes to consider.
  336.  *
  337.  * @return Number of characters in string.
  338.  *
  339.  */
  340. count_t wstr_nlength(const wchar_t *str, size_t size)
  341. {
  342.     count_t len = 0;
  343.     count_t limit = ALIGN_DOWN(size, sizeof(wchar_t));
  344.     count_t offset = 0;
  345.    
  346.     while ((offset < limit) && (*str++ != 0)) {
  347.         len++;
  348.         offset += sizeof(wchar_t);
  349.     }
  350.    
  351.     return len;
  352. }
  353.  
  354. /** Check whether character is plain ASCII.
  355.  *
  356.  * @return True if character is plain ASCII.
  357.  *
  358.  */
  359. bool ascii_check(wchar_t ch)
  360. {
  361.     if ((ch >= 0) && (ch <= 127))
  362.         return true;
  363.    
  364.     return false;
  365. }
  366.  
  367. /** Check whether character is valid
  368.  *
  369.  * @return True if character is a valid Unicode code point.
  370.  *
  371.  */
  372. bool chr_check(wchar_t ch)
  373. {
  374.     if ((ch >= 0) && (ch <= 1114111))
  375.         return true;
  376.    
  377.     return false;
  378. }
  379.  
  380. /** Compare two NULL terminated strings.
  381.  *
  382.  * Do a char-by-char comparison of two NULL-terminated strings.
  383.  * The strings are considered equal iff they consist of the same
  384.  * characters on the minimum of their lengths.
  385.  *
  386.  * @param s1 First string to compare.
  387.  * @param s2 Second string to compare.
  388.  *
  389.  * @return 0 if the strings are equal, -1 if first is smaller,
  390.  *         1 if second smaller.
  391.  *
  392.  */
  393. int str_cmp(const char *s1, const char *s2)
  394. {
  395.     wchar_t c1 = 0;
  396.     wchar_t c2 = 0;
  397.    
  398.     size_t off1 = 0;
  399.     size_t off2 = 0;
  400.  
  401.     while (true) {
  402.         c1 = str_decode(s1, &off1, STR_NO_LIMIT);
  403.         c2 = str_decode(s2, &off2, STR_NO_LIMIT);
  404.  
  405.         if (c1 < c2)
  406.             return -1;
  407.        
  408.         if (c1 > c2)
  409.             return 1;
  410.  
  411.         if (c1 == 0 || c2 == 0)
  412.             break;     
  413.     }
  414.  
  415.     return 0;
  416. }
  417.  
  418. /** Compare two NULL terminated strings with length limit.
  419.  *
  420.  * Do a char-by-char comparison of two NULL-terminated strings.
  421.  * The strings are considered equal iff they consist of the same
  422.  * characters on the minimum of their lengths and the length limit.
  423.  *
  424.  * @param s1      First string to compare.
  425.  * @param s2      Second string to compare.
  426.  * @param max_len Maximum number of characters to consider.
  427.  *
  428.  * @return 0 if the strings are equal, -1 if first is smaller,
  429.  *         1 if second smaller.
  430.  *
  431.  */
  432. int str_lcmp(const char *s1, const char *s2, count_t max_len)
  433. {
  434.     wchar_t c1 = 0;
  435.     wchar_t c2 = 0;
  436.    
  437.     size_t off1 = 0;
  438.     size_t off2 = 0;
  439.    
  440.     count_t len = 0;
  441.  
  442.     while (true) {
  443.         if (len >= max_len)
  444.             break;
  445.  
  446.         c1 = str_decode(s1, &off1, STR_NO_LIMIT);
  447.         c2 = str_decode(s2, &off2, STR_NO_LIMIT);
  448.  
  449.         if (c1 < c2)
  450.             return -1;
  451.  
  452.         if (c1 > c2)
  453.             return 1;
  454.  
  455.         if (c1 == 0 || c2 == 0)
  456.             break;
  457.  
  458.         ++len; 
  459.     }
  460.  
  461.     return 0;
  462.  
  463. }
  464.  
  465. /** Copy string.
  466.  *
  467.  * Copy source string @a src to destination buffer @a dest.
  468.  * No more than @a size bytes are written. If the size of the output buffer
  469.  * is at least one byte, the output string will always be well-formed, i.e.
  470.  * null-terminated and containing only complete characters.
  471.  *
  472.  * @param dst   Destination buffer.
  473.  * @param count Size of the destination buffer.
  474.  * @param src   Source string.
  475.  */
  476. void str_cpy(char *dest, size_t size, const char *src)
  477. {
  478.     wchar_t ch;
  479.     size_t src_off;
  480.     size_t dest_off;
  481.  
  482.     /* No space for the NULL-terminator in the buffer. */
  483.     if (size == 0)
  484.         return;
  485.    
  486.     src_off = 0;
  487.     dest_off = 0;
  488.  
  489.     while ((ch = str_decode(src, &src_off, STR_NO_LIMIT)) != 0) {
  490.         if (chr_encode(ch, dest, &dest_off, size - 1) != EOK)
  491.             break;
  492.     }
  493.  
  494.     dest[dest_off] = '\0';
  495. }
  496.  
  497. /** Copy size-limited substring.
  498.  *
  499.  * Copy source string @a src to destination buffer @a dest.
  500.  * No more than @a size bytes are written. If the size of the output buffer
  501.  * is at least one byte, the output string will always be well-formed, i.e.
  502.  * null-terminated and containing only complete characters.
  503.  *
  504.  * No more than @a n bytes are read from the input string, so it does not
  505.  * have to be null-terminated.
  506.  *
  507.  * @param dst   Destination buffer.
  508.  * @param count Size of the destination buffer.
  509.  * @param src   Source string.
  510.  */
  511. void str_ncpy(char *dest, size_t size, const char *src, size_t n)
  512. {
  513.     wchar_t ch;
  514.     size_t src_off;
  515.     size_t dest_off;
  516.  
  517.     /* No space for the null terminator in the buffer. */
  518.     if (size == 0)
  519.         return;
  520.    
  521.     src_off = 0;
  522.     dest_off = 0;
  523.  
  524.     while ((ch = str_decode(src, &src_off, n)) != 0) {
  525.         if (chr_encode(ch, dest, &dest_off, size - 1) != EOK)
  526.             break;
  527.     }
  528.  
  529.     dest[dest_off] = '\0';
  530. }
  531.  
  532. /** Append one string to another.
  533.  *
  534.  * Append source string @a src to string in destination buffer @a dest.
  535.  * Size of the destination buffer is @a dest. If the size of the output buffer
  536.  * is at least one byte, the output string will always be well-formed, i.e.
  537.  * null-terminated and containing only complete characters.
  538.  *
  539.  * @param dst   Destination buffer.
  540.  * @param count Size of the destination buffer.
  541.  * @param src   Source string.
  542.  */
  543. void str_append(char *dest, size_t size, const char *src)
  544. {
  545.     size_t dstr_size;
  546.  
  547.     dstr_size = str_size(dest);
  548.     str_cpy(dest + dstr_size, size - dstr_size, src);
  549. }
  550.  
  551. /** Copy NULL-terminated wide string to string
  552.  *
  553.  * Copy source wide string @a src to destination buffer @a dst.
  554.  * No more than @a size bytes are written. NULL-terminator is always
  555.  * written after the last succesfully copied character (i.e. if the
  556.  * destination buffer is has at least 1 byte, it will be always
  557.  * NULL-terminated).
  558.  *
  559.  * @param src   Source wide string.
  560.  * @param dst   Destination buffer.
  561.  * @param count Size of the destination buffer.
  562.  *
  563.  */
  564. void wstr_nstr(char *dst, const wchar_t *src, size_t size)
  565. {
  566.     /* No space for the NULL-terminator in the buffer */
  567.     if (size == 0)
  568.         return;
  569.    
  570.     wchar_t ch;
  571.     count_t src_idx = 0;
  572.     size_t dst_off = 0;
  573.    
  574.     while ((ch = src[src_idx++]) != 0) {
  575.         if (chr_encode(ch, dst, &dst_off, size) != EOK)
  576.             break;
  577.     }
  578.    
  579.     if (dst_off >= size)
  580.         dst[size - 1] = 0;
  581.     else
  582.         dst[dst_off] = 0;
  583. }
  584.  
  585. /** Find first occurence of character in string.
  586.  *
  587.  * @param str String to search.
  588.  * @param ch  Character to look for.
  589.  *
  590.  * @return Pointer to character in @a str or NULL if not found.
  591.  */
  592. const char *str_chr(const char *str, wchar_t ch)
  593. {
  594.     wchar_t acc;
  595.     size_t off = 0;
  596.    
  597.     while ((acc = str_decode(str, &off, STR_NO_LIMIT)) != 0) {
  598.         if (acc == ch)
  599.             return (str + off);
  600.     }
  601.    
  602.     return NULL;
  603. }
  604.  
  605. /** Find last occurence of character in string.
  606.  *
  607.  * @param str String to search.
  608.  * @param ch  Character to look for.
  609.  *
  610.  * @return Pointer to character in @a str or NULL if not found.
  611.  */
  612. const char *str_rchr(const char *str, wchar_t ch)
  613. {
  614.     wchar_t acc;
  615.     size_t off = 0;
  616.     char *res;
  617.  
  618.     res = NULL;
  619.     while ((acc = str_decode(str, &off, STR_NO_LIMIT)) != 0) {
  620.         if (acc == ch)
  621.             res = (str + off);
  622.     }
  623.  
  624.     return res;
  625. }
  626.  
  627. /** Insert a wide character into a wide string.
  628.  *
  629.  * Insert a wide character into a wide string at position
  630.  * @a pos. The characters after the position are shifted.
  631.  *
  632.  * @param str     String to insert to.
  633.  * @param ch      Character to insert to.
  634.  * @param pos     Character index where to insert.
  635.  @ @param max_pos Characters in the buffer.
  636.  *
  637.  * @return True if the insertion was sucessful, false if the position
  638.  *         is out of bounds.
  639.  *
  640.  */
  641. bool wstr_linsert(wchar_t *str, wchar_t ch, count_t pos, count_t max_pos)
  642. {
  643.     count_t len = wstr_length(str);
  644.    
  645.     if ((pos > len) || (pos + 1 > max_pos))
  646.         return false;
  647.    
  648.     count_t i;
  649.     for (i = len; i + 1 > pos; i--)
  650.         str[i + 1] = str[i];
  651.    
  652.     str[pos] = ch;
  653.    
  654.     return true;
  655. }
  656.  
  657. /** Remove a wide character from a wide string.
  658.  *
  659.  * Remove a wide character from a wide string at position
  660.  * @a pos. The characters after the position are shifted.
  661.  *
  662.  * @param str String to remove from.
  663.  * @param pos Character index to remove.
  664.  *
  665.  * @return True if the removal was sucessful, false if the position
  666.  *         is out of bounds.
  667.  *
  668.  */
  669. bool wstr_remove(wchar_t *str, count_t pos)
  670. {
  671.     count_t len = wstr_length(str);
  672.    
  673.     if (pos >= len)
  674.         return false;
  675.    
  676.     count_t i;
  677.     for (i = pos + 1; i <= len; i++)
  678.         str[i - 1] = str[i];
  679.    
  680.     return true;
  681. }
  682.  
  683. int stricmp(const char *a, const char *b)
  684. {
  685.     int c = 0;
  686.    
  687.     while (a[c] && b[c] && (!(tolower(a[c]) - tolower(b[c]))))
  688.         c++;
  689.    
  690.     return (tolower(a[c]) - tolower(b[c]));
  691. }
  692.  
  693. /** Convert string to a number.
  694.  * Core of strtol and strtoul functions.
  695.  *
  696.  * @param nptr      Pointer to string.
  697.  * @param endptr    If not NULL, function stores here pointer to the first
  698.  *          invalid character.
  699.  * @param base      Zero or number between 2 and 36 inclusive.
  700.  * @param sgn       It's set to 1 if minus found.
  701.  * @return      Result of conversion.
  702.  */
  703. static unsigned long
  704. _strtoul(const char *nptr, char **endptr, int base, char *sgn)
  705. {
  706.     unsigned char c;
  707.     unsigned long result = 0;
  708.     unsigned long a, b;
  709.     const char *str = nptr;
  710.     const char *tmpptr;
  711.    
  712.     while (isspace(*str))
  713.         str++;
  714.    
  715.     if (*str == '-') {
  716.         *sgn = 1;
  717.         ++str;
  718.     } else if (*str == '+')
  719.         ++str;
  720.    
  721.     if (base) {
  722.         if ((base == 1) || (base > 36)) {
  723.             /* FIXME: set errno to EINVAL */
  724.             return 0;
  725.         }
  726.         if ((base == 16) && (*str == '0') && ((str[1] == 'x') ||
  727.             (str[1] == 'X'))) {
  728.             str += 2;
  729.         }
  730.     } else {
  731.         base = 10;
  732.        
  733.         if (*str == '0') {
  734.             base = 8;
  735.             if ((str[1] == 'X') || (str[1] == 'x'))  {
  736.                 base = 16;
  737.                 str += 2;
  738.             }
  739.         }
  740.     }
  741.    
  742.     tmpptr = str;
  743.  
  744.     while (*str) {
  745.         c = *str;
  746.         c = (c >= 'a' ? c - 'a' + 10 : (c >= 'A' ? c - 'A' + 10 :
  747.             (c <= '9' ? c - '0' : 0xff)));
  748.         if (c > base) {
  749.             break;
  750.         }
  751.        
  752.         a = (result & 0xff) * base + c;
  753.         b = (result >> 8) * base + (a >> 8);
  754.        
  755.         if (b > (ULONG_MAX >> 8)) {
  756.             /* overflow */
  757.             /* FIXME: errno = ERANGE*/
  758.             return ULONG_MAX;
  759.         }
  760.    
  761.         result = (b << 8) + (a & 0xff);
  762.         ++str;
  763.     }
  764.    
  765.     if (str == tmpptr) {
  766.         /*
  767.          * No number was found => first invalid character is the first
  768.          * character of the string.
  769.          */
  770.         /* FIXME: set errno to EINVAL */
  771.         str = nptr;
  772.         result = 0;
  773.     }
  774.    
  775.     if (endptr)
  776.         *endptr = (char *) str;
  777.  
  778.     if (nptr == str) {
  779.         /*FIXME: errno = EINVAL*/
  780.         return 0;
  781.     }
  782.  
  783.     return result;
  784. }
  785.  
  786. /** Convert initial part of string to long int according to given base.
  787.  * The number may begin with an arbitrary number of whitespaces followed by
  788.  * optional sign (`+' or `-'). If the base is 0 or 16, the prefix `0x' may be
  789.  * inserted and the number will be taken as hexadecimal one. If the base is 0
  790.  * and the number begin with a zero, number will be taken as octal one (as with
  791.  * base 8). Otherwise the base 0 is taken as decimal.
  792.  *
  793.  * @param nptr      Pointer to string.
  794.  * @param endptr    If not NULL, function stores here pointer to the first
  795.  *          invalid character.
  796.  * @param base      Zero or number between 2 and 36 inclusive.
  797.  * @return      Result of conversion.
  798.  */
  799. long int strtol(const char *nptr, char **endptr, int base)
  800. {
  801.     char sgn = 0;
  802.     unsigned long number = 0;
  803.    
  804.     number = _strtoul(nptr, endptr, base, &sgn);
  805.  
  806.     if (number > LONG_MAX) {
  807.         if ((sgn) && (number == (unsigned long) (LONG_MAX) + 1)) {
  808.             /* FIXME: set 0 to errno */
  809.             return number;     
  810.         }
  811.         /* FIXME: set ERANGE to errno */
  812.         return (sgn ? LONG_MIN : LONG_MAX);
  813.     }
  814.    
  815.     return (sgn ? -number : number);
  816. }
  817.  
  818.  
  819. /** Convert initial part of string to unsigned long according to given base.
  820.  * The number may begin with an arbitrary number of whitespaces followed by
  821.  * optional sign (`+' or `-'). If the base is 0 or 16, the prefix `0x' may be
  822.  * inserted and the number will be taken as hexadecimal one. If the base is 0
  823.  * and the number begin with a zero, number will be taken as octal one (as with
  824.  * base 8). Otherwise the base 0 is taken as decimal.
  825.  *
  826.  * @param nptr      Pointer to string.
  827.  * @param endptr    If not NULL, function stores here pointer to the first
  828.  *          invalid character
  829.  * @param base      Zero or number between 2 and 36 inclusive.
  830.  * @return      Result of conversion.
  831.  */
  832. unsigned long strtoul(const char *nptr, char **endptr, int base)
  833. {
  834.     char sgn = 0;
  835.     unsigned long number = 0;
  836.    
  837.     number = _strtoul(nptr, endptr, base, &sgn);
  838.  
  839.     return (sgn ? -number : number);
  840. }
  841.  
  842. char *str_dup(const char *src)
  843. {
  844.     size_t size = str_size(src);
  845.     void *dest = malloc(size + 1);
  846.  
  847.     if (dest == NULL)
  848.         return (char *) NULL;
  849.  
  850.     return (char *) memcpy(dest, src, size + 1);
  851. }
  852.  
  853. char *strtok(char *s, const char *delim)
  854. {
  855.     static char *next;
  856.  
  857.     return strtok_r(s, delim, &next);
  858. }
  859.  
  860. char *strtok_r(char *s, const char *delim, char **next)
  861. {
  862.     char *start, *end;
  863.  
  864.     if (s == NULL)
  865.         s = *next;
  866.  
  867.     /* Skip over leading delimiters. */
  868.     while (*s && (str_chr(delim, *s) != NULL)) ++s;
  869.     start = s;
  870.  
  871.     /* Skip over token characters. */
  872.     while (*s && (str_chr(delim, *s) == NULL)) ++s;
  873.     end = s;
  874.     *next = (*s ? s + 1 : s);
  875.  
  876.     if (start == end) {
  877.         return NULL;    /* No more tokens. */
  878.     }
  879.  
  880.     /* Overwrite delimiter with NULL terminator. */
  881.     *end = '\0';
  882.     return start;
  883. }
  884.  
  885. /** @}
  886.  */
  887.