1 /* 2 * Copyright 2010 Nexenta Systems, Inc. All rights reserved. 3 * Copyright (c) 1995 Alex Tatmanjants <alex@elvisti.kiev.ua> 4 * at Electronni Visti IA, Kiev, Ukraine. 5 * All rights reserved. 6 * 7 * Copyright (c) 2011 The FreeBSD Foundation 8 * All rights reserved. 9 * Portions of this software were developed by David Chisnall 10 * under sponsorship from the FreeBSD Foundation. 11 * 12 * Redistribution and use in source and binary forms, with or without 13 * modification, are permitted provided that the following conditions 14 * are met: 15 * 1. Redistributions of source code must retain the above copyright 16 * notice, this list of conditions and the following disclaimer. 17 * 2. Redistributions in binary form must reproduce the above copyright 18 * notice, this list of conditions and the following disclaimer in the 19 * documentation and/or other materials provided with the distribution. 20 * 21 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND 22 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 23 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 24 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE 25 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 26 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 27 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 28 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 29 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 30 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 31 * SUCH DAMAGE. 32 */ 33 34 #include <stdlib.h> 35 #include <string.h> 36 #include <errno.h> 37 #include <wchar.h> 38 #include "collate.h" 39 40 41 /* 42 * In order to properly handle multibyte locales, its easiet to just 43 * convert to wide characters and then use wcscoll. However if an 44 * error occurs, we gracefully fall back to simple strcmp. Caller 45 * should check errno. 46 */ 47 int 48 strcoll_l(const char *s, const char *s2, locale_t locale) 49 { 50 int ret; 51 wchar_t *t1 = NULL, *t2 = NULL; 52 wchar_t *w1 = NULL, *w2 = NULL; 53 const char *cs1, *cs2; 54 mbstate_t mbs1 = { 0 }; 55 mbstate_t mbs2 = { 0 }; 56 size_t sz1, sz2; 57 58 /* 59 * The mbsrtowcs_l function can set the src pointer to null upon 60 * failure, so it should act on a copy to avoid: 61 * - sending null pointer to strcmp 62 * - having strcoll/strcoll_l change *s or *s2 to null 63 */ 64 cs1 = s; 65 cs2 = s2; 66 67 FIX_LOCALE(locale); 68 struct xlocale_collate *table = 69 (struct xlocale_collate*)locale->components[XLC_COLLATE]; 70 71 if (table->__collate_load_error) 72 goto error; 73 74 sz1 = strlen(s) + 1; 75 sz2 = strlen(s2) + 1; 76 77 /* 78 * Simple assumption: conversion to wide format is strictly 79 * reducing, i.e. a single byte (or multibyte character) 80 * cannot result in multiple wide characters. 81 */ 82 if ((t1 = malloc(sz1 * sizeof (wchar_t))) == NULL) 83 goto error; 84 w1 = t1; 85 if ((t2 = malloc(sz2 * sizeof (wchar_t))) == NULL) 86 goto error; 87 w2 = t2; 88 89 if ((mbsrtowcs_l(w1, &cs1, sz1, &mbs1, locale)) == (size_t)-1) 90 goto error; 91 92 if ((mbsrtowcs_l(w2, &cs2, sz2, &mbs2, locale)) == (size_t)-1) 93 goto error; 94 95 ret = wcscoll_l(w1, w2, locale); 96 if (t1) 97 free(t1); 98 if (t2) 99 free(t2); 100 101 return (ret); 102 103 error: 104 if (t1) 105 free(t1); 106 if (t2) 107 free(t2); 108 return (strcmp(s, s2)); 109 } 110 111 int 112 strcoll(const char *s, const char *s2) 113 { 114 return strcoll_l(s, s2, __get_locale()); 115 } 116 117