1 /* Copyright (C) 2000-2012 by George Williams */
2 /*
3  * Redistribution and use in source and binary forms, with or without
4  * modification, are permitted provided that the following conditions are met:
5 
6  * Redistributions of source code must retain the above copyright notice, this
7  * list of conditions and the following disclaimer.
8 
9  * Redistributions in binary form must reproduce the above copyright notice,
10  * this list of conditions and the following disclaimer in the documentation
11  * and/or other materials provided with the distribution.
12 
13  * The name of the author may not be used to endorse or promote products
14  * derived from this software without specific prior written permission.
15 
16  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED
17  * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
18  * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO
19  * EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
20  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
21  * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
22  * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
23  * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
24  * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
25  * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26  */
27 #ifndef _UCHAR_H
28 # define _UCHAR_H
29 #include <unibasics.h>
30 #include <stdarg.h>
31 #include <string.h>
32 #include <memory.h>
33 #include <charset.h>
34 
35 extern unichar_t *u_copy(const unichar_t*);
36 extern unichar_t *u_copyn(const unichar_t*, long);
37 extern unichar_t *u_copynallocm(const unichar_t *pt, long n, long m);
38 extern unichar_t *uc_copyn(const char *, int);
39 extern unichar_t *uc_copy(const char*);
40 extern unichar_t *u_concat(const unichar_t*,const unichar_t*);
41 extern char      *cu_copyn(const unichar_t *pt,int len);
42 extern char      *cu_copy(const unichar_t*);
43 
44 extern long uc_strcmp(const unichar_t *,const char *);
45 extern long u_strcmp(const unichar_t *, const unichar_t *);
46 extern long uc_strncmp(const unichar_t *,const char *,int);
47 extern long u_strncmp(const unichar_t *, const unichar_t *,int);
48 extern long uc_strmatch(const unichar_t *,const char *);
49 extern long uc_strnmatch(const unichar_t *,const char *,int);
50 extern long u_strnmatch(const unichar_t *str1, const unichar_t *str2, int len);
51 extern long u_strmatch(const unichar_t *, const unichar_t *);
52 extern int    strmatch(const char *,const char *);
53 extern int    strnmatch(const char *str1, const char *str2, int n);
54 extern void uc_strcpy(unichar_t *, const char *);
55 extern void cu_strcpy(char *, const unichar_t *);
56 extern void u_strcpy(unichar_t *, const unichar_t *);
57 extern void u_strncpy(unichar_t *, const unichar_t *,int);
58 extern void cu_strncpy(char *to, const unichar_t *from, int len);
59 extern void uc_strncpy(unichar_t *to, const char *from, int len);
60 extern void uc_strcat(unichar_t *, const char *);
61 extern void uc_strncat(unichar_t *, const char *,int len);
62 extern void cu_strcat(char *, const unichar_t *);
63 extern void cu_strncat(char *, const unichar_t *,int len);
64 extern void u_strcat(unichar_t *, const unichar_t *);
65 extern void u_strncat(unichar_t *, const unichar_t *, int len);
66 extern int  u_strlen(const unichar_t *);
67 extern unichar_t *u_strchr(const unichar_t *,unichar_t);
68 extern unichar_t *u_strrchr(const unichar_t *,unichar_t);
69 extern unichar_t *uc_strstr(const unichar_t *,const char *);
70 extern unichar_t *u_strstr(const unichar_t *,const unichar_t *);
71 extern unichar_t *uc_strstrmatch(const unichar_t *,const char *);
72 extern unichar_t *u_strstrmatch(const unichar_t *,const unichar_t *);
73 extern char      *  strstrmatch(const char *,const char *);
74 
75 extern char *u_to_c(const unichar_t *);
76 extern unichar_t *c_to_u(const char *);
77 
78 extern unsigned long u_strtoul(const unichar_t *,unichar_t **,int);
79 extern long   u_strtol(const unichar_t *,unichar_t **,int);
80 extern double u_strtod(const unichar_t *,unichar_t **);
81 
82 extern char *strstart(const char *initial,const char *full);
83 extern char *strstartmatch(const char *initial,const char *full);
84 extern unichar_t *u_strstartmatch(const unichar_t *initial, const unichar_t *full);
85 extern unichar_t *cu_strstartmatch(const char *initial, const unichar_t *full);
86 
87 #define utf82u_strncpy utf82U_strncpy
88 extern int32 utf8_ildb(const char **utf8_text);
89 extern char *utf8_idpb(char *utf8_text,uint32 ch);
90 extern char *utf8_db(char *utf8_text);
91 extern char *utf8_ib(char *utf8_text);
92 extern int utf8_valid(const char *str);
93 extern void utf8_truncatevalid(char *str);
94 extern char *latin1_2_utf8_strcpy(char *utf8buf,const char *lbuf);
95 extern char *latin1_2_utf8_copy(const char *lbuf);
96 extern char *utf8_2_latin1_copy(const char *utf8buf);
97 extern int utf8_strlen(const char *utf8_str); /* how many characters in the string */
98 extern int utf82u_strlen(const char *utf8_str); /* how many long would this be in shorts (UCS2) */
99 extern void utf8_strncpy(register char *to, const char *from, int len); /* copy n characters NOT bytes */
100 extern char *def2utf8_copy(const char *from);
101 extern char *utf82def_copy(const char *ufrom);
102 extern char *utf8_strchr(const char *utf8_str, int search_char);
103 
104 extern unichar_t *utf82u_strncpy(unichar_t *ubuf,const char *utf8buf,int len);
105 extern unichar_t *utf82u_strcpy(unichar_t *ubuf,const char *utf8buf);
106 extern void       utf82u_strcat(unichar_t *ubuf,const char *utf8buf);
107 extern unichar_t *utf82u_copyn(const char *utf8buf,int len);
108 extern unichar_t *utf82u_copy(const char *utf8buf);
109 extern char *u2utf8_strcpy(char *utf8buf,const unichar_t *ubuf);
110 extern char *u2utf8_copy(const unichar_t *ubuf);
111 extern char *u2utf8_copyn(const unichar_t *ubuf,int len);
112 extern unichar_t *encoding2u_strncpy(unichar_t *uto, const char *from, int n, enum encoding cs);
113 extern char *u2encoding_strncpy(char *to, const unichar_t *ufrom, int n, enum encoding cs);
114 extern unichar_t *def2u_strncpy(unichar_t *uto, const char *from, int n);
115 extern char *u2def_strncpy(char *to, const unichar_t *ufrom, int n);
116 extern unichar_t *def2u_copy(const char *from);
117 extern char *u2def_copy(const unichar_t *ufrom);
118 
119 extern int u_sprintf(unichar_t *str, const unichar_t *format, ... );
120 extern int u_snprintf(unichar_t *str, int len, const unichar_t *format, ... );
121 extern int u_vsnprintf(unichar_t *str, int len, const unichar_t *format, va_list ap );
122 
123 extern int uAllAscii(const unichar_t *str);
124 extern int AllAscii(const char *);
125 extern char *StripToASCII(const char *utf8_str);
126 
127 extern char *copytolower(const char *);
128 extern int endswith(const char *haystack,const char *needle);
129 extern int endswithi(const char *haystack,const char *needle);
130 extern int endswithi_partialExtension( const char *haystack,const char *needle);
131 
132 /**
133  * Remove trailing \n or \r from the given string. No memory
134  * allocations are performed, null is injected over these terminators
135  * to trim the string.
136  *
137  * This function is designed to be impotent if called with a string
138  * that does not end with \n or \r. ie, you don't need to redundantly
139  * check if there is a newline at the end of string and not call here
140  * if there is no newline. You can just call here with any string and
141  * be assured that afterwards there will be no trailing newline or
142  * carrage return character found at the end of the string pointed to
143  * by 'p'.
144  */
145 extern char* chomp( char* p );
146 
147 /**
148  * Return true if the haystack plain string ends with the string
149  * needle. Return 0 otherwise.
150  *
151  * Needles which are larger than the haystack are handled.
152  *
153  * No new strings are allocated, freed, or returned.
154  */
155 int endswith(const char *haystack,const char *needle);
156 
157 /**
158  * Return true if the haystack unicode string ends with the string needle.
159  * Return 0 otherwise.
160  *
161  * Needles which are larger than the haystack are handled.
162  *
163  * No new strings are allocated, freed, or returned.
164  */
165 extern int u_endswith(const unichar_t *haystack,const unichar_t *needle);
166 
167 #endif
168