1 /* 2 * String Table Functions 3 * 4 * Copyright 2002-2004, Mike McCormack for CodeWeavers 5 * Copyright 2007 Robert Shearman for CodeWeavers 6 * Copyright 2010 Hans Leidekker for CodeWeavers 7 * 8 * This library is free software; you can redistribute it and/or 9 * modify it under the terms of the GNU Lesser General Public 10 * License as published by the Free Software Foundation; either 11 * version 2.1 of the License, or (at your option) any later version. 12 * 13 * This library is distributed in the hope that it will be useful, 14 * but WITHOUT ANY WARRANTY; without even the implied warranty of 15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 16 * Lesser General Public License for more details. 17 * 18 * You should have received a copy of the GNU Lesser General Public 19 * License along with this library; if not, write to the Free Software 20 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA 21 */ 22 23 #define COBJMACROS 24 25 #include <stdarg.h> 26 #include <assert.h> 27 28 #include "windef.h" 29 #include "winbase.h" 30 #include "winerror.h" 31 #include "wine/debug.h" 32 #include "msi.h" 33 #include "msiquery.h" 34 #include "objbase.h" 35 #include "objidl.h" 36 #include "msipriv.h" 37 #include "winnls.h" 38 39 #include "query.h" 40 41 WINE_DEFAULT_DEBUG_CHANNEL(msidb); 42 43 struct msistring 44 { 45 USHORT persistent_refcount; 46 USHORT nonpersistent_refcount; 47 WCHAR *data; 48 int len; 49 }; 50 51 struct string_table 52 { 53 UINT maxcount; /* the number of strings */ 54 UINT freeslot; 55 UINT codepage; 56 UINT sortcount; 57 struct msistring *strings; /* an array of strings */ 58 UINT *sorted; /* index */ 59 }; 60 61 static BOOL validate_codepage( UINT codepage ) 62 { 63 if (codepage != CP_ACP && !IsValidCodePage( codepage )) 64 { 65 WARN("invalid codepage %u\n", codepage); 66 return FALSE; 67 } 68 return TRUE; 69 } 70 71 static string_table *init_stringtable( int entries, UINT codepage ) 72 { 73 string_table *st; 74 75 if (!validate_codepage( codepage )) 76 return NULL; 77 78 st = malloc( sizeof(string_table) ); 79 if( !st ) 80 return NULL; 81 if( entries < 1 ) 82 entries = 1; 83 84 st->strings = calloc( entries, sizeof(struct msistring) ); 85 if( !st->strings ) 86 { 87 free( st ); 88 return NULL; 89 } 90 91 st->sorted = malloc( sizeof(UINT) * entries ); 92 if( !st->sorted ) 93 { 94 free( st->strings ); 95 free( st ); 96 return NULL; 97 } 98 99 st->maxcount = entries; 100 st->freeslot = 1; 101 st->codepage = codepage; 102 st->sortcount = 0; 103 104 return st; 105 } 106 107 VOID msi_destroy_stringtable( string_table *st ) 108 { 109 UINT i; 110 111 for( i=0; i<st->maxcount; i++ ) 112 { 113 if( st->strings[i].persistent_refcount || 114 st->strings[i].nonpersistent_refcount ) 115 free( st->strings[i].data ); 116 } 117 free( st->strings ); 118 free( st->sorted ); 119 free( st ); 120 } 121 122 static int st_find_free_entry( string_table *st ) 123 { 124 UINT i, sz, *s; 125 struct msistring *p; 126 127 TRACE("%p\n", st); 128 129 if( st->freeslot ) 130 { 131 for( i = st->freeslot; i < st->maxcount; i++ ) 132 if( !st->strings[i].persistent_refcount && 133 !st->strings[i].nonpersistent_refcount ) 134 return i; 135 } 136 for( i = 1; i < st->maxcount; i++ ) 137 if( !st->strings[i].persistent_refcount && 138 !st->strings[i].nonpersistent_refcount ) 139 return i; 140 141 /* dynamically resize */ 142 sz = st->maxcount + 1 + st->maxcount / 2; 143 if (!(p = realloc( st->strings, sz * sizeof(*p) ))) return -1; 144 memset( p + st->maxcount, 0, (sz - st->maxcount) * sizeof(*p) ); 145 146 if (!(s = realloc( st->sorted, sz * sizeof(*s) ))) 147 { 148 free( p ); 149 return -1; 150 } 151 152 st->strings = p; 153 st->sorted = s; 154 155 st->freeslot = st->maxcount; 156 st->maxcount = sz; 157 if( st->strings[st->freeslot].persistent_refcount || 158 st->strings[st->freeslot].nonpersistent_refcount ) 159 ERR("oops. expected freeslot to be free...\n"); 160 return st->freeslot; 161 } 162 163 static inline int cmp_string( const WCHAR *str1, int len1, const WCHAR *str2, int len2 ) 164 { 165 if (len1 < len2) return -1; 166 else if (len1 > len2) return 1; 167 while (len1) 168 { 169 if (*str1 == *str2) { str1++; str2++; } 170 else return *str1 - *str2; 171 len1--; 172 } 173 return 0; 174 } 175 176 static int find_insert_index( const string_table *st, UINT string_id ) 177 { 178 int i, c, low = 0, high = st->sortcount - 1; 179 180 while (low <= high) 181 { 182 i = (low + high) / 2; 183 c = cmp_string( st->strings[string_id].data, st->strings[string_id].len, 184 st->strings[st->sorted[i]].data, st->strings[st->sorted[i]].len ); 185 if (c < 0) 186 high = i - 1; 187 else if (c > 0) 188 low = i + 1; 189 else 190 return -1; /* already exists */ 191 } 192 return high + 1; 193 } 194 195 static void insert_string_sorted( string_table *st, UINT string_id ) 196 { 197 int i; 198 199 i = find_insert_index( st, string_id ); 200 if (i == -1) 201 return; 202 203 memmove( &st->sorted[i] + 1, &st->sorted[i], (st->sortcount - i) * sizeof(UINT) ); 204 st->sorted[i] = string_id; 205 st->sortcount++; 206 } 207 208 static void set_st_entry( string_table *st, UINT n, WCHAR *str, int len, USHORT refcount, 209 BOOL persistent ) 210 { 211 if (persistent) 212 { 213 st->strings[n].persistent_refcount = refcount; 214 st->strings[n].nonpersistent_refcount = 0; 215 } 216 else 217 { 218 st->strings[n].persistent_refcount = 0; 219 st->strings[n].nonpersistent_refcount = refcount; 220 } 221 222 st->strings[n].data = str; 223 st->strings[n].len = len; 224 225 insert_string_sorted( st, n ); 226 227 if( n < st->maxcount ) 228 st->freeslot = n + 1; 229 } 230 231 static UINT string2id( const string_table *st, const char *buffer, UINT *id ) 232 { 233 int sz; 234 UINT r = ERROR_INVALID_PARAMETER; 235 LPWSTR str; 236 237 TRACE("Finding string %s in string table\n", debugstr_a(buffer) ); 238 239 if( buffer[0] == 0 ) 240 { 241 *id = 0; 242 return ERROR_SUCCESS; 243 } 244 245 if (!(sz = MultiByteToWideChar( st->codepage, 0, buffer, -1, NULL, 0 ))) 246 return r; 247 str = malloc( sz * sizeof(WCHAR) ); 248 if( !str ) 249 return ERROR_NOT_ENOUGH_MEMORY; 250 MultiByteToWideChar( st->codepage, 0, buffer, -1, str, sz ); 251 252 r = msi_string2id( st, str, sz - 1, id ); 253 free( str ); 254 return r; 255 } 256 257 static int add_string( string_table *st, UINT n, const char *data, UINT len, USHORT refcount, BOOL persistent ) 258 { 259 LPWSTR str; 260 int sz; 261 262 if( !data || !len ) 263 return 0; 264 if( n > 0 ) 265 { 266 if( st->strings[n].persistent_refcount || 267 st->strings[n].nonpersistent_refcount ) 268 return -1; 269 } 270 else 271 { 272 if (string2id( st, data, &n ) == ERROR_SUCCESS) 273 { 274 if (persistent) 275 st->strings[n].persistent_refcount += refcount; 276 else 277 st->strings[n].nonpersistent_refcount += refcount; 278 return n; 279 } 280 n = st_find_free_entry( st ); 281 if( n == -1 ) 282 return -1; 283 } 284 285 if( n < 1 ) 286 { 287 ERR("invalid index adding %s (%d)\n", debugstr_a( data ), n ); 288 return -1; 289 } 290 291 /* allocate a new string */ 292 sz = MultiByteToWideChar( st->codepage, 0, data, len, NULL, 0 ); 293 str = malloc( (sz + 1) * sizeof(WCHAR) ); 294 if( !str ) 295 return -1; 296 MultiByteToWideChar( st->codepage, 0, data, len, str, sz ); 297 str[sz] = 0; 298 299 set_st_entry( st, n, str, sz, refcount, persistent ); 300 return n; 301 } 302 303 int msi_add_string( string_table *st, const WCHAR *data, int len, BOOL persistent ) 304 { 305 UINT n; 306 LPWSTR str; 307 308 if( !data ) 309 return 0; 310 311 if (len < 0) len = lstrlenW( data ); 312 313 if( !data[0] && !len ) 314 return 0; 315 316 if (msi_string2id( st, data, len, &n) == ERROR_SUCCESS ) 317 { 318 if (persistent) 319 st->strings[n].persistent_refcount++; 320 else 321 st->strings[n].nonpersistent_refcount++; 322 return n; 323 } 324 325 n = st_find_free_entry( st ); 326 if( n == -1 ) 327 return -1; 328 329 /* allocate a new string */ 330 TRACE( "%s, n = %d len = %d\n", debugstr_wn(data, len), n, len ); 331 332 str = malloc( (len + 1) * sizeof(WCHAR) ); 333 if( !str ) 334 return -1; 335 memcpy( str, data, len*sizeof(WCHAR) ); 336 str[len] = 0; 337 338 set_st_entry( st, n, str, len, 1, persistent ); 339 return n; 340 } 341 342 /* find the string identified by an id - return null if there's none */ 343 const WCHAR *msi_string_lookup( const string_table *st, UINT id, int *len ) 344 { 345 if( id == 0 ) 346 { 347 if (len) *len = 0; 348 return L""; 349 } 350 if( id >= st->maxcount ) 351 return NULL; 352 353 if( id && !st->strings[id].persistent_refcount && !st->strings[id].nonpersistent_refcount) 354 return NULL; 355 356 if (len) *len = st->strings[id].len; 357 358 return st->strings[id].data; 359 } 360 361 /* 362 * id2string 363 * 364 * [in] st - pointer to the string table 365 * [in] id - id of the string to retrieve 366 * [out] buffer - destination of the UTF8 string 367 * [in/out] sz - number of bytes available in the buffer on input 368 * number of bytes used on output 369 * 370 * Returned string is not nul terminated. 371 */ 372 static UINT id2string( const string_table *st, UINT id, char *buffer, UINT *sz ) 373 { 374 int len, lenW; 375 const WCHAR *str; 376 377 TRACE("Finding string %d of %d\n", id, st->maxcount); 378 379 str = msi_string_lookup( st, id, &lenW ); 380 if( !str ) 381 return ERROR_FUNCTION_FAILED; 382 383 len = WideCharToMultiByte( st->codepage, 0, str, lenW, NULL, 0, NULL, NULL ); 384 if( *sz < len ) 385 { 386 *sz = len; 387 return ERROR_MORE_DATA; 388 } 389 *sz = WideCharToMultiByte( st->codepage, 0, str, lenW, buffer, *sz, NULL, NULL ); 390 return ERROR_SUCCESS; 391 } 392 393 /* 394 * msi_string2id 395 * 396 * [in] st - pointer to the string table 397 * [in] str - string to find in the string table 398 * [out] id - id of the string, if found 399 */ 400 UINT msi_string2id( const string_table *st, const WCHAR *str, int len, UINT *id ) 401 { 402 int i, c, low = 0, high = st->sortcount - 1; 403 404 if (len < 0) len = lstrlenW( str ); 405 406 while (low <= high) 407 { 408 i = (low + high) / 2; 409 c = cmp_string( str, len, st->strings[st->sorted[i]].data, st->strings[st->sorted[i]].len ); 410 411 if (c < 0) 412 high = i - 1; 413 else if (c > 0) 414 low = i + 1; 415 else 416 { 417 *id = st->sorted[i]; 418 return ERROR_SUCCESS; 419 } 420 } 421 return ERROR_INVALID_PARAMETER; 422 } 423 424 static void string_totalsize( const string_table *st, UINT *datasize, UINT *poolsize ) 425 { 426 UINT i, len, holesize; 427 428 if( st->strings[0].data || st->strings[0].persistent_refcount || st->strings[0].nonpersistent_refcount) 429 ERR("oops. element 0 has a string\n"); 430 431 *poolsize = 4; 432 *datasize = 0; 433 holesize = 0; 434 for( i=1; i<st->maxcount; i++ ) 435 { 436 if( !st->strings[i].persistent_refcount ) 437 { 438 TRACE("[%u] nonpersistent = %s\n", i, debugstr_wn(st->strings[i].data, st->strings[i].len)); 439 (*poolsize) += 4; 440 } 441 else if( st->strings[i].data ) 442 { 443 TRACE("[%u] = %s\n", i, debugstr_wn(st->strings[i].data, st->strings[i].len)); 444 len = WideCharToMultiByte( st->codepage, 0, st->strings[i].data, st->strings[i].len + 1, 445 NULL, 0, NULL, NULL); 446 if( len ) 447 len--; 448 (*datasize) += len; 449 if (len>0xffff) 450 (*poolsize) += 4; 451 (*poolsize) += holesize + 4; 452 holesize = 0; 453 } 454 else 455 holesize += 4; 456 } 457 TRACE("data %u pool %u codepage %x\n", *datasize, *poolsize, st->codepage ); 458 } 459 460 HRESULT msi_init_string_table( IStorage *stg ) 461 { 462 USHORT zero[2] = { 0, 0 }; 463 UINT ret; 464 465 /* create the StringPool stream... add the zero string to it*/ 466 ret = write_stream_data(stg, L"_StringPool", zero, sizeof zero, TRUE); 467 if (ret != ERROR_SUCCESS) 468 return E_FAIL; 469 470 /* create the StringData stream... make it zero length */ 471 ret = write_stream_data(stg, L"_StringData", NULL, 0, TRUE); 472 if (ret != ERROR_SUCCESS) 473 return E_FAIL; 474 475 return S_OK; 476 } 477 478 string_table *msi_load_string_table( IStorage *stg, UINT *bytes_per_strref ) 479 { 480 string_table *st = NULL; 481 CHAR *data = NULL; 482 USHORT *pool = NULL; 483 UINT r, datasize = 0, poolsize = 0, codepage; 484 DWORD i, count, offset, len, n, refs; 485 486 r = read_stream_data( stg, L"_StringPool", TRUE, (BYTE **)&pool, &poolsize ); 487 if( r != ERROR_SUCCESS) 488 goto end; 489 r = read_stream_data( stg, L"_StringData", TRUE, (BYTE **)&data, &datasize ); 490 if( r != ERROR_SUCCESS) 491 goto end; 492 493 if ( (poolsize > 4) && (pool[1] & 0x8000) ) 494 *bytes_per_strref = LONG_STR_BYTES; 495 else 496 *bytes_per_strref = sizeof(USHORT); 497 498 count = poolsize/4; 499 if( poolsize > 4 ) 500 codepage = pool[0] | ( (pool[1] & ~0x8000) << 16 ); 501 else 502 codepage = CP_ACP; 503 st = init_stringtable( count, codepage ); 504 if (!st) 505 goto end; 506 507 offset = 0; 508 n = 1; 509 i = 1; 510 while( i<count ) 511 { 512 /* the string reference count is always the second word */ 513 refs = pool[i*2+1]; 514 515 /* empty entries have two zeros, still have a string id */ 516 if (pool[i*2] == 0 && refs == 0) 517 { 518 i++; 519 n++; 520 continue; 521 } 522 523 /* 524 * If a string is over 64k, the previous string entry is made null 525 * and its the high word of the length is inserted in the null string's 526 * reference count field. 527 */ 528 if( pool[i*2] == 0) 529 { 530 len = (pool[i*2+3] << 16) + pool[i*2+2]; 531 i += 2; 532 } 533 else 534 { 535 len = pool[i*2]; 536 i += 1; 537 } 538 539 if ( (offset + len) > datasize ) 540 { 541 ERR("string table corrupt?\n"); 542 break; 543 } 544 545 r = add_string( st, n, data+offset, len, refs, TRUE ); 546 if( r != n ) 547 ERR( "Failed to add string %lu\n", n ); 548 n++; 549 offset += len; 550 } 551 552 if ( datasize != offset ) 553 ERR( "string table load failed! (%u != %lu), please report\n", datasize, offset ); 554 555 TRACE( "loaded %lu strings\n", count ); 556 557 end: 558 free( pool ); 559 free( data ); 560 561 return st; 562 } 563 564 UINT msi_save_string_table( const string_table *st, IStorage *storage, UINT *bytes_per_strref ) 565 { 566 UINT i, datasize = 0, poolsize = 0, sz, used, r, codepage, n; 567 UINT ret = ERROR_FUNCTION_FAILED; 568 CHAR *data = NULL; 569 USHORT *pool = NULL; 570 571 TRACE("\n"); 572 573 /* construct the new table in memory first */ 574 string_totalsize( st, &datasize, &poolsize ); 575 576 TRACE("%u %u %u\n", st->maxcount, datasize, poolsize ); 577 578 pool = malloc( poolsize ); 579 if( ! pool ) 580 { 581 WARN("Failed to alloc pool %d bytes\n", poolsize ); 582 goto err; 583 } 584 data = malloc( datasize ); 585 if( ! data ) 586 { 587 WARN("Failed to alloc data %d bytes\n", datasize ); 588 goto err; 589 } 590 591 used = 0; 592 codepage = st->codepage; 593 pool[0] = codepage & 0xffff; 594 pool[1] = codepage >> 16; 595 if (st->maxcount > 0xffff) 596 { 597 pool[1] |= 0x8000; 598 *bytes_per_strref = LONG_STR_BYTES; 599 } 600 else 601 *bytes_per_strref = sizeof(USHORT); 602 603 n = 1; 604 for( i=1; i<st->maxcount; i++ ) 605 { 606 if( !st->strings[i].persistent_refcount ) 607 { 608 pool[ n*2 ] = 0; 609 pool[ n*2 + 1] = 0; 610 n++; 611 continue; 612 } 613 614 sz = datasize - used; 615 r = id2string( st, i, data+used, &sz ); 616 if( r != ERROR_SUCCESS ) 617 { 618 ERR("failed to fetch string\n"); 619 sz = 0; 620 } 621 622 if (sz) 623 pool[ n*2 + 1 ] = st->strings[i].persistent_refcount; 624 else 625 pool[ n*2 + 1 ] = 0; 626 if (sz < 0x10000) 627 { 628 pool[ n*2 ] = sz; 629 n++; 630 } 631 else 632 { 633 pool[ n*2 ] = 0; 634 pool[ n*2 + 2 ] = sz&0xffff; 635 pool[ n*2 + 3 ] = (sz>>16); 636 n += 2; 637 } 638 used += sz; 639 if( used > datasize ) 640 { 641 ERR("oops overran %d >= %d\n", used, datasize); 642 goto err; 643 } 644 } 645 646 if( used != datasize ) 647 { 648 ERR("oops used %d != datasize %d\n", used, datasize); 649 goto err; 650 } 651 652 /* write the streams */ 653 r = write_stream_data( storage, L"_StringData", data, datasize, TRUE ); 654 TRACE("Wrote StringData r=%08x\n", r); 655 if( r ) 656 goto err; 657 r = write_stream_data( storage, L"_StringPool", pool, poolsize, TRUE ); 658 TRACE("Wrote StringPool r=%08x\n", r); 659 if( r ) 660 goto err; 661 662 ret = ERROR_SUCCESS; 663 664 err: 665 free( data ); 666 free( pool ); 667 668 return ret; 669 } 670 671 UINT msi_get_string_table_codepage( const string_table *st ) 672 { 673 return st->codepage; 674 } 675 676 UINT msi_set_string_table_codepage( string_table *st, UINT codepage ) 677 { 678 if (validate_codepage( codepage )) 679 { 680 st->codepage = codepage; 681 return ERROR_SUCCESS; 682 } 683 return ERROR_FUNCTION_FAILED; 684 } 685