1 /**************************************************************************** 2 * 3 * psmodule.c 4 * 5 * PSNames module implementation (body). 6 * 7 * Copyright 1996-2018 by 8 * David Turner, Robert Wilhelm, and Werner Lemberg. 9 * 10 * This file is part of the FreeType project, and may only be used, 11 * modified, and distributed under the terms of the FreeType project 12 * license, LICENSE.TXT. By continuing to use, modify, or distribute 13 * this file you indicate that you have read the license and 14 * understand and accept it fully. 15 * 16 */ 17 18 19 #include <ft2build.h> 20 #include FT_INTERNAL_DEBUG_H 21 #include FT_INTERNAL_OBJECTS_H 22 #include FT_SERVICE_POSTSCRIPT_CMAPS_H 23 24 #include "psmodule.h" 25 26 /* 27 * The file `pstables.h' with its arrays and its function 28 * `ft_get_adobe_glyph_index' is useful for other projects also (for 29 * example, `pdfium' is using it). However, if used as a C++ header, 30 * including it in two different source files makes it necessary to use 31 * `extern const' for the declaration of its arrays, otherwise the data 32 * would be duplicated as mandated by the C++ standard. 33 * 34 * For this reason, we use `DEFINE_PS_TABLES' to guard the function 35 * definitions, and `DEFINE_PS_TABLES_DATA' to provide both proper array 36 * declarations and definitions. 37 */ 38 #include "pstables.h" 39 #define DEFINE_PS_TABLES 40 #define DEFINE_PS_TABLES_DATA 41 #include "pstables.h" 42 43 #include "psnamerr.h" 44 45 46 #ifdef FT_CONFIG_OPTION_POSTSCRIPT_NAMES 47 48 49 #ifdef FT_CONFIG_OPTION_ADOBE_GLYPH_LIST 50 51 52 #define VARIANT_BIT 0x80000000UL 53 #define BASE_GLYPH( code ) ( (FT_UInt32)( (code) & ~VARIANT_BIT ) ) 54 55 56 /* Return the Unicode value corresponding to a given glyph. Note that */ 57 /* we do deal with glyph variants by detecting a non-initial dot in */ 58 /* the name, as in `A.swash' or `e.final'; in this case, the */ 59 /* VARIANT_BIT is set in the return value. */ 60 /* */ 61 static FT_UInt32 ps_unicode_value(const char * glyph_name)62 ps_unicode_value( const char* glyph_name ) 63 { 64 /* If the name begins with `uni', then the glyph name may be a */ 65 /* hard-coded unicode character code. */ 66 if ( glyph_name[0] == 'u' && 67 glyph_name[1] == 'n' && 68 glyph_name[2] == 'i' ) 69 { 70 /* determine whether the next four characters following are */ 71 /* hexadecimal. */ 72 73 /* XXX: Add code to deal with ligatures, i.e. glyph names like */ 74 /* `uniXXXXYYYYZZZZ'... */ 75 76 FT_Int count; 77 FT_UInt32 value = 0; 78 const char* p = glyph_name + 3; 79 80 81 for ( count = 4; count > 0; count--, p++ ) 82 { 83 char c = *p; 84 unsigned int d; 85 86 87 d = (unsigned char)c - '0'; 88 if ( d >= 10 ) 89 { 90 d = (unsigned char)c - 'A'; 91 if ( d >= 6 ) 92 d = 16; 93 else 94 d += 10; 95 } 96 97 /* Exit if a non-uppercase hexadecimal character was found */ 98 /* -- this also catches character codes below `0' since such */ 99 /* negative numbers cast to `unsigned int' are far too big. */ 100 if ( d >= 16 ) 101 break; 102 103 value = ( value << 4 ) + d; 104 } 105 106 /* there must be exactly four hex digits */ 107 if ( count == 0 ) 108 { 109 if ( *p == '\0' ) 110 return value; 111 if ( *p == '.' ) 112 return (FT_UInt32)( value | VARIANT_BIT ); 113 } 114 } 115 116 /* If the name begins with `u', followed by four to six uppercase */ 117 /* hexadecimal digits, it is a hard-coded unicode character code. */ 118 if ( glyph_name[0] == 'u' ) 119 { 120 FT_Int count; 121 FT_UInt32 value = 0; 122 const char* p = glyph_name + 1; 123 124 125 for ( count = 6; count > 0; count--, p++ ) 126 { 127 char c = *p; 128 unsigned int d; 129 130 131 d = (unsigned char)c - '0'; 132 if ( d >= 10 ) 133 { 134 d = (unsigned char)c - 'A'; 135 if ( d >= 6 ) 136 d = 16; 137 else 138 d += 10; 139 } 140 141 if ( d >= 16 ) 142 break; 143 144 value = ( value << 4 ) + d; 145 } 146 147 if ( count <= 2 ) 148 { 149 if ( *p == '\0' ) 150 return value; 151 if ( *p == '.' ) 152 return (FT_UInt32)( value | VARIANT_BIT ); 153 } 154 } 155 156 /* Look for a non-initial dot in the glyph name in order to */ 157 /* find variants like `A.swash', `e.final', etc. */ 158 { 159 const char* p = glyph_name; 160 const char* dot = NULL; 161 162 163 for ( ; *p; p++ ) 164 { 165 if ( *p == '.' && p > glyph_name ) 166 { 167 dot = p; 168 break; 169 } 170 } 171 172 /* now look up the glyph in the Adobe Glyph List */ 173 if ( !dot ) 174 return (FT_UInt32)ft_get_adobe_glyph_index( glyph_name, p ); 175 else 176 return (FT_UInt32)( ft_get_adobe_glyph_index( glyph_name, dot ) | 177 VARIANT_BIT ); 178 } 179 } 180 181 182 /* ft_qsort callback to sort the unicode map */ 183 FT_CALLBACK_DEF( int ) compare_uni_maps(const void * a,const void * b)184 compare_uni_maps( const void* a, 185 const void* b ) 186 { 187 PS_UniMap* map1 = (PS_UniMap*)a; 188 PS_UniMap* map2 = (PS_UniMap*)b; 189 FT_UInt32 unicode1 = BASE_GLYPH( map1->unicode ); 190 FT_UInt32 unicode2 = BASE_GLYPH( map2->unicode ); 191 192 193 /* sort base glyphs before glyph variants */ 194 if ( unicode1 == unicode2 ) 195 { 196 if ( map1->unicode > map2->unicode ) 197 return 1; 198 else if ( map1->unicode < map2->unicode ) 199 return -1; 200 else 201 return 0; 202 } 203 else 204 { 205 if ( unicode1 > unicode2 ) 206 return 1; 207 else if ( unicode1 < unicode2 ) 208 return -1; 209 else 210 return 0; 211 } 212 } 213 214 215 /* support for extra glyphs not handled (well) in AGL; */ 216 /* we add extra mappings for them if necessary */ 217 218 #define EXTRA_GLYPH_LIST_SIZE 10 219 220 static const FT_UInt32 ft_extra_glyph_unicodes[EXTRA_GLYPH_LIST_SIZE] = 221 { 222 /* WGL 4 */ 223 0x0394, 224 0x03A9, 225 0x2215, 226 0x00AD, 227 0x02C9, 228 0x03BC, 229 0x2219, 230 0x00A0, 231 /* Romanian */ 232 0x021A, 233 0x021B 234 }; 235 236 static const char ft_extra_glyph_names[] = 237 { 238 'D','e','l','t','a',0, 239 'O','m','e','g','a',0, 240 'f','r','a','c','t','i','o','n',0, 241 'h','y','p','h','e','n',0, 242 'm','a','c','r','o','n',0, 243 'm','u',0, 244 'p','e','r','i','o','d','c','e','n','t','e','r','e','d',0, 245 's','p','a','c','e',0, 246 'T','c','o','m','m','a','a','c','c','e','n','t',0, 247 't','c','o','m','m','a','a','c','c','e','n','t',0 248 }; 249 250 static const FT_Int 251 ft_extra_glyph_name_offsets[EXTRA_GLYPH_LIST_SIZE] = 252 { 253 0, 254 6, 255 12, 256 21, 257 28, 258 35, 259 38, 260 53, 261 59, 262 72 263 }; 264 265 266 static void ps_check_extra_glyph_name(const char * gname,FT_UInt glyph,FT_UInt * extra_glyphs,FT_UInt * states)267 ps_check_extra_glyph_name( const char* gname, 268 FT_UInt glyph, 269 FT_UInt* extra_glyphs, 270 FT_UInt *states ) 271 { 272 FT_UInt n; 273 274 275 for ( n = 0; n < EXTRA_GLYPH_LIST_SIZE; n++ ) 276 { 277 if ( ft_strcmp( ft_extra_glyph_names + 278 ft_extra_glyph_name_offsets[n], gname ) == 0 ) 279 { 280 if ( states[n] == 0 ) 281 { 282 /* mark this extra glyph as a candidate for the cmap */ 283 states[n] = 1; 284 extra_glyphs[n] = glyph; 285 } 286 287 return; 288 } 289 } 290 } 291 292 293 static void ps_check_extra_glyph_unicode(FT_UInt32 uni_char,FT_UInt * states)294 ps_check_extra_glyph_unicode( FT_UInt32 uni_char, 295 FT_UInt *states ) 296 { 297 FT_UInt n; 298 299 300 for ( n = 0; n < EXTRA_GLYPH_LIST_SIZE; n++ ) 301 { 302 if ( uni_char == ft_extra_glyph_unicodes[n] ) 303 { 304 /* disable this extra glyph from being added to the cmap */ 305 states[n] = 2; 306 307 return; 308 } 309 } 310 } 311 312 313 /* Build a table that maps Unicode values to glyph indices. */ 314 static FT_Error ps_unicodes_init(FT_Memory memory,PS_Unicodes table,FT_UInt num_glyphs,PS_GetGlyphNameFunc get_glyph_name,PS_FreeGlyphNameFunc free_glyph_name,FT_Pointer glyph_data)315 ps_unicodes_init( FT_Memory memory, 316 PS_Unicodes table, 317 FT_UInt num_glyphs, 318 PS_GetGlyphNameFunc get_glyph_name, 319 PS_FreeGlyphNameFunc free_glyph_name, 320 FT_Pointer glyph_data ) 321 { 322 FT_Error error; 323 324 FT_UInt extra_glyph_list_states[] = { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }; 325 FT_UInt extra_glyphs[EXTRA_GLYPH_LIST_SIZE]; 326 327 328 /* we first allocate the table */ 329 table->num_maps = 0; 330 table->maps = NULL; 331 332 if ( !FT_NEW_ARRAY( table->maps, num_glyphs + EXTRA_GLYPH_LIST_SIZE ) ) 333 { 334 FT_UInt n; 335 FT_UInt count; 336 PS_UniMap* map; 337 FT_UInt32 uni_char; 338 339 340 map = table->maps; 341 342 for ( n = 0; n < num_glyphs; n++ ) 343 { 344 const char* gname = get_glyph_name( glyph_data, n ); 345 346 347 if ( gname ) 348 { 349 ps_check_extra_glyph_name( gname, n, 350 extra_glyphs, extra_glyph_list_states ); 351 uni_char = ps_unicode_value( gname ); 352 353 if ( BASE_GLYPH( uni_char ) != 0 ) 354 { 355 ps_check_extra_glyph_unicode( uni_char, 356 extra_glyph_list_states ); 357 map->unicode = uni_char; 358 map->glyph_index = n; 359 map++; 360 } 361 362 if ( free_glyph_name ) 363 free_glyph_name( glyph_data, gname ); 364 } 365 } 366 367 for ( n = 0; n < EXTRA_GLYPH_LIST_SIZE; n++ ) 368 { 369 if ( extra_glyph_list_states[n] == 1 ) 370 { 371 /* This glyph name has an additional representation. */ 372 /* Add it to the cmap. */ 373 374 map->unicode = ft_extra_glyph_unicodes[n]; 375 map->glyph_index = extra_glyphs[n]; 376 map++; 377 } 378 } 379 380 /* now compress the table a bit */ 381 count = (FT_UInt)( map - table->maps ); 382 383 if ( count == 0 ) 384 { 385 /* No unicode chars here! */ 386 FT_FREE( table->maps ); 387 if ( !error ) 388 error = FT_THROW( No_Unicode_Glyph_Name ); 389 } 390 else 391 { 392 /* Reallocate if the number of used entries is much smaller. */ 393 if ( count < num_glyphs / 2 ) 394 { 395 (void)FT_RENEW_ARRAY( table->maps, 396 num_glyphs + EXTRA_GLYPH_LIST_SIZE, 397 count ); 398 error = FT_Err_Ok; 399 } 400 401 /* Sort the table in increasing order of unicode values, */ 402 /* taking care of glyph variants. */ 403 ft_qsort( table->maps, count, sizeof ( PS_UniMap ), 404 compare_uni_maps ); 405 } 406 407 table->num_maps = count; 408 } 409 410 return error; 411 } 412 413 414 static FT_UInt ps_unicodes_char_index(PS_Unicodes table,FT_UInt32 unicode)415 ps_unicodes_char_index( PS_Unicodes table, 416 FT_UInt32 unicode ) 417 { 418 PS_UniMap *min, *max, *mid, *result = NULL; 419 420 421 /* Perform a binary search on the table. */ 422 423 min = table->maps; 424 max = min + table->num_maps - 1; 425 426 while ( min <= max ) 427 { 428 FT_UInt32 base_glyph; 429 430 431 mid = min + ( ( max - min ) >> 1 ); 432 433 if ( mid->unicode == unicode ) 434 { 435 result = mid; 436 break; 437 } 438 439 base_glyph = BASE_GLYPH( mid->unicode ); 440 441 if ( base_glyph == unicode ) 442 result = mid; /* remember match but continue search for base glyph */ 443 444 if ( min == max ) 445 break; 446 447 if ( base_glyph < unicode ) 448 min = mid + 1; 449 else 450 max = mid - 1; 451 } 452 453 if ( result ) 454 return result->glyph_index; 455 else 456 return 0; 457 } 458 459 460 static FT_UInt32 ps_unicodes_char_next(PS_Unicodes table,FT_UInt32 * unicode)461 ps_unicodes_char_next( PS_Unicodes table, 462 FT_UInt32 *unicode ) 463 { 464 FT_UInt result = 0; 465 FT_UInt32 char_code = *unicode + 1; 466 467 468 { 469 FT_UInt min = 0; 470 FT_UInt max = table->num_maps; 471 FT_UInt mid; 472 PS_UniMap* map; 473 FT_UInt32 base_glyph; 474 475 476 while ( min < max ) 477 { 478 mid = min + ( ( max - min ) >> 1 ); 479 map = table->maps + mid; 480 481 if ( map->unicode == char_code ) 482 { 483 result = map->glyph_index; 484 goto Exit; 485 } 486 487 base_glyph = BASE_GLYPH( map->unicode ); 488 489 if ( base_glyph == char_code ) 490 result = map->glyph_index; 491 492 if ( base_glyph < char_code ) 493 min = mid + 1; 494 else 495 max = mid; 496 } 497 498 if ( result ) 499 goto Exit; /* we have a variant glyph */ 500 501 /* we didn't find it; check whether we have a map just above it */ 502 char_code = 0; 503 504 if ( min < table->num_maps ) 505 { 506 map = table->maps + min; 507 result = map->glyph_index; 508 char_code = BASE_GLYPH( map->unicode ); 509 } 510 } 511 512 Exit: 513 *unicode = char_code; 514 return result; 515 } 516 517 518 #endif /* FT_CONFIG_OPTION_ADOBE_GLYPH_LIST */ 519 520 521 static const char* ps_get_macintosh_name(FT_UInt name_index)522 ps_get_macintosh_name( FT_UInt name_index ) 523 { 524 if ( name_index >= FT_NUM_MAC_NAMES ) 525 name_index = 0; 526 527 return ft_standard_glyph_names + ft_mac_names[name_index]; 528 } 529 530 531 static const char* ps_get_standard_strings(FT_UInt sid)532 ps_get_standard_strings( FT_UInt sid ) 533 { 534 if ( sid >= FT_NUM_SID_NAMES ) 535 return 0; 536 537 return ft_standard_glyph_names + ft_sid_names[sid]; 538 } 539 540 541 #ifdef FT_CONFIG_OPTION_ADOBE_GLYPH_LIST 542 543 FT_DEFINE_SERVICE_PSCMAPSREC( 544 pscmaps_interface, 545 546 (PS_Unicode_ValueFunc) ps_unicode_value, /* unicode_value */ 547 (PS_Unicodes_InitFunc) ps_unicodes_init, /* unicodes_init */ 548 (PS_Unicodes_CharIndexFunc)ps_unicodes_char_index, /* unicodes_char_index */ 549 (PS_Unicodes_CharNextFunc) ps_unicodes_char_next, /* unicodes_char_next */ 550 551 (PS_Macintosh_NameFunc) ps_get_macintosh_name, /* macintosh_name */ 552 (PS_Adobe_Std_StringsFunc) ps_get_standard_strings, /* adobe_std_strings */ 553 554 t1_standard_encoding, /* adobe_std_encoding */ 555 t1_expert_encoding /* adobe_expert_encoding */ 556 ) 557 558 #else 559 560 FT_DEFINE_SERVICE_PSCMAPSREC( 561 pscmaps_interface, 562 563 NULL, /* unicode_value */ 564 NULL, /* unicodes_init */ 565 NULL, /* unicodes_char_index */ 566 NULL, /* unicodes_char_next */ 567 568 (PS_Macintosh_NameFunc) ps_get_macintosh_name, /* macintosh_name */ 569 (PS_Adobe_Std_StringsFunc) ps_get_standard_strings, /* adobe_std_strings */ 570 571 t1_standard_encoding, /* adobe_std_encoding */ 572 t1_expert_encoding /* adobe_expert_encoding */ 573 ) 574 575 #endif /* FT_CONFIG_OPTION_ADOBE_GLYPH_LIST */ 576 577 578 FT_DEFINE_SERVICEDESCREC1( 579 pscmaps_services, 580 581 FT_SERVICE_ID_POSTSCRIPT_CMAPS, &pscmaps_interface ) 582 583 584 static FT_Pointer psnames_get_service(FT_Module module,const char * service_id)585 psnames_get_service( FT_Module module, 586 const char* service_id ) 587 { 588 FT_UNUSED( module ); 589 590 return ft_service_list_lookup( pscmaps_services, service_id ); 591 } 592 593 #endif /* FT_CONFIG_OPTION_POSTSCRIPT_NAMES */ 594 595 596 #ifndef FT_CONFIG_OPTION_POSTSCRIPT_NAMES 597 #define PUT_PS_NAMES_SERVICE( a ) NULL 598 #else 599 #define PUT_PS_NAMES_SERVICE( a ) a 600 #endif 601 602 FT_DEFINE_MODULE( 603 psnames_module_class, 604 605 0, /* this is not a font driver, nor a renderer */ 606 sizeof ( FT_ModuleRec ), 607 608 "psnames", /* driver name */ 609 0x10000L, /* driver version */ 610 0x20000L, /* driver requires FreeType 2 or above */ 611 612 PUT_PS_NAMES_SERVICE( 613 (void*)&pscmaps_interface ), /* module specific interface */ 614 615 (FT_Module_Constructor)NULL, /* module_init */ 616 (FT_Module_Destructor) NULL, /* module_done */ 617 (FT_Module_Requester) PUT_PS_NAMES_SERVICE( psnames_get_service ) /* get_interface */ 618 ) 619 620 621 /* END */ 622