xref: /aosp_15_r20/external/harfbuzz_ng/src/OT/name/name.hh (revision 2d1272b857b1f7575e6e246373e1cb218663db8a)
1 /*
2  * Copyright © 2011,2012  Google, Inc.
3  *
4  *  This is part of HarfBuzz, a text shaping library.
5  *
6  * Permission is hereby granted, without written agreement and without
7  * license or royalty fees, to use, copy, modify, and distribute this
8  * software and its documentation for any purpose, provided that the
9  * above copyright notice and the following two paragraphs appear in
10  * all copies of this software.
11  *
12  * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
13  * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
14  * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
15  * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
16  * DAMAGE.
17  *
18  * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
19  * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
20  * FITNESS FOR A PARTICULAR PURPOSE.  THE SOFTWARE PROVIDED HEREUNDER IS
21  * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
22  * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
23  *
24  * Google Author(s): Behdad Esfahbod
25  */
26 
27 #ifndef OT_NAME_NAME_HH
28 #define OT_NAME_NAME_HH
29 
30 #include "../../hb-open-type.hh"
31 #include "../../hb-ot-name-language.hh"
32 #include "../../hb-aat-layout.hh"
33 #include "../../hb-utf.hh"
34 
35 
36 namespace OT {
37 
38 template <typename in_utf_t, typename out_utf_t>
39 inline unsigned int
hb_ot_name_convert_utf(hb_bytes_t bytes,unsigned int * text_size,typename out_utf_t::codepoint_t * text)40 hb_ot_name_convert_utf (hb_bytes_t                       bytes,
41 			unsigned int                    *text_size /* IN/OUT */,
42 			typename out_utf_t::codepoint_t *text /* OUT */)
43 {
44   unsigned int src_len = bytes.length / sizeof (typename in_utf_t::codepoint_t);
45   const typename in_utf_t::codepoint_t *src = (const typename in_utf_t::codepoint_t *) bytes.arrayZ;
46   const typename in_utf_t::codepoint_t *src_end = src + src_len;
47 
48   typename out_utf_t::codepoint_t *dst = text;
49 
50   hb_codepoint_t unicode;
51   const hb_codepoint_t replacement = HB_BUFFER_REPLACEMENT_CODEPOINT_DEFAULT;
52 
53   if (text_size && *text_size)
54   {
55     (*text_size)--; /* Save room for NUL-termination. */
56     const typename out_utf_t::codepoint_t *dst_end = text + *text_size;
57 
58     while (src < src_end && dst < dst_end)
59     {
60       const typename in_utf_t::codepoint_t *src_next = in_utf_t::next (src, src_end, &unicode, replacement);
61       typename out_utf_t::codepoint_t *dst_next = out_utf_t::encode (dst, dst_end, unicode);
62       if (dst_next == dst)
63 	break; /* Out-of-room. */
64 
65       dst = dst_next;
66       src = src_next;
67     }
68 
69     *text_size = dst - text;
70     *dst = 0; /* NUL-terminate. */
71   }
72 
73   /* Accumulate length of rest. */
74   unsigned int dst_len = dst - text;
75   while (src < src_end)
76   {
77     src = in_utf_t::next (src, src_end, &unicode, replacement);
78     dst_len += out_utf_t::encode_len (unicode);
79   }
80   return dst_len;
81 }
82 
83 #define entry_score var.u16[0]
84 #define entry_index var.u16[1]
85 
86 
87 /*
88  * name -- Naming
89  * https://docs.microsoft.com/en-us/typography/opentype/spec/name
90  */
91 #define HB_OT_TAG_name HB_TAG('n','a','m','e')
92 
93 #define UNSUPPORTED	42
94 
95 struct NameRecord
96 {
languageOT::NameRecord97   hb_language_t language (hb_face_t *face) const
98   {
99 #ifndef HB_NO_OT_NAME_LANGUAGE
100     unsigned int p = platformID;
101     unsigned int l = languageID;
102 
103     if (p == 3)
104       return _hb_ot_name_language_for_ms_code (l);
105 
106     if (p == 1)
107       return _hb_ot_name_language_for_mac_code (l);
108 
109 #ifndef HB_NO_OT_NAME_LANGUAGE_AAT
110     if (p == 0)
111       return face->table.ltag->get_language (l);
112 #endif
113 
114 #endif
115     return HB_LANGUAGE_INVALID;
116   }
117 
scoreOT::NameRecord118   uint16_t score () const
119   {
120     /* Same order as in cmap::find_best_subtable(). */
121     unsigned int p = platformID;
122     unsigned int e = encodingID;
123 
124     /* 32-bit. */
125     if (p == 3 && e == 10) return 0;
126     if (p == 0 && e ==  6) return 1;
127     if (p == 0 && e ==  4) return 2;
128 
129     /* 16-bit. */
130     if (p == 3 && e ==  1) return 3;
131     if (p == 0 && e ==  3) return 4;
132     if (p == 0 && e ==  2) return 5;
133     if (p == 0 && e ==  1) return 6;
134     if (p == 0 && e ==  0) return 7;
135 
136     /* Symbol. */
137     if (p == 3 && e ==  0) return 8;
138 
139     /* We treat all Mac Latin names as ASCII only. */
140     if (p == 1 && e ==  0) return 10; /* 10 is magic number :| */
141 
142     return UNSUPPORTED;
143   }
144 
copyOT::NameRecord145   NameRecord* copy (hb_serialize_context_t *c, const void *base
146 #ifdef HB_EXPERIMENTAL_API
147                     , const hb_hashmap_t<hb_ot_name_record_ids_t, hb_bytes_t> *name_table_overrides
148 #endif
149 		    ) const
150   {
151     TRACE_SERIALIZE (this);
152     HB_UNUSED auto snap = c->snapshot ();
153     auto *out = c->embed (this);
154     if (unlikely (!out)) return_trace (nullptr);
155 #ifdef HB_EXPERIMENTAL_API
156     hb_ot_name_record_ids_t record_ids (platformID, encodingID, languageID, nameID);
157     hb_bytes_t* name_bytes;
158 
159     if (name_table_overrides->has (record_ids, &name_bytes)) {
160       hb_bytes_t encoded_bytes = *name_bytes;
161       char *name_str_utf16_be = nullptr;
162 
163       if (platformID != 1)
164       {
165         unsigned text_size = hb_ot_name_convert_utf<hb_utf8_t, hb_utf16_be_t> (*name_bytes, nullptr, nullptr);
166 
167         text_size++; // needs to consider NULL terminator for use in hb_ot_name_convert_utf()
168         unsigned byte_len = text_size * hb_utf16_be_t::codepoint_t::static_size;
169         name_str_utf16_be = (char *) hb_calloc (byte_len, 1);
170         if (!name_str_utf16_be)
171         {
172           c->revert (snap);
173           return_trace (nullptr);
174         }
175         hb_ot_name_convert_utf<hb_utf8_t, hb_utf16_be_t> (*name_bytes, &text_size,
176                                                           (hb_utf16_be_t::codepoint_t *) name_str_utf16_be);
177 
178         unsigned encoded_byte_len = text_size * hb_utf16_be_t::codepoint_t::static_size;
179         if (!encoded_byte_len || !c->check_assign (out->length, encoded_byte_len, HB_SERIALIZE_ERROR_INT_OVERFLOW)) {
180           c->revert (snap);
181           hb_free (name_str_utf16_be);
182           return_trace (nullptr);
183         }
184 
185         encoded_bytes = hb_bytes_t (name_str_utf16_be, encoded_byte_len);
186       }
187       else
188       {
189         // mac platform, copy the UTF-8 string(all ascii characters) as is
190         if (!c->check_assign (out->length, encoded_bytes.length, HB_SERIALIZE_ERROR_INT_OVERFLOW)) {
191           c->revert (snap);
192           return_trace (nullptr);
193         }
194       }
195 
196       out->offset = 0;
197       c->push ();
198       encoded_bytes.copy (c);
199       c->add_link (out->offset, c->pop_pack (), hb_serialize_context_t::Tail, 0);
200       hb_free (name_str_utf16_be);
201     }
202     else
203 #endif
204     {
205       out->offset.serialize_copy (c, offset, base, 0, hb_serialize_context_t::Tail, length);
206     }
207     return_trace (out);
208   }
209 
isUnicodeOT::NameRecord210   bool isUnicode () const
211   {
212     unsigned int p = platformID;
213     unsigned int e = encodingID;
214 
215     return (p == 0 ||
216 	    (p == 3 && (e == 0 || e == 1 || e == 10)));
217   }
218 
cmpOT::NameRecord219   static int cmp (const void *pa, const void *pb)
220   {
221     const NameRecord *a = (const NameRecord *)pa;
222     const NameRecord *b = (const NameRecord *)pb;
223 
224     if (a->platformID != b->platformID)
225       return a->platformID - b->platformID;
226 
227     if (a->encodingID != b->encodingID)
228       return a->encodingID - b->encodingID;
229 
230     if (a->languageID != b->languageID)
231       return a->languageID - b->languageID;
232 
233     if (a->nameID != b->nameID)
234       return a->nameID - b->nameID;
235 
236     if (a->length != b->length)
237       return a->length - b->length;
238 
239     return 0;
240   }
241 
sanitizeOT::NameRecord242   bool sanitize (hb_sanitize_context_t *c, const void *base) const
243   {
244     TRACE_SANITIZE (this);
245     return_trace (c->check_struct (this) &&
246 		  hb_barrier () &&
247 		  offset.sanitize (c, base, length));
248   }
249 
250   HBUINT16	platformID;	/* Platform ID. */
251   HBUINT16	encodingID;	/* Platform-specific encoding ID. */
252   HBUINT16	languageID;	/* Language ID. */
253   HBUINT16	nameID;		/* Name ID. */
254   HBUINT16	length;		/* String length (in bytes). */
255   NNOffset16To<UnsizedArrayOf<HBUINT8>>
256 		offset;		/* String offset from start of storage area (in bytes). */
257   public:
258   DEFINE_SIZE_STATIC (12);
259 };
260 
261 static int
_hb_ot_name_entry_cmp_key(const void * pa,const void * pb,bool exact)262 _hb_ot_name_entry_cmp_key (const void *pa, const void *pb, bool exact)
263 {
264   const hb_ot_name_entry_t *a = (const hb_ot_name_entry_t *) pa;
265   const hb_ot_name_entry_t *b = (const hb_ot_name_entry_t *) pb;
266 
267   /* Compare by name_id, then language. */
268 
269   if (a->name_id != b->name_id)
270     return a->name_id - b->name_id;
271 
272   if (a->language == b->language) return 0;
273   if (!a->language) return -1;
274   if (!b->language) return +1;
275 
276   const char *astr = hb_language_to_string (a->language);
277   const char *bstr = hb_language_to_string (b->language);
278 
279   signed c = strcmp (astr, bstr);
280 
281   // 'a' is the user request, and 'b' is string in the font.
282   // If eg. user asks for "en-us" and font has "en", approve.
283   if (!exact && c &&
284       hb_language_matches (b->language, a->language))
285     return 0;
286 
287   return c;
288 }
289 
290 static int
_hb_ot_name_entry_cmp(const void * pa,const void * pb)291 _hb_ot_name_entry_cmp (const void *pa, const void *pb)
292 {
293   /* Compare by name_id, then language, then score, then index. */
294 
295   int v = _hb_ot_name_entry_cmp_key (pa, pb, true);
296   if (v)
297     return v;
298 
299   const hb_ot_name_entry_t *a = (const hb_ot_name_entry_t *) pa;
300   const hb_ot_name_entry_t *b = (const hb_ot_name_entry_t *) pb;
301 
302   if (a->entry_score != b->entry_score)
303     return a->entry_score - b->entry_score;
304 
305   if (a->entry_index != b->entry_index)
306     return a->entry_index - b->entry_index;
307 
308   return 0;
309 }
310 
311 struct name
312 {
313   static constexpr hb_tag_t tableTag = HB_OT_TAG_name;
314 
get_sizeOT::name315   unsigned int get_size () const
316   { return min_size + count * nameRecordZ.item_size; }
317 
318   template <typename Iterator,
319 	    hb_requires (hb_is_source_of (Iterator, const NameRecord &))>
serializeOT::name320   bool serialize (hb_serialize_context_t *c,
321 		  Iterator it,
322 		  const void *src_string_pool
323 #ifdef HB_EXPERIMENTAL_API
324                   , const hb_vector_t<hb_ot_name_record_ids_t>& insert_name_records
325 		  , const hb_hashmap_t<hb_ot_name_record_ids_t, hb_bytes_t> *name_table_overrides
326 #endif
327 		  )
328   {
329     TRACE_SERIALIZE (this);
330 
331     if (unlikely (!c->extend_min ((*this))))  return_trace (false);
332 
333     unsigned total_count = it.len ()
334 #ifdef HB_EXPERIMENTAL_API
335         + insert_name_records.length
336 #endif
337         ;
338     this->format = 0;
339     if (!c->check_assign (this->count, total_count, HB_SERIALIZE_ERROR_INT_OVERFLOW))
340       return false;
341 
342     NameRecord *name_records = (NameRecord *) hb_calloc (total_count, NameRecord::static_size);
343     if (unlikely (!name_records)) return_trace (false);
344 
345     hb_array_t<NameRecord> records (name_records, total_count);
346 
347     for (const NameRecord& record : it)
348     {
349       hb_memcpy (name_records, &record, NameRecord::static_size);
350       name_records++;
351     }
352 
353 #ifdef HB_EXPERIMENTAL_API
354     for (unsigned i = 0; i < insert_name_records.length; i++)
355     {
356       const hb_ot_name_record_ids_t& ids = insert_name_records[i];
357       NameRecord record;
358       record.platformID = ids.platform_id;
359       record.encodingID = ids.encoding_id;
360       record.languageID = ids.language_id;
361       record.nameID = ids.name_id;
362       record.length = 0; // handled in NameRecord copy()
363       record.offset = 0;
364       hb_memcpy (name_records, &record, NameRecord::static_size);
365       name_records++;
366     }
367 #endif
368 
369     records.qsort ();
370 
371     c->copy_all (records,
372 		 src_string_pool
373 #ifdef HB_EXPERIMENTAL_API
374 		 , name_table_overrides
375 #endif
376 		 );
377     hb_free (records.arrayZ);
378 
379 
380     if (unlikely (c->ran_out_of_room ())) return_trace (false);
381 
382     this->stringOffset = c->length ();
383 
384     return_trace (true);
385   }
386 
subsetOT::name387   bool subset (hb_subset_context_t *c) const
388   {
389     auto *name_prime = c->serializer->start_embed<name> ();
390 
391 #ifdef HB_EXPERIMENTAL_API
392     const hb_hashmap_t<hb_ot_name_record_ids_t, hb_bytes_t> *name_table_overrides =
393         &c->plan->name_table_overrides;
394 #endif
395 
396     auto it =
397     + nameRecordZ.as_array (count)
398     | hb_filter (c->plan->name_ids, &NameRecord::nameID)
399     | hb_filter (c->plan->name_languages, &NameRecord::languageID)
400     | hb_filter ([&] (const NameRecord& namerecord) {
401       return
402           (c->plan->flags & HB_SUBSET_FLAGS_NAME_LEGACY)
403           || namerecord.isUnicode ();
404     })
405 #ifdef HB_EXPERIMENTAL_API
406     | hb_filter ([&] (const NameRecord& namerecord) {
407       if (name_table_overrides->is_empty ())
408         return true;
409       hb_ot_name_record_ids_t rec_ids (namerecord.platformID,
410                                        namerecord.encodingID,
411                                        namerecord.languageID,
412                                        namerecord.nameID);
413 
414       hb_bytes_t *p;
415       if (name_table_overrides->has (rec_ids, &p) &&
416           (*p).length == 0)
417         return false;
418       return true;
419     })
420 #endif
421     ;
422 
423 #ifdef HB_EXPERIMENTAL_API
424     hb_hashmap_t<hb_ot_name_record_ids_t, unsigned> retained_name_record_ids;
425     for (const NameRecord& rec : it)
426     {
427       hb_ot_name_record_ids_t rec_ids (rec.platformID,
428                                        rec.encodingID,
429                                        rec.languageID,
430                                        rec.nameID);
431       retained_name_record_ids.set (rec_ids, 1);
432     }
433 
434     hb_vector_t<hb_ot_name_record_ids_t> insert_name_records;
435     if (!name_table_overrides->is_empty ())
436     {
437       if (unlikely (!insert_name_records.alloc (name_table_overrides->get_population (), true)))
438         return false;
439       for (const auto& record_ids : name_table_overrides->keys ())
440       {
441         if (name_table_overrides->get (record_ids).length == 0)
442           continue;
443         if (retained_name_record_ids.has (record_ids))
444           continue;
445         insert_name_records.push (record_ids);
446       }
447     }
448 #endif
449 
450     return name_prime->serialize (c->serializer, it,
451 				  std::addressof (this + stringOffset)
452 #ifdef HB_EXPERIMENTAL_API
453 				  , insert_name_records
454 				  , name_table_overrides
455 #endif
456 				  );
457   }
458 
sanitize_recordsOT::name459   bool sanitize_records (hb_sanitize_context_t *c) const
460   {
461     TRACE_SANITIZE (this);
462     const void *string_pool = (this+stringOffset).arrayZ;
463     return_trace (nameRecordZ.sanitize (c, count, string_pool));
464   }
465 
sanitizeOT::name466   bool sanitize (hb_sanitize_context_t *c) const
467   {
468     TRACE_SANITIZE (this);
469     return_trace (c->check_struct (this) &&
470 		  hb_barrier () &&
471 		  likely (format == 0 || format == 1) &&
472 		  c->check_array (nameRecordZ.arrayZ, count) &&
473 		  c->check_range (this, stringOffset) &&
474 		  sanitize_records (c));
475   }
476 
477   struct accelerator_t
478   {
accelerator_tOT::name::accelerator_t479     accelerator_t (hb_face_t *face)
480     {
481       this->table = hb_sanitize_context_t ().reference_table<name> (face);
482       assert (this->table.get_length () >= this->table->stringOffset);
483       this->pool = (const char *) (const void *) (this->table+this->table->stringOffset);
484       this->pool_len = this->table.get_length () - this->table->stringOffset;
485       const hb_array_t<const NameRecord> all_names (this->table->nameRecordZ.arrayZ,
486 						    this->table->count);
487 
488       this->names.alloc (all_names.length, true);
489 
490       for (unsigned int i = 0; i < all_names.length; i++)
491       {
492 	hb_ot_name_entry_t *entry = this->names.push ();
493 
494 	entry->name_id = all_names[i].nameID;
495 	entry->language = all_names[i].language (face);
496 	entry->entry_score =  all_names[i].score ();
497 	entry->entry_index = i;
498       }
499 
500       this->names.qsort (_hb_ot_name_entry_cmp);
501       /* Walk and pick best only for each name_id,language pair,
502        * while dropping unsupported encodings. */
503       unsigned int j = 0;
504       for (unsigned int i = 0; i < this->names.length; i++)
505       {
506 	if (this->names[i].entry_score == UNSUPPORTED ||
507 	    this->names[i].language == HB_LANGUAGE_INVALID)
508 	  continue;
509 	if (i &&
510 	    this->names[i - 1].name_id  == this->names[i].name_id &&
511 	    this->names[i - 1].language == this->names[i].language)
512 	  continue;
513 	this->names[j++] = this->names[i];
514       }
515       this->names.resize (j);
516     }
~accelerator_tOT::name::accelerator_t517     ~accelerator_t ()
518     {
519       this->table.destroy ();
520     }
521 
get_indexOT::name::accelerator_t522     int get_index (hb_ot_name_id_t  name_id,
523 		   hb_language_t    language,
524 		   unsigned int    *width=nullptr) const
525     {
526       const hb_ot_name_entry_t key = {name_id, {0}, language};
527       const hb_ot_name_entry_t *entry = hb_bsearch (key, (const hb_ot_name_entry_t *) this->names,
528 						    this->names.length,
529 						    sizeof (hb_ot_name_entry_t),
530 						    _hb_ot_name_entry_cmp_key,
531 						    true);
532 
533       if (!entry)
534       {
535 	entry = hb_bsearch (key, (const hb_ot_name_entry_t *) this->names,
536 			    this->names.length,
537 			    sizeof (hb_ot_name_entry_t),
538 			    _hb_ot_name_entry_cmp_key,
539 			    false);
540       }
541 
542       if (!entry)
543 	return -1;
544 
545       if (width)
546 	*width = entry->entry_score < 10 ? 2 : 1;
547 
548       return entry->entry_index;
549     }
550 
get_nameOT::name::accelerator_t551     hb_bytes_t get_name (unsigned int idx) const
552     {
553       const hb_array_t<const NameRecord> all_names (table->nameRecordZ.arrayZ, table->count);
554       const NameRecord &record = all_names[idx];
555       const hb_bytes_t string_pool (pool, pool_len);
556       return string_pool.sub_array (record.offset, record.length);
557     }
558 
559     private:
560     const char *pool;
561     unsigned int pool_len;
562     public:
563     hb_blob_ptr_t<name> table;
564     hb_vector_t<hb_ot_name_entry_t> names;
565   };
566 
567   public:
568   /* We only implement format 0 for now. */
569   HBUINT16	format;		/* Format selector (=0/1). */
570   HBUINT16	count;		/* Number of name records. */
571   NNOffset16To<UnsizedArrayOf<HBUINT8>>
572 		stringOffset;	/* Offset to start of string storage (from start of table). */
573   UnsizedArrayOf<NameRecord>
574 		nameRecordZ;	/* The name records where count is the number of records. */
575   public:
576   DEFINE_SIZE_ARRAY (6, nameRecordZ);
577 };
578 
579 #undef entry_index
580 #undef entry_score
581 
582 struct name_accelerator_t : name::accelerator_t {
name_accelerator_tOT::name_accelerator_t583   name_accelerator_t (hb_face_t *face) : name::accelerator_t (face) {}
584 };
585 
586 } /* namespace OT */
587 
588 
589 #endif /* OT_NAME_NAME_HH */
590