t1parse.c source code [Godot/thirdparty/freetype/src/type1/t1parse.c]

1	/****************************************************************************
2	*
3	* t1parse.c
4	*
5	* Type 1 parser (body).
6	*
7	* Copyright (C) 1996-2023 by
8	* David Turner, Robert Wilhelm, and Werner Lemberg.
9	*
10	* This file is part of the FreeType project, and may only be used,
11	* modified, and distributed under the terms of the FreeType project
12	* license, LICENSE.TXT. By continuing to use, modify, or distribute
13	* this file you indicate that you have read the license and
14	* understand and accept it fully.
15	*
16	*/
17
18
19	/**************************************************************************
20	*
21	* The Type 1 parser is in charge of the following:
22	*
23	* - provide an implementation of a growing sequence of objects called
24	* a `T1_Table' (used to build various tables needed by the loader).
25	*
26	* - opening .pfb and .pfa files to extract their top-level and private
27	* dictionaries.
28	*
29	* - read numbers, arrays & strings from any dictionary.
30	*
31	* See `t1load.c' to see how data is loaded from the font file.
32	*
33	*/
34
35
36	#include <freetype/internal/ftdebug.h>
37	#include <freetype/internal/ftstream.h>
38	#include <freetype/internal/psaux.h>
39
40	#include "t1parse.h"
41
42	#include "t1errors.h"
43
44
45	/**************************************************************************
46	*
47	* The macro FT_COMPONENT is used in trace mode. It is an implicit
48	* parameter of the FT_TRACE() and FT_ERROR() macros, used to print/log
49	* messages during execution.
50	*/
51	#undef FT_COMPONENT
52	#define FT_COMPONENT t1parse
53
54
55	/***********************************************************************/
56	/***********************************************************************/
57	/***********************************************************************/
58	/** **/
59	/** INPUT STREAM PARSER **/
60	/** **/
61	/***********************************************************************/
62	/***********************************************************************/
63	/***********************************************************************/
64
65
66	/* see Adobe Technical Note 5040.Download_Fonts.pdf */
67
68	static FT_Error
69	read_pfb_tag( FT_Stream stream,
70	FT_UShort *atag,
71	FT_ULong *asize )
72	{
73	FT_Error error;
74	FT_UShort tag;
75	FT_ULong size;
76
77
78	*atag = `0`;
79	*asize = `0`;
80
81	if ( !FT_READ_USHORT( tag ) )
82	{
83	if ( tag == `0x8001U` \|\| tag == `0x8002U` )
84	{
85	if ( !FT_READ_ULONG_LE( size ) )
86	*asize = size;
87	}
88
89	*atag = tag;
90	}
91
92	return error;
93	}
94
95
96	static FT_Error
97	check_type1_format( FT_Stream stream,
98	const char* header_string,
99	size_t header_length )
100	{
101	FT_Error error;
102	FT_UShort tag;
103	FT_ULong dummy;
104
105
106	if ( FT_STREAM_SEEK( `0` ) )
107	goto Exit;
108
109	error = read_pfb_tag( stream, &tag, &dummy );
110	if ( error )
111	goto Exit;
112
113	/ We assume that the first segment in a PFB is always encoded as /
114	/ text. This might be wrong (and the specification doesn't insist /
115	/ on that), but we have never seen a counterexample. /
116	if ( tag != `0x8001U` && FT_STREAM_SEEK( `0` ) )
117	goto Exit;
118
119	if ( !FT_FRAME_ENTER( header_length ) )
120	{
121	error = FT_Err_Ok;
122
123	if ( ft_memcmp( stream->cursor, header_string, header_length ) != `0` )
124	error = FT_THROW( Unknown_File_Format );
125
126	FT_FRAME_EXIT();
127	}
128
129	Exit:
130	return error;
131	}
132
133
134	FT_LOCAL_DEF( FT_Error )
135	T1_New_Parser( T1_Parser parser,
136	FT_Stream stream,
137	FT_Memory memory,
138	PSAux_Service psaux )
139	{
140	FT_Error error;
141	FT_UShort tag;
142	FT_ULong size;
143
144
145	psaux->ps_parser_funcs->init( &parser->root, NULL, NULL, memory );
146
147	parser->stream = stream;
148	parser->base_len = `0`;
149	parser->base_dict = NULL;
150	parser->private_len = `0`;
151	parser->private_dict = NULL;
152	parser->in_pfb = `0`;
153	parser->in_memory = `0`;
154	parser->single_block = `0`;
155
156	/ check the header format /
157	error = check_type1_format( stream, "%!PS-AdobeFont", `14` );
158	if ( error )
159	{
160	if ( FT_ERR_NEQ( error, Unknown_File_Format ) )
161	goto Exit;
162
163	error = check_type1_format( stream, "%!FontType", `10` );
164	if ( error )
165	{
166	FT_TRACE2(( " not a Type 1 font\n" ));
167	goto Exit;
168	}
169	}
170
171	/*******************************************************************
172	*
173	* Here a short summary of what is going on:
174	*
175	* When creating a new Type 1 parser, we try to locate and load
176	* the base dictionary if this is possible (i.e., for PFB
177	* files). Otherwise, we load the whole font into memory.
178	*
179	* When `loading' the base dictionary, we only setup pointers
180	* in the case of a memory-based stream. Otherwise, we
181	* allocate and load the base dictionary in it.
182	*
183	* parser->in_pfb is set if we are in a binary (`.pfb') font.
184	* parser->in_memory is set if we have a memory stream.
185	*/
186
187	/ try to compute the size of the base dictionary; /
188	/ look for a Postscript binary file tag, i.e., 0x8001 /
189	if ( FT_STREAM_SEEK( `0L` ) )
190	goto Exit;
191
192	error = read_pfb_tag( stream, &tag, &size );
193	if ( error )
194	goto Exit;
195
196	if ( tag != `0x8001U` )
197	{
198	/ assume that this is a PFA file for now; an error will /
199	/ be produced later when more things are checked /
200	if ( FT_STREAM_SEEK( `0L` ) )
201	goto Exit;
202	size = stream->size;
203	}
204	else
205	parser->in_pfb = `1`;
206
207	/ now, try to load `size' bytes of the `base' dictionary we /
208	/ found previously /
209
210	/ if it is a memory-based resource, set up pointers /
211	if ( !stream->read )
212	{
213	parser->base_dict = (FT_Byte*)stream->base + stream->pos;
214	parser->base_len = size;
215	parser->in_memory = `1`;
216
217	/ check that the `size' field is valid /
218	if ( FT_STREAM_SKIP( size ) )
219	goto Exit;
220	}
221	else
222	{
223	/ read segment in memory -- this is clumsy, but so does the format /
224	if ( FT_QALLOC( parser->base_dict, size ) \|\|
225	FT_STREAM_READ( parser->base_dict, size ) )
226	goto Exit;
227	parser->base_len = size;
228	}
229
230	parser->root.base = parser->base_dict;
231	parser->root.cursor = parser->base_dict;
232	parser->root.limit = parser->root.cursor + parser->base_len;
233
234	Exit:
235	if ( error && !parser->in_memory )
236	FT_FREE( parser->base_dict );
237
238	return error;
239	}
240
241
242	FT_LOCAL_DEF( void )
243	T1_Finalize_Parser( T1_Parser parser )
244	{
245	FT_Memory memory = parser->root.memory;
246
247
248	/ always free the private dictionary /
249	FT_FREE( parser->private_dict );
250
251	/ free the base dictionary only when we have a disk stream /
252	if ( !parser->in_memory )
253	FT_FREE( parser->base_dict );
254
255	parser->root.funcs.done( &parser->root );
256	}
257
258
259	FT_LOCAL_DEF( FT_Error )
260	T1_Get_Private_Dict( T1_Parser parser,
261	PSAux_Service psaux )
262	{
263	FT_Stream stream = parser->stream;
264	FT_Memory memory = parser->root.memory;
265	FT_Error error = FT_Err_Ok;
266	FT_ULong size;
267
268
269	if ( parser->in_pfb )
270	{
271	/ in the case of the PFB format, the private dictionary can be /
272	/ made of several segments. We thus first read the number of /
273	/ segments to compute the total size of the private dictionary /
274	/ then re-read them into memory. /
275	FT_ULong start_pos = FT_STREAM_POS();
276	FT_UShort tag;
277
278
279	parser->private_len = `0`;
280	for (;;)
281	{
282	error = read_pfb_tag( stream, &tag, &size );
283	if ( error )
284	goto Fail;
285
286	if ( tag != `0x8002U` )
287	break;
288
289	parser->private_len += size;
290
291	if ( FT_STREAM_SKIP( size ) )
292	goto Fail;
293	}
294
295	/ Check that we have a private dictionary there /
296	/ and allocate private dictionary buffer /
297	if ( parser->private_len == `0` )
298	{
299	FT_ERROR(( "T1_Get_Private_Dict:"
300	" invalid private dictionary section\n" ));
301	error = FT_THROW( Invalid_File_Format );
302	goto Fail;
303	}
304
305	if ( FT_STREAM_SEEK( start_pos ) \|\|
306	FT_QALLOC( parser->private_dict, parser->private_len ) )
307	goto Fail;
308
309	parser->private_len = `0`;
310	for (;;)
311	{
312	error = read_pfb_tag( stream, &tag, &size );
313	if ( error \|\| tag != `0x8002U` )
314	{
315	error = FT_Err_Ok;
316	break;
317	}
318
319	if ( FT_STREAM_READ( parser->private_dict + parser->private_len,
320	size ) )
321	goto Fail;
322
323	parser->private_len += size;
324	}
325	}
326	else
327	{
328	/ We have already `loaded' the whole PFA font file into memory; /
329	/ if this is a memory resource, allocate a new block to hold /
330	/ the private dict. Otherwise, simply overwrite into the base /
331	/ dictionary block in the heap. /
332
333	/ First look for the `eexec' keyword. Ensure `eexec' is real -- /
334	/ it could be in a comment or string (as e.g. in u003043t.gsf /
335	/ from ghostscript). /
336	FT_Byte* cur = parser->base_dict;
337	FT_Byte* limit = cur + parser->base_len;
338	FT_Pointer pos_lf;
339	FT_Bool test_cr;
340
341
342	parser->root.cursor = parser->base_dict;
343	parser->root.limit = parser->base_dict + parser->base_len;
344
345	cur = parser->root.cursor;
346	limit = parser->root.limit;
347
348	while ( cur < limit )
349	{
350	/ 9 = 5 letters for `eexec' + whitespace + 4 chars /
351	if ( cur[`0`] == `'e'` && cur + `9` < limit )
352	{
353	if ( cur[`1`] == `'e'` &&
354	cur[`2`] == `'x'` &&
355	cur[`3`] == `'e'` &&
356	cur[`4`] == `'c'` )
357	goto Found;
358	}
359
360	T1_Skip_PS_Token( parser );
361	if ( parser->root.error )
362	break;
363	T1_Skip_Spaces ( parser );
364	cur = parser->root.cursor;
365	}
366
367	FT_ERROR(( "T1_Get_Private_Dict: could not find `eexec' keyword\n" ));
368	error = FT_THROW( Invalid_File_Format );
369	goto Exit;
370
371	/ now determine where to write the _encrypted_ binary private /
372	/ dictionary. We overwrite the base dictionary for disk-based /
373	/ resources and allocate a new block otherwise /
374
375	Found:
376	parser->root.limit = parser->base_dict + parser->base_len;
377
378	T1_Skip_PS_Token( parser );
379	cur = parser->root.cursor;
380	limit = parser->root.limit;
381
382	/ According to the Type 1 spec, the first cipher byte must not be /
383	/ an ASCII whitespace character code (blank, tab, carriage return /
384	/ or line feed). We have seen Type 1 fonts with two line feed /
385	/ characters... So skip now all whitespace character codes. /
386	/ /
387	/ On the other hand, Adobe's Type 1 parser handles fonts just /
388	/ fine that are violating this limitation, so we add a heuristic /
389	/ test to stop at \r only if it is not used for EOL. /
390
391	pos_lf = ft_memchr( cur, `'\n'`, (size_t)( limit - cur ) );
392	test_cr = FT_BOOL( !pos_lf \|\|
393	pos_lf > ft_memchr( cur,
394	`'\r'`,
395	(size_t)( limit - cur ) ) );
396
397	while ( cur < limit &&
398	( *cur == `' '` \|\|
399	*cur == `'\t'` \|\|
400	(test_cr && *cur == `'\r'` ) \|\|
401	*cur == `'\n'` ) )
402	cur++;
403	if ( cur >= limit )
404	{
405	FT_ERROR(( "T1_Get_Private_Dict:"
406	" `eexec' not properly terminated\n" ));
407	error = FT_THROW( Invalid_File_Format );
408	goto Exit;
409	}
410
411	size = parser->base_len - (FT_ULong)( cur - parser->base_dict );
412
413	if ( parser->in_memory )
414	{
415	/ note that we allocate one more byte to put a terminating `0' /
416	if ( FT_QALLOC( parser->private_dict, size + `1` ) )
417	goto Fail;
418	parser->private_len = size;
419	}
420	else
421	{
422	parser->single_block = `1`;
423	parser->private_dict = parser->base_dict;
424	parser->private_len = size;
425	parser->base_dict = NULL;
426	parser->base_len = `0`;
427	}
428
429	/ now determine whether the private dictionary is encoded in binary /
430	/ or hexadecimal ASCII format -- decode it accordingly /
431
432	/ we need to access the next 4 bytes (after the final whitespace /
433	/ following the `eexec' keyword); if they all are hexadecimal /
434	/ digits, then we have a case of ASCII storage /
435
436	if ( cur + `3` < limit &&
437	ft_isxdigit( cur[`0`] ) && ft_isxdigit( cur[`1`] ) &&
438	ft_isxdigit( cur[`2`] ) && ft_isxdigit( cur[`3`] ) )
439	{
440	/ ASCII hexadecimal encoding /
441	FT_ULong len;
442
443
444	parser->root.cursor = cur;
445	(void)psaux->ps_parser_funcs->to_bytes( &parser->root,
446	parser->private_dict,
447	parser->private_len,
448	&len,
449	`0` );
450	parser->private_len = len;
451
452	/ put a safeguard /
453	parser->private_dict[len] = `'\0'`;
454	}
455	else
456	/ binary encoding -- copy the private dict /
457	FT_MEM_MOVE( parser->private_dict, cur, size );
458	}
459
460	/ we now decrypt the encoded binary private dictionary /
461	psaux->t1_decrypt( parser->private_dict, parser->private_len, `55665U` );
462
463	if ( parser->private_len < `4` )
464	{
465	FT_ERROR(( "T1_Get_Private_Dict:"
466	" invalid private dictionary section\n" ));
467	error = FT_THROW( Invalid_File_Format );
468	goto Fail;
469	}
470
471	/ replace the four random bytes at the beginning with whitespace /
472	parser->private_dict[`0`] = `' '`;
473	parser->private_dict[`1`] = `' '`;
474	parser->private_dict[`2`] = `' '`;
475	parser->private_dict[`3`] = `' '`;
476
477	parser->root.base = parser->private_dict;
478	parser->root.cursor = parser->private_dict;
479	parser->root.limit = parser->root.cursor + parser->private_len;
480
481	Fail:
482	Exit:
483	return error;
484	}
485
486
487	/* END */
488

Browse the source code of Godot/thirdparty/freetype/src/type1/t1parse.c