xref: /PHP-7.2/ext/standard/iptc.c (revision 7a7ec01a)
1 /*
2    +----------------------------------------------------------------------+
3    | PHP Version 7                                                        |
4    +----------------------------------------------------------------------+
5    | Copyright (c) 1997-2018 The PHP Group                                |
6    +----------------------------------------------------------------------+
7    | This source file is subject to version 3.01 of the PHP license,      |
8    | that is bundled with this package in the file LICENSE, and is        |
9    | available through the world-wide-web at the following url:           |
10    | http://www.php.net/license/3_01.txt                                  |
11    | If you did not receive a copy of the PHP license and are unable to   |
12    | obtain it through the world-wide-web, please send a note to          |
13    | license@php.net so we can mail you a copy immediately.               |
14    +----------------------------------------------------------------------+
15    | Author: Thies C. Arntzen <thies@thieso.net>                          |
16    +----------------------------------------------------------------------+
17  */
18 
19 /* $Id$ */
20 
21 /*
22  * Functions to parse & compose IPTC data.
23  * PhotoShop >= 3.0 can read and write textual data to JPEG files.
24  * ... more to come .....
25  *
26  * I know, parts of this are now duplicated in image.c,
27  * but in this case I think it's okay!
28  */
29 
30 /*
31  * TODO:
32  *  - add IPTC translation table
33  */
34 
35 #include "php.h"
36 #include "php_iptc.h"
37 #include "ext/standard/head.h"
38 
39 #include <sys/stat.h>
40 
41 #ifdef PHP_WIN32
42 # include "win32/php_stdint.h"
43 #else
44 # if HAVE_INTTYPES_H
45 #  include <inttypes.h>
46 # elif HAVE_STDINT_H
47 #  include <stdint.h>
48 # endif
49 #endif
50 
/*
 * JPEG marker codes: the value of the byte that follows the 0xFF prefix
 * of a marker.
 */

/* Start Of Frame N -- N indicates which compression process.
 * Only SOF0-SOF2 are now in common use.
 * NB: codes C4 and CC are NOT SOF markers. */
#define M_SOF0  0xC0
#define M_SOF1  0xC1
#define M_SOF2  0xC2
#define M_SOF3  0xC3
#define M_SOF5  0xC5
#define M_SOF6  0xC6
#define M_SOF7  0xC7
#define M_SOF9  0xC9
#define M_SOF10 0xCA
#define M_SOF11 0xCB
#define M_SOF13 0xCD
#define M_SOF14 0xCE
#define M_SOF15 0xCF

/* Stream delimiters */
#define M_SOI   0xD8
#define M_EOI   0xD9            /* End Of Image (end of datastream) */
#define M_SOS   0xDA            /* Start Of Scan (begins compressed data) */

/* Application segments APP0..APP15 */
#define M_APP0  0xE0
#define M_APP1  0xE1
#define M_APP2  0xE2
#define M_APP3  0xE3
#define M_APP4  0xE4
#define M_APP5  0xE5
#define M_APP6  0xE6
#define M_APP7  0xE7
#define M_APP8  0xE8
#define M_APP9  0xE9
#define M_APP10 0xEA
#define M_APP11 0xEB
#define M_APP12 0xEC
#define M_APP13 0xED
#define M_APP14 0xEE
#define M_APP15 0xEF
84 
/* {{{ php_iptc_put1
 * Emit a single byte.
 *
 * When spool is positive the byte is handed to PUTC(); when spoolbuf is
 * non-NULL the byte is also stored at *spoolbuf and the cursor is advanced
 * by one. fp is not referenced directly by this function.
 *
 * Returns the byte that was emitted.
 */
static int php_iptc_put1(FILE *fp, int spool, unsigned char c, unsigned char **spoolbuf)
{
	if (spool > 0) {
		PUTC(c);
	}

	if (spoolbuf != NULL) {
		**spoolbuf = c;
		++*spoolbuf;
	}

	return c;
}
/* }}} */
97 
/* {{{ php_iptc_get1
 * Read a single byte from fp.
 *
 * On success the byte is passed to PUTC() when spool is positive and, when
 * spoolbuf is non-NULL, appended at *spoolbuf (advancing the cursor).
 * Nothing is emitted or stored when the read hits end of file.
 *
 * Returns the byte read, or EOF.
 */
static int php_iptc_get1(FILE *fp, int spool, unsigned char **spoolbuf)
{
	int byte = getc(fp);

	if (byte == EOF) {
		return EOF;
	}

	if (spool > 0) {
		/* PUTC() is given a char-typed copy of the byte */
		char out = byte;
		PUTC(out);
	}

	if (spoolbuf != NULL) {
		**spoolbuf = byte;
		++*spoolbuf;
	}

	return byte;
}
/* }}} */
119 
120 /* {{{ php_iptc_read_remaining
121  */
php_iptc_read_remaining(FILE * fp,int spool,unsigned char ** spoolbuf)122 static int php_iptc_read_remaining(FILE *fp, int spool, unsigned char **spoolbuf)
123 {
124   	while (php_iptc_get1(fp, spool, spoolbuf) != EOF) continue;
125 
126 	return M_EOI;
127 }
128 /* }}} */
129 
130 /* {{{ php_iptc_skip_variable
131  */
php_iptc_skip_variable(FILE * fp,int spool,unsigned char ** spoolbuf)132 static int php_iptc_skip_variable(FILE *fp, int spool, unsigned char **spoolbuf)
133 {
134 	unsigned int  length;
135 	int c1, c2;
136 
137     if ((c1 = php_iptc_get1(fp, spool, spoolbuf)) == EOF) return M_EOI;
138 
139     if ((c2 = php_iptc_get1(fp, spool, spoolbuf)) == EOF) return M_EOI;
140 
141 	length = (((unsigned char) c1) << 8) + ((unsigned char) c2);
142 
143 	length -= 2;
144 
145 	while (length--)
146 		if (php_iptc_get1(fp, spool, spoolbuf) == EOF) return M_EOI;
147 
148 	return 0;
149 }
150 /* }}} */
151 
152 /* {{{ php_iptc_next_marker
153  */
php_iptc_next_marker(FILE * fp,int spool,unsigned char ** spoolbuf)154 static int php_iptc_next_marker(FILE *fp, int spool, unsigned char **spoolbuf)
155 {
156     int c;
157 
158     /* skip unimportant stuff */
159 
160     c = php_iptc_get1(fp, spool, spoolbuf);
161 
162 	if (c == EOF) return M_EOI;
163 
164     while (c != 0xff) {
165         if ((c = php_iptc_get1(fp, spool, spoolbuf)) == EOF)
166             return M_EOI; /* we hit EOF */
167     }
168 
169     /* get marker byte, swallowing possible padding */
170     do {
171         c = php_iptc_get1(fp, 0, 0);
172 		if (c == EOF)
173             return M_EOI;       /* we hit EOF */
174 		else
175 		if (c == 0xff)
176 			php_iptc_put1(fp, spool, (unsigned char)c, spoolbuf);
177     } while (c == 0xff);
178 
179     return (unsigned int) c;
180 }
181 /* }}} */
182 
183 static char psheader[] = "\xFF\xED\0\0Photoshop 3.0\08BIM\x04\x04\0\0\0\0";
184 
185 /* {{{ proto array iptcembed(string iptcdata, string jpeg_file_name [, int spool])
186    Embed binary IPTC data into a JPEG image. */
PHP_FUNCTION(iptcembed)187 PHP_FUNCTION(iptcembed)
188 {
189 	char *iptcdata, *jpeg_file;
190 	size_t iptcdata_len, jpeg_file_len;
191 	zend_long spool = 0;
192 	FILE *fp;
193 	unsigned int marker, done = 0;
194 	size_t inx;
195 	zend_string *spoolbuf = NULL;
196 	unsigned char *poi = NULL;
197 	zend_stat_t sb;
198 	zend_bool written = 0;
199 
200 	ZEND_PARSE_PARAMETERS_START(2, 3)
201 		Z_PARAM_STRING(iptcdata, iptcdata_len)
202 		Z_PARAM_PATH(jpeg_file, jpeg_file_len)
203 		Z_PARAM_OPTIONAL
204 		Z_PARAM_LONG(spool)
205 	ZEND_PARSE_PARAMETERS_END();
206 
207 	if (php_check_open_basedir(jpeg_file)) {
208 		RETURN_FALSE;
209 	}
210 
211 	if (iptcdata_len >= SIZE_MAX - sizeof(psheader) - 1025) {
212 		php_error_docref(NULL, E_WARNING, "IPTC data too large");
213 		RETURN_FALSE;
214 	}
215 
216 	if ((fp = VCWD_FOPEN(jpeg_file, "rb")) == 0) {
217 		php_error_docref(NULL, E_WARNING, "Unable to open %s", jpeg_file);
218 		RETURN_FALSE;
219 	}
220 
221 	if (spool < 2) {
222 		zend_fstat(fileno(fp), &sb);
223 
224 		spoolbuf = zend_string_safe_alloc(1, iptcdata_len + sizeof(psheader) + 1024 + 1, sb.st_size, 0);
225 		poi = (unsigned char*)ZSTR_VAL(spoolbuf);
226 		memset(poi, 0, iptcdata_len + sizeof(psheader) + sb.st_size + 1024 + 1);
227 	}
228 
229 	if (php_iptc_get1(fp, spool, poi?&poi:0) != 0xFF) {
230 		fclose(fp);
231 		if (spoolbuf) {
232 			zend_string_free(spoolbuf);
233 		}
234 		RETURN_FALSE;
235 	}
236 
237 	if (php_iptc_get1(fp, spool, poi?&poi:0) != 0xD8) {
238 		fclose(fp);
239 		if (spoolbuf) {
240 			zend_string_free(spoolbuf);
241 		}
242 		RETURN_FALSE;
243 	}
244 
245 	while (!done) {
246 		marker = php_iptc_next_marker(fp, spool, poi?&poi:0);
247 
248 		if (marker == M_EOI) { /* EOF */
249 			break;
250 		} else if (marker != M_APP13) {
251 			php_iptc_put1(fp, spool, (unsigned char)marker, poi?&poi:0);
252 		}
253 
254 		switch (marker) {
255 			case M_APP13:
256 				/* we are going to write a new APP13 marker, so don't output the old one */
257 				php_iptc_skip_variable(fp, 0, 0);
258 				fgetc(fp); /* skip already copied 0xFF byte */
259 				php_iptc_read_remaining(fp, spool, poi?&poi:0);
260 				done = 1;
261 				break;
262 
263 			case M_APP0:
264 				/* APP0 is in each and every JPEG, so when we hit APP0 we insert our new APP13! */
265 			case M_APP1:
266 				if (written) {
267 					/* don't try to write the data twice */
268 					break;
269 				}
270 				written = 1;
271 
272 				php_iptc_skip_variable(fp, spool, poi?&poi:0);
273 
274 				if (iptcdata_len & 1) {
275 					iptcdata_len++; /* make the length even */
276 				}
277 
278 				psheader[ 2 ] = (iptcdata_len+28)>>8;
279 				psheader[ 3 ] = (iptcdata_len+28)&0xff;
280 
281 				for (inx = 0; inx < 28; inx++) {
282 					php_iptc_put1(fp, spool, psheader[inx], poi?&poi:0);
283 				}
284 
285 				php_iptc_put1(fp, spool, (unsigned char)(iptcdata_len>>8), poi?&poi:0);
286 				php_iptc_put1(fp, spool, (unsigned char)(iptcdata_len&0xff), poi?&poi:0);
287 
288 				for (inx = 0; inx < iptcdata_len; inx++) {
289 					php_iptc_put1(fp, spool, iptcdata[inx], poi?&poi:0);
290 				}
291 				break;
292 
293 			case M_SOS:
294 				/* we hit data, no more marker-inserting can be done! */
295 				php_iptc_read_remaining(fp, spool, poi?&poi:0);
296 				done = 1;
297 				break;
298 
299 			default:
300 				php_iptc_skip_variable(fp, spool, poi?&poi:0);
301 				break;
302 		}
303 	}
304 
305 	fclose(fp);
306 
307 	if (spool < 2) {
308 		spoolbuf = zend_string_truncate(spoolbuf, poi - (unsigned char*)ZSTR_VAL(spoolbuf), 0);
309 		RETURN_NEW_STR(spoolbuf);
310 	} else {
311 		RETURN_TRUE;
312 	}
313 }
314 /* }}} */
315 
316 /* {{{ proto array iptcparse(string iptcdata)
317    Parse binary IPTC-data into associative array */
PHP_FUNCTION(iptcparse)318 PHP_FUNCTION(iptcparse)
319 {
320 	size_t inx = 0, len;
321 	unsigned int tagsfound = 0;
322 	unsigned char *buffer, recnum, dataset;
323 	char *str, key[16];
324 	size_t str_len;
325 	zval values, *element;
326 
327 	ZEND_PARSE_PARAMETERS_START(1, 1)
328 		Z_PARAM_STRING(str, str_len)
329 	ZEND_PARSE_PARAMETERS_END();
330 
331 	buffer = (unsigned char *)str;
332 
333 	while (inx < str_len) { /* find 1st tag */
334 		if ((buffer[inx] == 0x1c) && ((buffer[inx+1] == 0x01) || (buffer[inx+1] == 0x02))){
335 			break;
336 		} else {
337 			inx++;
338 		}
339 	}
340 
341 	while (inx < str_len) {
342 		if (buffer[ inx++ ] != 0x1c) {
343 			break;   /* we ran against some data which does not conform to IPTC - stop parsing! */
344 		}
345 
346 		if ((inx + 4) >= str_len)
347 			break;
348 
349 		dataset = buffer[ inx++ ];
350 		recnum = buffer[ inx++ ];
351 
352 		if (buffer[ inx ] & (unsigned char) 0x80) { /* long tag */
353 			if((inx+6) >= str_len) {
354 				break;
355 			}
356 			len = (((zend_long) buffer[ inx + 2 ]) << 24) + (((zend_long) buffer[ inx + 3 ]) << 16) +
357 				  (((zend_long) buffer[ inx + 4 ]) <<  8) + (((zend_long) buffer[ inx + 5 ]));
358 			inx += 6;
359 		} else { /* short tag */
360 			len = (((unsigned short) buffer[ inx ])<<8) | (unsigned short)buffer[ inx+1 ];
361 			inx += 2;
362 		}
363 
364 		if ((len > str_len) || (inx + len) > str_len) {
365 			break;
366 		}
367 
368 		snprintf(key, sizeof(key), "%d#%03d", (unsigned int) dataset, (unsigned int) recnum);
369 
370 		if (tagsfound == 0) { /* found the 1st tag - initialize the return array */
371 			array_init(return_value);
372 		}
373 
374 		if ((element = zend_hash_str_find(Z_ARRVAL_P(return_value), key, strlen(key))) == NULL) {
375 			array_init(&values);
376 
377 			element = zend_hash_str_update(Z_ARRVAL_P(return_value), key, strlen(key), &values);
378 		}
379 
380 		add_next_index_stringl(element, (char *) buffer+inx, len);
381 		inx += len;
382 		tagsfound++;
383 	}
384 
385 	if (! tagsfound) {
386 		RETURN_FALSE;
387 	}
388 }
389 /* }}} */
390 
391 /*
392  * Local variables:
393  * tab-width: 4
394  * c-basic-offset: 4
395  * End:
396  * vim600: sw=4 ts=4 fdm=marker
397  * vim<600: sw=4 ts=4
398  */
399