jcsample.c source code [tensorflow/external/libjpeg_turbo/jcsample.c]

1	/*
2	* jcsample.c
3	*
4	* This file was part of the Independent JPEG Group's software:
5	* Copyright (C) 1991-1996, Thomas G. Lane.
6	* libjpeg-turbo Modifications:
7	* Copyright 2009 Pierre Ossman <[email protected]> for Cendio AB
8	* Copyright (C) 2014, MIPS Technologies, Inc., California.
9	* Copyright (C) 2015, 2019, D. R. Commander.
10	* For conditions of distribution and use, see the accompanying README.ijg
11	* file.
12	*
13	* This file contains downsampling routines.
14	*
15	* Downsampling input data is counted in "row groups". A row group
16	* is defined to be max_v_samp_factor pixel rows of each component,
17	* from which the downsampler produces v_samp_factor sample rows.
18	* A single row group is processed in each call to the downsampler module.
19	*
20	* The downsampler is responsible for edge-expansion of its output data
21	* to fill an integral number of DCT blocks horizontally. The source buffer
22	* may be modified if it is helpful for this purpose (the source buffer is
23	* allocated wide enough to correspond to the desired output width).
24	* The caller (the prep controller) is responsible for vertical padding.
25	*
26	* The downsampler may request "context rows" by setting need_context_rows
27	* during startup. In this case, the input arrays will contain at least
28	* one row group's worth of pixels above and below the passed-in data;
29	* the caller will create dummy rows at image top and bottom by replicating
30	* the first or last real pixel row.
31	*
32	* An excellent reference for image resampling is
33	* Digital Image Warping, George Wolberg, 1990.
34	* Pub. by IEEE Computer Society Press, Los Alamitos, CA. ISBN 0-8186-8944-7.
35	*
36	* The downsampling algorithm used here is a simple average of the source
37	* pixels covered by the output pixel. The hi-falutin sampling literature
38	* refers to this as a "box filter". In general the characteristics of a box
39	* filter are not very good, but for the specific cases we normally use (1:1
40	* and 2:1 ratios) the box is equivalent to a "triangle filter" which is not
41	* nearly so bad. If you intend to use other sampling ratios, you'd be well
42	* advised to improve this code.
43	*
44	* A simple input-smoothing capability is provided. This is mainly intended
45	* for cleaning up color-dithered GIF input files (if you find it inadequate,
46	* we suggest using an external filtering program such as pnmconvol). When
47	* enabled, each input pixel P is replaced by a weighted sum of itself and its
48	* eight neighbors. P's weight is 1-8*SF and each neighbor's weight is SF,
49	* where SF = (smoothing_factor / 1024).
50	* Currently, smoothing is only supported for 2h2v sampling factors.
51	*/
52
53	#define JPEG_INTERNALS
54	#include "jinclude.h"
55	#include "jpeglib.h"
56	#include "jsimd.h"
57
58
59	/ Pointer to routine to downsample a single component /
60	typedef void (*downsample1_ptr) (j_compress_ptr cinfo,
61	jpeg_component_info *compptr,
62	JSAMPARRAY input_data,
63	JSAMPARRAY output_data);
64
65	/ Private subobject /
66
67	typedef struct {
68	struct jpeg_downsampler pub; / public fields /
69
70	/ Downsampling method pointers, one per component /
71	downsample1_ptr methods[MAX_COMPONENTS];
72	} my_downsampler;
73
74	typedef my_downsampler *my_downsample_ptr;
75
76
77	/*
78	* Initialize for a downsampling pass.
79	*/
80
81	METHODDEF(void)
82	start_pass_downsample(j_compress_ptr cinfo)
83	{
84	/ no work for now /
85	}
86
87
88	/*
89	* Expand a component horizontally from width input_cols to width output_cols,
90	* by duplicating the rightmost samples.
91	*/
92
93	LOCAL(void)
94	expand_right_edge(JSAMPARRAY image_data, int num_rows, JDIMENSION input_cols,
95	JDIMENSION output_cols)
96	{
97	register JSAMPROW ptr;
98	register JSAMPLE pixval;
99	register int count;
100	int row;
101	int numcols = (int)(output_cols - input_cols);
102
103	if (numcols > `0`) {
104	for (row = `0`; row < num_rows; row++) {
105	ptr = image_data[row] + input_cols;
106	pixval = ptr[-`1`];
107	for (count = numcols; count > `0`; count--)
108	*ptr++ = pixval;
109	}
110	}
111	}
112
113
114	/*
115	* Do downsampling for a whole row group (all components).
116	*
117	* In this version we simply downsample each component independently.
118	*/
119
120	METHODDEF(void)
121	sep_downsample(j_compress_ptr cinfo, JSAMPIMAGE input_buf,
122	JDIMENSION in_row_index, JSAMPIMAGE output_buf,
123	JDIMENSION out_row_group_index)
124	{
125	my_downsample_ptr downsample = (my_downsample_ptr)cinfo->downsample;
126	int ci;
127	jpeg_component_info *compptr;
128	JSAMPARRAY in_ptr, out_ptr;
129
130	for (ci = `0`, compptr = cinfo->comp_info; ci < cinfo->num_components;
131	ci++, compptr++) {
132	in_ptr = input_buf[ci] + in_row_index;
133	out_ptr = output_buf[ci] + (out_row_group_index * compptr->v_samp_factor);
134	(*downsample->methods[ci]) (cinfo, compptr, in_ptr, out_ptr);
135	}
136	}
137
138
139	/*
140	* Downsample pixel values of a single component.
141	* One row group is processed per call.
142	* This version handles arbitrary integral sampling ratios, without smoothing.
143	* Note that this version is not actually used for customary sampling ratios.
144	*/
145
146	METHODDEF(void)
147	int_downsample(j_compress_ptr cinfo, jpeg_component_info *compptr,
148	JSAMPARRAY input_data, JSAMPARRAY output_data)
149	{
150	int inrow, outrow, h_expand, v_expand, numpix, numpix2, h, v;
151	JDIMENSION outcol, outcol_h; / outcol_h == outcolh_expand /*
152	JDIMENSION output_cols = compptr->width_in_blocks * DCTSIZE;
153	JSAMPROW inptr, outptr;
154	JLONG outvalue;
155
156	h_expand = cinfo->max_h_samp_factor / compptr->h_samp_factor;
157	v_expand = cinfo->max_v_samp_factor / compptr->v_samp_factor;
158	numpix = h_expand * v_expand;
159	numpix2 = numpix / `2`;
160
161	/ Expand input data enough to let all the output samples be generated*
162	* by the standard loop. Special-casing padded output would be more
163	* efficient.
164	*/
165	expand_right_edge(input_data, cinfo->max_v_samp_factor, cinfo->image_width,
166	output_cols * h_expand);
167
168	inrow = `0`;
169	for (outrow = `0`; outrow < compptr->v_samp_factor; outrow++) {
170	outptr = output_data[outrow];
171	for (outcol = `0`, outcol_h = `0`; outcol < output_cols;
172	outcol++, outcol_h += h_expand) {
173	outvalue = `0`;
174	for (v = `0`; v < v_expand; v++) {
175	inptr = input_data[inrow + v] + outcol_h;
176	for (h = `0`; h < h_expand; h++) {
177	outvalue += (JLONG)(*inptr++);
178	}
179	}
180	*outptr++ = (JSAMPLE)((outvalue + numpix2) / numpix);
181	}
182	inrow += v_expand;
183	}
184	}
185
186
187	/*
188	* Downsample pixel values of a single component.
189	* This version handles the special case of a full-size component,
190	* without smoothing.
191	*/
192
193	METHODDEF(void)
194	fullsize_downsample(j_compress_ptr cinfo, jpeg_component_info *compptr,
195	JSAMPARRAY input_data, JSAMPARRAY output_data)
196	{
197	/ Copy the data /
198	jcopy_sample_rows(input_data, `0`, output_data, `0`, cinfo->max_v_samp_factor,
199	cinfo->image_width);
200	/ Edge-expand /
201	expand_right_edge(output_data, cinfo->max_v_samp_factor, cinfo->image_width,
202	compptr->width_in_blocks * DCTSIZE);
203	}
204
205
206	/*
207	* Downsample pixel values of a single component.
208	* This version handles the common case of 2:1 horizontal and 1:1 vertical,
209	* without smoothing.
210	*
211	* A note about the "bias" calculations: when rounding fractional values to
212	* integer, we do not want to always round 0.5 up to the next integer.
213	* If we did that, we'd introduce a noticeable bias towards larger values.
214	* Instead, this code is arranged so that 0.5 will be rounded up or down at
215	* alternate pixel locations (a simple ordered dither pattern).
216	*/
217
218	METHODDEF(void)
219	h2v1_downsample(j_compress_ptr cinfo, jpeg_component_info *compptr,
220	JSAMPARRAY input_data, JSAMPARRAY output_data)
221	{
222	int outrow;
223	JDIMENSION outcol;
224	JDIMENSION output_cols = compptr->width_in_blocks * DCTSIZE;
225	register JSAMPROW inptr, outptr;
226	register int bias;
227
228	/ Expand input data enough to let all the output samples be generated*
229	* by the standard loop. Special-casing padded output would be more
230	* efficient.
231	*/
232	expand_right_edge(input_data, cinfo->max_v_samp_factor, cinfo->image_width,
233	output_cols * `2`);
234
235	for (outrow = `0`; outrow < compptr->v_samp_factor; outrow++) {
236	outptr = output_data[outrow];
237	inptr = input_data[outrow];
238	bias = `0`; / bias = 0,1,0,1,... for successive samples /
239	for (outcol = `0`; outcol < output_cols; outcol++) {
240	*outptr++ = (JSAMPLE)((inptr[`0`] + inptr[`1`] + bias) >> `1`);
241	bias ^= `1`; / 0=>1, 1=>0 /
242	inptr += `2`;
243	}
244	}
245	}
246
247
248	/*
249	* Downsample pixel values of a single component.
250	* This version handles the standard case of 2:1 horizontal and 2:1 vertical,
251	* without smoothing.
252	*/
253
254	METHODDEF(void)
255	h2v2_downsample(j_compress_ptr cinfo, jpeg_component_info *compptr,
256	JSAMPARRAY input_data, JSAMPARRAY output_data)
257	{
258	int inrow, outrow;
259	JDIMENSION outcol;
260	JDIMENSION output_cols = compptr->width_in_blocks * DCTSIZE;
261	register JSAMPROW inptr0, inptr1, outptr;
262	register int bias;
263
264	/ Expand input data enough to let all the output samples be generated*
265	* by the standard loop. Special-casing padded output would be more
266	* efficient.
267	*/
268	expand_right_edge(input_data, cinfo->max_v_samp_factor, cinfo->image_width,
269	output_cols * `2`);
270
271	inrow = `0`;
272	for (outrow = `0`; outrow < compptr->v_samp_factor; outrow++) {
273	outptr = output_data[outrow];
274	inptr0 = input_data[inrow];
275	inptr1 = input_data[inrow + `1`];
276	bias = `1`; / bias = 1,2,1,2,... for successive samples /
277	for (outcol = `0`; outcol < output_cols; outcol++) {
278	*outptr++ =
279	(JSAMPLE)((inptr0[`0`] + inptr0[`1`] + inptr1[`0`] + inptr1[`1`] + bias) >> `2`);
280	bias ^= `3`; / 1=>2, 2=>1 /
281	inptr0 += `2`; inptr1 += `2`;
282	}
283	inrow += `2`;
284	}
285	}
286
287
288	#ifdef INPUT_SMOOTHING_SUPPORTED
289
290	/*
291	* Downsample pixel values of a single component.
292	* This version handles the standard case of 2:1 horizontal and 2:1 vertical,
293	* with smoothing. One row of context is required.
294	*/
295
296	METHODDEF(void)
297	h2v2_smooth_downsample(j_compress_ptr cinfo, jpeg_component_info *compptr,
298	JSAMPARRAY input_data, JSAMPARRAY output_data)
299	{
300	int inrow, outrow;
301	JDIMENSION colctr;
302	JDIMENSION output_cols = compptr->width_in_blocks * DCTSIZE;
303	register JSAMPROW inptr0, inptr1, above_ptr, below_ptr, outptr;
304	JLONG membersum, neighsum, memberscale, neighscale;
305
306	/ Expand input data enough to let all the output samples be generated*
307	* by the standard loop. Special-casing padded output would be more
308	* efficient.
309	*/
310	expand_right_edge(input_data - `1`, cinfo->max_v_samp_factor + `2`,
311	cinfo->image_width, output_cols * `2`);
312
313	/ We don't bother to form the individual "smoothed" input pixel values;*
314	* we can directly compute the output which is the average of the four
315	* smoothed values. Each of the four member pixels contributes a fraction
316	* (1-8*SF) to its own smoothed image and a fraction SF to each of the three
317	* other smoothed pixels, therefore a total fraction (1-5*SF)/4 to the final
318	* output. The four corner-adjacent neighbor pixels contribute a fraction
319	* SF to just one smoothed pixel, or SF/4 to the final output; while the
320	* eight edge-adjacent neighbors contribute SF to each of two smoothed
321	* pixels, or SF/2 overall. In order to use integer arithmetic, these
322	* factors are scaled by 2^16 = 65536.
323	* Also recall that SF = smoothing_factor / 1024.
324	*/
325
326	memberscale = `16384` - cinfo->smoothing_factor * `80`; / scaled (1-5SF)/4 /*
327	neighscale = cinfo->smoothing_factor * `16`; / scaled SF/4 /
328
329	inrow = `0`;
330	for (outrow = `0`; outrow < compptr->v_samp_factor; outrow++) {
331	outptr = output_data[outrow];
332	inptr0 = input_data[inrow];
333	inptr1 = input_data[inrow + `1`];
334	above_ptr = input_data[inrow - `1`];
335	below_ptr = input_data[inrow + `2`];
336
337	/ Special case for first column: pretend column -1 is same as column 0 /
338	membersum = inptr0[`0`] + inptr0[`1`] + inptr1[`0`] + inptr1[`1`];
339	neighsum = above_ptr[`0`] + above_ptr[`1`] + below_ptr[`0`] + below_ptr[`1`] +
340	inptr0[`0`] + inptr0[`2`] + inptr1[`0`] + inptr1[`2`];
341	neighsum += neighsum;
342	neighsum += above_ptr[`0`] + above_ptr[`2`] + below_ptr[`0`] + below_ptr[`2`];
343	membersum = membersum * memberscale + neighsum * neighscale;
344	*outptr++ = (JSAMPLE)((membersum + `32768`) >> `16`);
345	inptr0 += `2`; inptr1 += `2`; above_ptr += `2`; below_ptr += `2`;
346
347	for (colctr = output_cols - `2`; colctr > `0`; colctr--) {
348	/ sum of pixels directly mapped to this output element /
349	membersum = inptr0[`0`] + inptr0[`1`] + inptr1[`0`] + inptr1[`1`];
350	/ sum of edge-neighbor pixels /
351	neighsum = above_ptr[`0`] + above_ptr[`1`] + below_ptr[`0`] + below_ptr[`1`] +
352	inptr0[-`1`] + inptr0[`2`] + inptr1[-`1`] + inptr1[`2`];
353	/ The edge-neighbors count twice as much as corner-neighbors /
354	neighsum += neighsum;
355	/ Add in the corner-neighbors /
356	neighsum += above_ptr[-`1`] + above_ptr[`2`] + below_ptr[-`1`] + below_ptr[`2`];
357	/ form final output scaled up by 2^16 /
358	membersum = membersum * memberscale + neighsum * neighscale;
359	/ round, descale and output it /
360	*outptr++ = (JSAMPLE)((membersum + `32768`) >> `16`);
361	inptr0 += `2`; inptr1 += `2`; above_ptr += `2`; below_ptr += `2`;
362	}
363
364	/ Special case for last column /
365	membersum = inptr0[`0`] + inptr0[`1`] + inptr1[`0`] + inptr1[`1`];
366	neighsum = above_ptr[`0`] + above_ptr[`1`] + below_ptr[`0`] + below_ptr[`1`] +
367	inptr0[-`1`] + inptr0[`1`] + inptr1[-`1`] + inptr1[`1`];
368	neighsum += neighsum;
369	neighsum += above_ptr[-`1`] + above_ptr[`1`] + below_ptr[-`1`] + below_ptr[`1`];
370	membersum = membersum * memberscale + neighsum * neighscale;
371	*outptr = (JSAMPLE)((membersum + `32768`) >> `16`);
372
373	inrow += `2`;
374	}
375	}
376
377
378	/*
379	* Downsample pixel values of a single component.
380	* This version handles the special case of a full-size component,
381	* with smoothing. One row of context is required.
382	*/
383
384	METHODDEF(void)
385	fullsize_smooth_downsample(j_compress_ptr cinfo, jpeg_component_info *compptr,
386	JSAMPARRAY input_data, JSAMPARRAY output_data)
387	{
388	int outrow;
389	JDIMENSION colctr;
390	JDIMENSION output_cols = compptr->width_in_blocks * DCTSIZE;
391	register JSAMPROW inptr, above_ptr, below_ptr, outptr;
392	JLONG membersum, neighsum, memberscale, neighscale;
393	int colsum, lastcolsum, nextcolsum;
394
395	/ Expand input data enough to let all the output samples be generated*
396	* by the standard loop. Special-casing padded output would be more
397	* efficient.
398	*/
399	expand_right_edge(input_data - `1`, cinfo->max_v_samp_factor + `2`,
400	cinfo->image_width, output_cols);
401
402	/ Each of the eight neighbor pixels contributes a fraction SF to the*
403	* smoothed pixel, while the main pixel contributes (1-8*SF). In order
404	* to use integer arithmetic, these factors are multiplied by 2^16 = 65536.
405	* Also recall that SF = smoothing_factor / 1024.
406	*/
407
408	memberscale = `65536L` - cinfo->smoothing_factor * `512L`; / scaled 1-8SF /*
409	neighscale = cinfo->smoothing_factor * `64`; / scaled SF /
410
411	for (outrow = `0`; outrow < compptr->v_samp_factor; outrow++) {
412	outptr = output_data[outrow];
413	inptr = input_data[outrow];
414	above_ptr = input_data[outrow - `1`];
415	below_ptr = input_data[outrow + `1`];
416
417	/ Special case for first column /
418	colsum = (above_ptr++) + (below_ptr++) + inptr[`0`];
419	membersum = *inptr++;
420	nextcolsum = above_ptr[`0`] + below_ptr[`0`] + inptr[`0`];
421	neighsum = colsum + (colsum - membersum) + nextcolsum;
422	membersum = membersum * memberscale + neighsum * neighscale;
423	*outptr++ = (JSAMPLE)((membersum + `32768`) >> `16`);
424	lastcolsum = colsum; colsum = nextcolsum;
425
426	for (colctr = output_cols - `2`; colctr > `0`; colctr--) {
427	membersum = *inptr++;
428	above_ptr++; below_ptr++;
429	nextcolsum = above_ptr[`0`] + below_ptr[`0`] + inptr[`0`];
430	neighsum = lastcolsum + (colsum - membersum) + nextcolsum;
431	membersum = membersum * memberscale + neighsum * neighscale;
432	*outptr++ = (JSAMPLE)((membersum + `32768`) >> `16`);
433	lastcolsum = colsum; colsum = nextcolsum;
434	}
435
436	/ Special case for last column /
437	membersum = *inptr;
438	neighsum = lastcolsum + (colsum - membersum) + colsum;
439	membersum = membersum * memberscale + neighsum * neighscale;
440	*outptr = (JSAMPLE)((membersum + `32768`) >> `16`);
441
442	}
443	}
444
445	#endif /* INPUT_SMOOTHING_SUPPORTED */
446
447
448	/*
449	* Module initialization routine for downsampling.
450	* Note that we must select a routine for each component.
451	*/
452
453	GLOBAL(void)
454	jinit_downsampler(j_compress_ptr cinfo)
455	{
456	my_downsample_ptr downsample;
457	int ci;
458	jpeg_component_info *compptr;
459	boolean smoothok = TRUE;
460
461	downsample = (my_downsample_ptr)
462	(*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
463	sizeof(my_downsampler));
464	cinfo->downsample = (struct jpeg_downsampler *)downsample;
465	downsample->pub.start_pass = start_pass_downsample;
466	downsample->pub.downsample = sep_downsample;
467	downsample->pub.need_context_rows = FALSE;
468
469	if (cinfo->CCIR601_sampling)
470	ERREXIT(cinfo, JERR_CCIR601_NOTIMPL);
471
472	/ Verify we can handle the sampling factors, and set up method pointers /
473	for (ci = `0`, compptr = cinfo->comp_info; ci < cinfo->num_components;
474	ci++, compptr++) {
475	if (compptr->h_samp_factor == cinfo->max_h_samp_factor &&
476	compptr->v_samp_factor == cinfo->max_v_samp_factor) {
477	#ifdef INPUT_SMOOTHING_SUPPORTED
478	if (cinfo->smoothing_factor) {
479	downsample->methods[ci] = fullsize_smooth_downsample;
480	downsample->pub.need_context_rows = TRUE;
481	} else
482	#endif
483	downsample->methods[ci] = fullsize_downsample;
484	} else if (compptr->h_samp_factor * `2` == cinfo->max_h_samp_factor &&
485	compptr->v_samp_factor == cinfo->max_v_samp_factor) {
486	smoothok = FALSE;
487	if (jsimd_can_h2v1_downsample())
488	downsample->methods[ci] = jsimd_h2v1_downsample;
489	else
490	downsample->methods[ci] = h2v1_downsample;
491	} else if (compptr->h_samp_factor * `2` == cinfo->max_h_samp_factor &&
492	compptr->v_samp_factor * `2` == cinfo->max_v_samp_factor) {
493	#ifdef INPUT_SMOOTHING_SUPPORTED
494	if (cinfo->smoothing_factor) {
495	#if defined(__mips__)
496	if (jsimd_can_h2v2_smooth_downsample())
497	downsample->methods[ci] = jsimd_h2v2_smooth_downsample;
498	else
499	#endif
500	downsample->methods[ci] = h2v2_smooth_downsample;
501	downsample->pub.need_context_rows = TRUE;
502	} else
503	#endif
504	{
505	if (jsimd_can_h2v2_downsample())
506	downsample->methods[ci] = jsimd_h2v2_downsample;
507	else
508	downsample->methods[ci] = h2v2_downsample;
509	}
510	} else if ((cinfo->max_h_samp_factor % compptr->h_samp_factor) == `0` &&
511	(cinfo->max_v_samp_factor % compptr->v_samp_factor) == `0`) {
512	smoothok = FALSE;
513	downsample->methods[ci] = int_downsample;
514	} else
515	ERREXIT(cinfo, JERR_FRACT_SAMPLE_NOTIMPL);
516	}
517
518	#ifdef INPUT_SMOOTHING_SUPPORTED
519	if (cinfo->smoothing_factor && !smoothok)
520	TRACEMS(cinfo, `0`, JTRC_SMOOTH_NOTIMPL);
521	#endif
522	}
523

Browse the source code of tensorflow/external/libjpeg_turbo/jcsample.c