123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721 |
- /*
- * jsimd_arm.c
- *
- * Copyright 2009 Pierre Ossman <ossman@cendio.se> for Cendio AB
- * Copyright (C) 2011, Nokia Corporation and/or its subsidiary(-ies).
- * Copyright (C) 2009-2011, 2013-2014, 2016, 2018, D. R. Commander.
- * Copyright (C) 2015-2016, 2018, Matthieu Darbois.
- * Copyright (C) 2019, Google LLC.
- *
- * Based on the x86 SIMD extension for IJG JPEG library,
- * Copyright (C) 1999-2006, MIYASAKA Masaru.
- * For conditions of distribution and use, see copyright notice in jsimdext.inc
- *
- * This file contains the interface between the "normal" portions
- * of the library and the SIMD implementations when running on a
- * 32-bit ARM architecture.
- */
- #define JPEG_INTERNALS
- #include "../../jinclude.h"
- #include "../../jpeglib.h"
- #include "../../jsimd.h"
- #include "../../jdct.h"
- #include "../../jsimddct.h"
- #include "../jsimd.h"
- #include <stdio.h>
- #include <string.h>
- #include <ctype.h>
- static unsigned int simd_support = ~0;
- static unsigned int simd_huffman = 1;
- #if !defined(__ARM_NEON__) && (defined(__linux__) || defined(ANDROID) || defined(__ANDROID__))
- #define SOMEWHAT_SANE_PROC_CPUINFO_SIZE_LIMIT (1024 * 1024)
- LOCAL(int)
- check_feature(char *buffer, char *feature)
- {
- char *p;
- if (*feature == 0)
- return 0;
- if (strncmp(buffer, "Features", 8) != 0)
- return 0;
- buffer += 8;
- while (isspace(*buffer))
- buffer++;
- /* Check if 'feature' is present in the buffer as a separate word */
- while ((p = strstr(buffer, feature))) {
- if (p > buffer && !isspace(*(p - 1))) {
- buffer++;
- continue;
- }
- p += strlen(feature);
- if (*p != 0 && !isspace(*p)) {
- buffer++;
- continue;
- }
- return 1;
- }
- return 0;
- }
- LOCAL(int)
- parse_proc_cpuinfo(int bufsize)
- {
- char *buffer = (char *)malloc(bufsize);
- FILE *fd;
- simd_support = 0;
- if (!buffer)
- return 0;
- fd = fopen("/proc/cpuinfo", "r");
- if (fd) {
- while (fgets(buffer, bufsize, fd)) {
- if (!strchr(buffer, '\n') && !feof(fd)) {
- /* "impossible" happened - insufficient size of the buffer! */
- fclose(fd);
- free(buffer);
- return 0;
- }
- if (check_feature(buffer, "neon"))
- simd_support |= JSIMD_NEON;
- }
- fclose(fd);
- }
- free(buffer);
- return 1;
- }
- #endif
- /*
- * Check what SIMD accelerations are supported.
- *
- * FIXME: This code is racy under a multi-threaded environment.
- */
- LOCAL(void)
- init_simd(void)
- {
- #ifndef NO_GETENV
- char *env = NULL;
- #endif
- #if !defined(__ARM_NEON__) && (defined(__linux__) || defined(ANDROID) || defined(__ANDROID__))
- int bufsize = 1024; /* an initial guess for the line buffer size limit */
- #endif
- if (simd_support != ~0U)
- return;
- simd_support = 0;
- #if defined(__ARM_NEON__)
- simd_support |= JSIMD_NEON;
- #elif defined(__linux__) || defined(ANDROID) || defined(__ANDROID__)
- /* We still have a chance to use NEON regardless of globally used
- * -mcpu/-mfpu options passed to gcc by performing runtime detection via
- * /proc/cpuinfo parsing on linux/android */
- while (!parse_proc_cpuinfo(bufsize)) {
- bufsize *= 2;
- if (bufsize > SOMEWHAT_SANE_PROC_CPUINFO_SIZE_LIMIT)
- break;
- }
- #endif
- #ifndef NO_GETENV
- /* Force different settings through environment variables */
- env = getenv("JSIMD_FORCENEON");
- if ((env != NULL) && (strcmp(env, "1") == 0))
- simd_support = JSIMD_NEON;
- env = getenv("JSIMD_FORCENONE");
- if ((env != NULL) && (strcmp(env, "1") == 0))
- simd_support = 0;
- env = getenv("JSIMD_NOHUFFENC");
- if ((env != NULL) && (strcmp(env, "1") == 0))
- simd_huffman = 0;
- #endif
- }
- GLOBAL(int)
- jsimd_can_rgb_ycc(void)
- {
- init_simd();
- /* The code is optimised for these values only */
- if (BITS_IN_JSAMPLE != 8)
- return 0;
- if (sizeof(JDIMENSION) != 4)
- return 0;
- if ((RGB_PIXELSIZE != 3) && (RGB_PIXELSIZE != 4))
- return 0;
- if (simd_support & JSIMD_NEON)
- return 1;
- return 0;
- }
- GLOBAL(int)
- jsimd_can_rgb_gray(void)
- {
- return 0;
- }
- GLOBAL(int)
- jsimd_can_ycc_rgb(void)
- {
- init_simd();
- /* The code is optimised for these values only */
- if (BITS_IN_JSAMPLE != 8)
- return 0;
- if (sizeof(JDIMENSION) != 4)
- return 0;
- if ((RGB_PIXELSIZE != 3) && (RGB_PIXELSIZE != 4))
- return 0;
- if (simd_support & JSIMD_NEON)
- return 1;
- return 0;
- }
- GLOBAL(int)
- jsimd_can_ycc_rgb565(void)
- {
- init_simd();
- /* The code is optimised for these values only */
- if (BITS_IN_JSAMPLE != 8)
- return 0;
- if (sizeof(JDIMENSION) != 4)
- return 0;
- if (simd_support & JSIMD_NEON)
- return 1;
- return 0;
- }
- GLOBAL(void)
- jsimd_rgb_ycc_convert(j_compress_ptr cinfo, JSAMPARRAY input_buf,
- JSAMPIMAGE output_buf, JDIMENSION output_row,
- int num_rows)
- {
- void (*neonfct) (JDIMENSION, JSAMPARRAY, JSAMPIMAGE, JDIMENSION, int);
- switch (cinfo->in_color_space) {
- case JCS_EXT_RGB:
- neonfct = jsimd_extrgb_ycc_convert_neon;
- break;
- case JCS_EXT_RGBX:
- case JCS_EXT_RGBA:
- neonfct = jsimd_extrgbx_ycc_convert_neon;
- break;
- case JCS_EXT_BGR:
- neonfct = jsimd_extbgr_ycc_convert_neon;
- break;
- case JCS_EXT_BGRX:
- case JCS_EXT_BGRA:
- neonfct = jsimd_extbgrx_ycc_convert_neon;
- break;
- case JCS_EXT_XBGR:
- case JCS_EXT_ABGR:
- neonfct = jsimd_extxbgr_ycc_convert_neon;
- break;
- case JCS_EXT_XRGB:
- case JCS_EXT_ARGB:
- neonfct = jsimd_extxrgb_ycc_convert_neon;
- break;
- default:
- neonfct = jsimd_extrgb_ycc_convert_neon;
- break;
- }
- neonfct(cinfo->image_width, input_buf, output_buf, output_row, num_rows);
- }
- GLOBAL(void)
- jsimd_rgb_gray_convert(j_compress_ptr cinfo, JSAMPARRAY input_buf,
- JSAMPIMAGE output_buf, JDIMENSION output_row,
- int num_rows)
- {
- }
- GLOBAL(void)
- jsimd_ycc_rgb_convert(j_decompress_ptr cinfo, JSAMPIMAGE input_buf,
- JDIMENSION input_row, JSAMPARRAY output_buf,
- int num_rows)
- {
- void (*neonfct) (JDIMENSION, JSAMPIMAGE, JDIMENSION, JSAMPARRAY, int);
- switch (cinfo->out_color_space) {
- case JCS_EXT_RGB:
- neonfct = jsimd_ycc_extrgb_convert_neon;
- break;
- case JCS_EXT_RGBX:
- case JCS_EXT_RGBA:
- neonfct = jsimd_ycc_extrgbx_convert_neon;
- break;
- case JCS_EXT_BGR:
- neonfct = jsimd_ycc_extbgr_convert_neon;
- break;
- case JCS_EXT_BGRX:
- case JCS_EXT_BGRA:
- neonfct = jsimd_ycc_extbgrx_convert_neon;
- break;
- case JCS_EXT_XBGR:
- case JCS_EXT_ABGR:
- neonfct = jsimd_ycc_extxbgr_convert_neon;
- break;
- case JCS_EXT_XRGB:
- case JCS_EXT_ARGB:
- neonfct = jsimd_ycc_extxrgb_convert_neon;
- break;
- default:
- neonfct = jsimd_ycc_extrgb_convert_neon;
- break;
- }
- neonfct(cinfo->output_width, input_buf, input_row, output_buf, num_rows);
- }
- GLOBAL(void)
- jsimd_ycc_rgb565_convert(j_decompress_ptr cinfo, JSAMPIMAGE input_buf,
- JDIMENSION input_row, JSAMPARRAY output_buf,
- int num_rows)
- {
- jsimd_ycc_rgb565_convert_neon(cinfo->output_width, input_buf, input_row,
- output_buf, num_rows);
- }
- GLOBAL(int)
- jsimd_can_h2v2_downsample(void)
- {
- return 0;
- }
- GLOBAL(int)
- jsimd_can_h2v1_downsample(void)
- {
- return 0;
- }
- GLOBAL(void)
- jsimd_h2v2_downsample(j_compress_ptr cinfo, jpeg_component_info *compptr,
- JSAMPARRAY input_data, JSAMPARRAY output_data)
- {
- }
- GLOBAL(void)
- jsimd_h2v1_downsample(j_compress_ptr cinfo, jpeg_component_info *compptr,
- JSAMPARRAY input_data, JSAMPARRAY output_data)
- {
- }
- GLOBAL(int)
- jsimd_can_h2v2_upsample(void)
- {
- return 0;
- }
- GLOBAL(int)
- jsimd_can_h2v1_upsample(void)
- {
- return 0;
- }
- GLOBAL(void)
- jsimd_h2v2_upsample(j_decompress_ptr cinfo, jpeg_component_info *compptr,
- JSAMPARRAY input_data, JSAMPARRAY *output_data_ptr)
- {
- }
- GLOBAL(void)
- jsimd_h2v1_upsample(j_decompress_ptr cinfo, jpeg_component_info *compptr,
- JSAMPARRAY input_data, JSAMPARRAY *output_data_ptr)
- {
- }
- GLOBAL(int)
- jsimd_can_h2v2_fancy_upsample(void)
- {
- return 0;
- }
- GLOBAL(int)
- jsimd_can_h2v1_fancy_upsample(void)
- {
- init_simd();
- /* The code is optimised for these values only */
- if (BITS_IN_JSAMPLE != 8)
- return 0;
- if (sizeof(JDIMENSION) != 4)
- return 0;
- if (simd_support & JSIMD_NEON)
- return 1;
- return 0;
- }
- GLOBAL(void)
- jsimd_h2v2_fancy_upsample(j_decompress_ptr cinfo, jpeg_component_info *compptr,
- JSAMPARRAY input_data, JSAMPARRAY *output_data_ptr)
- {
- }
- GLOBAL(void)
- jsimd_h2v1_fancy_upsample(j_decompress_ptr cinfo, jpeg_component_info *compptr,
- JSAMPARRAY input_data, JSAMPARRAY *output_data_ptr)
- {
- jsimd_h2v1_fancy_upsample_neon(cinfo->max_v_samp_factor,
- compptr->downsampled_width, input_data,
- output_data_ptr);
- }
- GLOBAL(int)
- jsimd_can_h2v2_merged_upsample(void)
- {
- return 0;
- }
- GLOBAL(int)
- jsimd_can_h2v1_merged_upsample(void)
- {
- return 0;
- }
- GLOBAL(void)
- jsimd_h2v2_merged_upsample(j_decompress_ptr cinfo, JSAMPIMAGE input_buf,
- JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)
- {
- }
- GLOBAL(void)
- jsimd_h2v1_merged_upsample(j_decompress_ptr cinfo, JSAMPIMAGE input_buf,
- JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)
- {
- }
- GLOBAL(int)
- jsimd_can_convsamp(void)
- {
- init_simd();
- /* The code is optimised for these values only */
- if (DCTSIZE != 8)
- return 0;
- if (BITS_IN_JSAMPLE != 8)
- return 0;
- if (sizeof(JDIMENSION) != 4)
- return 0;
- if (sizeof(DCTELEM) != 2)
- return 0;
- if (simd_support & JSIMD_NEON)
- return 1;
- return 0;
- }
- GLOBAL(int)
- jsimd_can_convsamp_float(void)
- {
- return 0;
- }
- GLOBAL(void)
- jsimd_convsamp(JSAMPARRAY sample_data, JDIMENSION start_col,
- DCTELEM *workspace)
- {
- jsimd_convsamp_neon(sample_data, start_col, workspace);
- }
- GLOBAL(void)
- jsimd_convsamp_float(JSAMPARRAY sample_data, JDIMENSION start_col,
- FAST_FLOAT *workspace)
- {
- }
- GLOBAL(int)
- jsimd_can_fdct_islow(void)
- {
- return 0;
- }
- GLOBAL(int)
- jsimd_can_fdct_ifast(void)
- {
- init_simd();
- /* The code is optimised for these values only */
- if (DCTSIZE != 8)
- return 0;
- if (sizeof(DCTELEM) != 2)
- return 0;
- if (simd_support & JSIMD_NEON)
- return 1;
- return 0;
- }
- GLOBAL(int)
- jsimd_can_fdct_float(void)
- {
- return 0;
- }
- GLOBAL(void)
- jsimd_fdct_islow(DCTELEM *data)
- {
- }
- GLOBAL(void)
- jsimd_fdct_ifast(DCTELEM *data)
- {
- jsimd_fdct_ifast_neon(data);
- }
- GLOBAL(void)
- jsimd_fdct_float(FAST_FLOAT *data)
- {
- }
- GLOBAL(int)
- jsimd_can_quantize(void)
- {
- init_simd();
- /* The code is optimised for these values only */
- if (DCTSIZE != 8)
- return 0;
- if (sizeof(JCOEF) != 2)
- return 0;
- if (sizeof(DCTELEM) != 2)
- return 0;
- if (simd_support & JSIMD_NEON)
- return 1;
- return 0;
- }
- GLOBAL(int)
- jsimd_can_quantize_float(void)
- {
- return 0;
- }
- GLOBAL(void)
- jsimd_quantize(JCOEFPTR coef_block, DCTELEM *divisors, DCTELEM *workspace)
- {
- jsimd_quantize_neon(coef_block, divisors, workspace);
- }
- GLOBAL(void)
- jsimd_quantize_float(JCOEFPTR coef_block, FAST_FLOAT *divisors,
- FAST_FLOAT *workspace)
- {
- }
- GLOBAL(int)
- jsimd_can_idct_2x2(void)
- {
- init_simd();
- /* The code is optimised for these values only */
- if (DCTSIZE != 8)
- return 0;
- if (sizeof(JCOEF) != 2)
- return 0;
- if (BITS_IN_JSAMPLE != 8)
- return 0;
- if (sizeof(JDIMENSION) != 4)
- return 0;
- if (sizeof(ISLOW_MULT_TYPE) != 2)
- return 0;
- if (simd_support & JSIMD_NEON)
- return 1;
- return 0;
- }
- GLOBAL(int)
- jsimd_can_idct_4x4(void)
- {
- init_simd();
- /* The code is optimised for these values only */
- if (DCTSIZE != 8)
- return 0;
- if (sizeof(JCOEF) != 2)
- return 0;
- if (BITS_IN_JSAMPLE != 8)
- return 0;
- if (sizeof(JDIMENSION) != 4)
- return 0;
- if (sizeof(ISLOW_MULT_TYPE) != 2)
- return 0;
- if (simd_support & JSIMD_NEON)
- return 1;
- return 0;
- }
- GLOBAL(void)
- jsimd_idct_2x2(j_decompress_ptr cinfo, jpeg_component_info *compptr,
- JCOEFPTR coef_block, JSAMPARRAY output_buf,
- JDIMENSION output_col)
- {
- jsimd_idct_2x2_neon(compptr->dct_table, coef_block, output_buf, output_col);
- }
- GLOBAL(void)
- jsimd_idct_4x4(j_decompress_ptr cinfo, jpeg_component_info *compptr,
- JCOEFPTR coef_block, JSAMPARRAY output_buf,
- JDIMENSION output_col)
- {
- jsimd_idct_4x4_neon(compptr->dct_table, coef_block, output_buf, output_col);
- }
- GLOBAL(int)
- jsimd_can_idct_islow(void)
- {
- init_simd();
- /* The code is optimised for these values only */
- if (DCTSIZE != 8)
- return 0;
- if (sizeof(JCOEF) != 2)
- return 0;
- if (BITS_IN_JSAMPLE != 8)
- return 0;
- if (sizeof(JDIMENSION) != 4)
- return 0;
- if (sizeof(ISLOW_MULT_TYPE) != 2)
- return 0;
- if (simd_support & JSIMD_NEON)
- return 1;
- return 0;
- }
- GLOBAL(int)
- jsimd_can_idct_ifast(void)
- {
- init_simd();
- /* The code is optimised for these values only */
- if (DCTSIZE != 8)
- return 0;
- if (sizeof(JCOEF) != 2)
- return 0;
- if (BITS_IN_JSAMPLE != 8)
- return 0;
- if (sizeof(JDIMENSION) != 4)
- return 0;
- if (sizeof(IFAST_MULT_TYPE) != 2)
- return 0;
- if (IFAST_SCALE_BITS != 2)
- return 0;
- if (simd_support & JSIMD_NEON)
- return 1;
- return 0;
- }
- GLOBAL(int)
- jsimd_can_idct_float(void)
- {
- return 0;
- }
- GLOBAL(void)
- jsimd_idct_islow(j_decompress_ptr cinfo, jpeg_component_info *compptr,
- JCOEFPTR coef_block, JSAMPARRAY output_buf,
- JDIMENSION output_col)
- {
- jsimd_idct_islow_neon(compptr->dct_table, coef_block, output_buf,
- output_col);
- }
- GLOBAL(void)
- jsimd_idct_ifast(j_decompress_ptr cinfo, jpeg_component_info *compptr,
- JCOEFPTR coef_block, JSAMPARRAY output_buf,
- JDIMENSION output_col)
- {
- jsimd_idct_ifast_neon(compptr->dct_table, coef_block, output_buf,
- output_col);
- }
- GLOBAL(void)
- jsimd_idct_float(j_decompress_ptr cinfo, jpeg_component_info *compptr,
- JCOEFPTR coef_block, JSAMPARRAY output_buf,
- JDIMENSION output_col)
- {
- }
- GLOBAL(int)
- jsimd_can_huff_encode_one_block(void)
- {
- init_simd();
- if (DCTSIZE != 8)
- return 0;
- if (sizeof(JCOEF) != 2)
- return 0;
- if (simd_support & JSIMD_NEON && simd_huffman)
- return 1;
- return 0;
- }
- GLOBAL(JOCTET *)
- jsimd_huff_encode_one_block(void *state, JOCTET *buffer, JCOEFPTR block,
- int last_dc_val, c_derived_tbl *dctbl,
- c_derived_tbl *actbl)
- {
- return jsimd_huff_encode_one_block_neon(state, buffer, block, last_dc_val,
- dctbl, actbl);
- }
- GLOBAL(int)
- jsimd_can_encode_mcu_AC_first_prepare(void)
- {
- return 0;
- }
- GLOBAL(void)
- jsimd_encode_mcu_AC_first_prepare(const JCOEF *block,
- const int *jpeg_natural_order_start, int Sl,
- int Al, JCOEF *values, size_t *zerobits)
- {
- }
- GLOBAL(int)
- jsimd_can_encode_mcu_AC_refine_prepare(void)
- {
- return 0;
- }
- GLOBAL(int)
- jsimd_encode_mcu_AC_refine_prepare(const JCOEF *block,
- const int *jpeg_natural_order_start, int Sl,
- int Al, JCOEF *absvalues, size_t *bits)
- {
- return 0;
- }
|