/src/libavc/common/x86/ih264_platform_macros.h
Line | Count | Source |
1 | | /****************************************************************************** |
2 | | * |
3 | | * Copyright (C) 2015 The Android Open Source Project |
4 | | * |
5 | | * Licensed under the Apache License, Version 2.0 (the "License"); |
6 | | * you may not use this file except in compliance with the License. |
7 | | * You may obtain a copy of the License at: |
8 | | * |
9 | | * http://www.apache.org/licenses/LICENSE-2.0 |
10 | | * |
11 | | * Unless required by applicable law or agreed to in writing, software |
12 | | * distributed under the License is distributed on an "AS IS" BASIS, |
13 | | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
14 | | * See the License for the specific language governing permissions and |
15 | | * limitations under the License. |
16 | | * |
17 | | ***************************************************************************** |
18 | | * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore |
19 | | */ |
20 | | /** |
21 | | ******************************************************************************* |
22 | | * @file |
23 | | * ih264_platform_macros.h |
24 | | * |
25 | | * @brief |
26 | | * Platform specific Macro definitions used in the codec |
27 | | * |
28 | | * @author |
29 | | * Ittiam |
30 | | * |
31 | | * @remarks |
32 | | * None |
33 | | * |
34 | | ******************************************************************************* |
35 | | */ |
36 | | |
37 | | |
38 | | #ifndef _IH264_PLATFORM_MACROS_H_ |
39 | | #define _IH264_PLATFORM_MACROS_H_ |
40 | | |
41 | | #include <stdint.h> |
42 | | #include <immintrin.h> |
43 | | |
44 | | #ifndef __ANDROID__ |
45 | | static __inline__ __m128i |
46 | | loadu_32(void const *__a) |
47 | 545M | { |
48 | 545M | struct __loadu_si32 { |
49 | 545M | int __v; |
50 | 545M | } __attribute__((__packed__, __may_alias__)); |
51 | 545M | int __u = ((struct __loadu_si32*)__a)->__v; |
52 | 545M | return __extension__ (__m128i)(__v4si){__u, 0, 0, 0}; |
53 | 545M | } Unexecuted instantiation: imvcd_api.c:loadu_32 Unexecuted instantiation: imvcd_api_utils.c:loadu_32 Unexecuted instantiation: imvcd_dpb_manager.c:loadu_32 Unexecuted instantiation: imvcd_error_handler.c:loadu_32 Unexecuted instantiation: imvcd_nalu_parser.c:loadu_32 Unexecuted instantiation: imvcd_slice_functions.c:loadu_32 Unexecuted instantiation: imvcd_utils.c:loadu_32 Unexecuted instantiation: ih264d_function_selector.c:loadu_32 Unexecuted instantiation: ih264d_function_selector_sse42.c:loadu_32 Unexecuted instantiation: ih264d_function_selector_ssse3.c:loadu_32 Unexecuted instantiation: ih264d_function_selector_avx2.c:loadu_32 Unexecuted instantiation: ih264_chroma_intra_pred_filters.c:loadu_32 Unexecuted instantiation: ih264_luma_intra_pred_filters.c:loadu_32 Unexecuted instantiation: ih264_chroma_intra_pred_filters_ssse3.c:loadu_32 Unexecuted instantiation: ih264_deblk_chroma_ssse3.c:loadu_32 Unexecuted instantiation: ih264_deblk_luma_ssse3.c:loadu_32 Unexecuted instantiation: ih264_inter_pred_filters_ssse3.c:loadu_32 Unexecuted instantiation: ih264_iquant_itrans_recon_dc_ssse3.c:loadu_32 ih264_iquant_itrans_recon_sse42.c:loadu_32 Line | Count | Source | 47 | 144M | { | 48 | 144M | struct __loadu_si32 { | 49 | 144M | int __v; | 50 | 144M | } __attribute__((__packed__, __may_alias__)); | 51 | 144M | int __u = ((struct __loadu_si32*)__a)->__v; | 52 | 144M | return __extension__ (__m128i)(__v4si){__u, 0, 0, 0}; | 53 | 144M | } |
Unexecuted instantiation: ih264_iquant_itrans_recon_ssse3.c:loadu_32 Unexecuted instantiation: ih264_luma_intra_pred_filters_ssse3.c:loadu_32 Unexecuted instantiation: ih264_padding_ssse3.c:loadu_32 Unexecuted instantiation: ih264_weighted_pred_sse42.c:loadu_32 Unexecuted instantiation: ih264_deblk_chroma_avx2.c:loadu_32 Unexecuted instantiation: ih264_deblk_luma_avx2.c:loadu_32 Unexecuted instantiation: ih264_iquant_itrans_recon_avx2.c:loadu_32 Unexecuted instantiation: ih264_weighted_pred_avx2.c:loadu_32 Unexecuted instantiation: ih264_inter_pred_filters_avx2.c:loadu_32 Unexecuted instantiation: ih264d_api.c:loadu_32 Unexecuted instantiation: ih264d_bitstrm.c:loadu_32 Unexecuted instantiation: ih264d_cabac.c:loadu_32 Unexecuted instantiation: ih264d_cabac_init_tables.c:loadu_32 Unexecuted instantiation: ih264d_compute_bs.c:loadu_32 Unexecuted instantiation: ih264d_deblocking.c:loadu_32 Unexecuted instantiation: ih264d_dpb_mgr.c:loadu_32 Unexecuted instantiation: ih264d_format_conv.c:loadu_32 Unexecuted instantiation: ih264d_function_selector_generic.c:loadu_32 Unexecuted instantiation: ih264d_inter_pred.c:loadu_32 Unexecuted instantiation: ih264d_mb_utils.c:loadu_32 Unexecuted instantiation: ih264d_mvpred.c:loadu_32 Unexecuted instantiation: ih264d_nal.c:loadu_32 Unexecuted instantiation: ih264d_parse_bslice.c:loadu_32 Unexecuted instantiation: ih264d_parse_cabac.c:loadu_32 Unexecuted instantiation: ih264d_parse_cavlc.c:loadu_32 Unexecuted instantiation: ih264d_parse_headers.c:loadu_32 Unexecuted instantiation: ih264d_parse_islice.c:loadu_32 Unexecuted instantiation: ih264d_parse_mb_header.c:loadu_32 Unexecuted instantiation: ih264d_parse_pslice.c:loadu_32 Unexecuted instantiation: ih264d_parse_slice.c:loadu_32 Unexecuted instantiation: ih264d_process_bslice.c:loadu_32 Unexecuted instantiation: ih264d_process_intra_mb.c:loadu_32 Unexecuted instantiation: ih264d_process_pslice.c:loadu_32 Unexecuted instantiation: ih264d_quant_scaling.c:loadu_32 Unexecuted instantiation: ih264d_sei.c:loadu_32 Unexecuted instantiation: ih264d_tables.c:loadu_32 Unexecuted instantiation: ih264d_thread_compute_bs.c:loadu_32 Unexecuted instantiation: ih264d_thread_parse_decode.c:loadu_32 Unexecuted instantiation: ih264d_utils.c:loadu_32 Unexecuted instantiation: ih264d_vui.c:loadu_32 Unexecuted instantiation: ih264_deblk_edge_filters.c:loadu_32 Unexecuted instantiation: ih264_inter_pred_filters.c:loadu_32 Unexecuted instantiation: ih264_iquant_itrans_recon.c:loadu_32 Unexecuted instantiation: ih264_weighted_pred.c:loadu_32 Unexecuted instantiation: isvcd_api.c:loadu_32 Unexecuted instantiation: isvcd_nal.c:loadu_32 Unexecuted instantiation: isvcd_nal_parse.c:loadu_32 Unexecuted instantiation: isvcd_parse_epslice.c:loadu_32 Unexecuted instantiation: isvcd_parse_headers.c:loadu_32 Unexecuted instantiation: isvcd_parse_slice.c:loadu_32 Unexecuted instantiation: isvcd_process_ebslice.c:loadu_32 Unexecuted instantiation: isvcd_process_epslice.c:loadu_32 Unexecuted instantiation: isvcd_thread_compute_bs.c:loadu_32 Unexecuted instantiation: isvcd_thread_parse_decode.c:loadu_32 Unexecuted instantiation: isvcd_utils.c:loadu_32 Unexecuted instantiation: isvcd_vui.c:loadu_32 Unexecuted instantiation: isvcd_ii_pred.c:loadu_32 Unexecuted instantiation: isvcd_intra_resamp.c:loadu_32 Unexecuted instantiation: isvcd_mode_mv_resamp.c:loadu_32 Unexecuted instantiation: isvcd_residual_resamp.c:loadu_32 Unexecuted instantiation: isvcd_function_selector.c:loadu_32 Unexecuted instantiation: isvcd_function_selector_sse42.c:loadu_32 Unexecuted instantiation: isvcd_intra_resamp_sse42.c:loadu_32 Unexecuted instantiation: isvcd_iquant_itrans_residual_recon_sse42.c:loadu_32 Unexecuted instantiation: isvcd_iquant_itrans_residual_sse42.c:loadu_32 Unexecuted instantiation: isvcd_iquant_itrans_sse42.c:loadu_32 Unexecuted instantiation: isvcd_pred_residual_recon_sse42.c:loadu_32 Unexecuted instantiation: isvcd_residual_resamp_sse42.c:loadu_32 Unexecuted instantiation: isvcd_cabac.c:loadu_32 Unexecuted instantiation: isvcd_cabac_init_tables.c:loadu_32 Unexecuted instantiation: isvcd_compute_bs.c:loadu_32 Unexecuted instantiation: isvcd_function_selector_generic.c:loadu_32 Unexecuted instantiation: isvcd_mb_utils.c:loadu_32 Unexecuted instantiation: isvcd_parse_cavlc.c:loadu_32 Unexecuted instantiation: isvcd_parse_ebslice.c:loadu_32 Unexecuted instantiation: isvcd_parse_eislice.c:loadu_32 Unexecuted instantiation: isvcd_iquant_itrans.c:loadu_32 Unexecuted instantiation: isvcd_iquant_itrans_residual.c:loadu_32 Unexecuted instantiation: isvcd_iquant_itrans_residual_recon.c:loadu_32 Unexecuted instantiation: isvcd_pred_residual_recon.c:loadu_32 Unexecuted instantiation: isvce_api.c:loadu_32 Unexecuted instantiation: isvce_downscaler.c:loadu_32 Unexecuted instantiation: isvce_encode.c:loadu_32 Unexecuted instantiation: isvce_fmt_conv.c:loadu_32 Unexecuted instantiation: isvce_ibl_eval.c:loadu_32 Unexecuted instantiation: isvce_process.c:loadu_32 Unexecuted instantiation: isvce_rc_mem_interface.c:loadu_32 Unexecuted instantiation: isvce_sub_pic_rc.c:loadu_32 Unexecuted instantiation: isvce_downscaler_sse42.c:loadu_32 Unexecuted instantiation: isvce_function_selector.c:loadu_32 Unexecuted instantiation: ih264_list.c:loadu_32 Unexecuted instantiation: isvc_intra_resample.c:loadu_32 Unexecuted instantiation: isvc_iquant_itrans_recon_sse42.c:loadu_32 Unexecuted instantiation: isvc_resi_trans_quant_sse42.c:loadu_32 Unexecuted instantiation: isvc_intra_resample_sse42.c:loadu_32 Unexecuted instantiation: ih264e_bitstream.c:loadu_32 Unexecuted instantiation: ih264e_fmt_conv.c:loadu_32 Unexecuted instantiation: ih264e_sei.c:loadu_32 Unexecuted instantiation: isvce_cabac.c:loadu_32 Unexecuted instantiation: isvce_cabac_encode.c:loadu_32 Unexecuted instantiation: isvce_cabac_init.c:loadu_32 Unexecuted instantiation: isvce_core_coding.c:loadu_32 Unexecuted instantiation: isvce_mc.c:loadu_32 Unexecuted instantiation: isvce_me.c:loadu_32 Unexecuted instantiation: ih264e_half_pel_ssse3.c:loadu_32 Unexecuted instantiation: isvc_iquant_itrans_recon.c:loadu_32 Unexecuted instantiation: ih264e_cabac_init.c:loadu_32 Unexecuted instantiation: ih264e_core_coding.c:loadu_32 Unexecuted instantiation: ih264e_half_pel.c:loadu_32 Unexecuted instantiation: ih264e_me.c:loadu_32 Unexecuted instantiation: ih264e_api.c:loadu_32 Unexecuted instantiation: ih264e_encode.c:loadu_32 Unexecuted instantiation: ih264e_process.c:loadu_32 Unexecuted instantiation: ih264e_function_selector.c:loadu_32 ih264_resi_trans_quant_sse42.c:loadu_32 Line | Count | Source | 47 | 401M | { | 48 | 401M | struct __loadu_si32 { | 49 | 401M | int __v; | 50 | 401M | } __attribute__((__packed__, __may_alias__)); | 51 | 401M | int __u = ((struct __loadu_si32*)__a)->__v; | 52 | 401M | return __extension__ (__m128i)(__v4si){__u, 0, 0, 0}; | 53 | 401M | } |
Unexecuted instantiation: ih264e_cabac.c:loadu_32 Unexecuted instantiation: ih264e_cabac_encode.c:loadu_32 |
54 | | #else |
55 | | static __inline__ __m128i loadu_32(void const *__a) { return _mm_loadu_si32(__a); }; |
56 | | #endif |
57 | | |
58 | 10.7G | #define CLIP_U8(x) CLIP3(0, UINT8_MAX, (x)) |
59 | 4.58M | #define CLIP_S8(x) CLIP3(INT8_MIN, INT8_MAX, (x)) |
60 | | |
61 | | #define CLIP_U10(x) CLIP3(0, 1023, (x)) |
62 | | #define CLIP_S10(x) CLIP3(-512, 511, (x)) |
63 | | |
64 | | #define CLIP_U11(x) CLIP3(0, 2047, (x)) |
65 | 233k | #define CLIP_S11(x) CLIP3(-1024, 1023, (x)) |
66 | | |
67 | | #define CLIP_U12(x) CLIP3(0, 4095, (x)) |
68 | | #define CLIP_S12(x) CLIP3(-2048, 2047, (x)) |
69 | | |
70 | | #define CLIP_U16(x) CLIP3(0, UINT16_MAX, (x)) |
71 | | #define CLIP_S16(x) CLIP3(INT16_MIN, INT16_MAX, (x)) |
72 | | |
73 | | #define CLIP_U32(x) CLIP3(0, UINT32_MAX, (x)) |
74 | | #define CLIP_S32(x) CLIP3(INT32_MIN, INT32_MAX, (x)) |
75 | | |
76 | | #define MEM_ALIGN16 __attribute__ ((aligned (16))) |
77 | | |
78 | | #define SHL(x,y) (((y) < 32) ? ((x) << (y)) : 0) |
79 | | #define SHR(x,y) (((y) < 32) ? ((x) >> (y)) : 0) |
80 | | |
81 | | #define SHR_NEG(val,shift) ((shift>0)?(val>>shift):(val<<(-shift))) |
82 | | #define SHL_NEG(val,shift) ((shift<0)?(val>>(-shift)):(val<<shift)) |
83 | | |
84 | | |
85 | | #define ITT_BIG_ENDIAN(x) __builtin_bswap32(x); |
86 | | |
87 | 13.4G | #define NOP(nop_cnt) {UWORD32 nop_i; for (nop_i = 0; nop_i < nop_cnt; nop_i++) asm("nop");} |
88 | | |
89 | | #define PLD(a) |
90 | | |
91 | | /* In normal cases, 0 will not be passed as an argument to CLZ and CTZ. |
92 | | As CLZ and CTZ outputs are used as a shift value in few places, these return |
93 | | 31 for u4_word == 0 case, just to handle error cases gracefully without any |
94 | | undefined behaviour */ |
95 | | |
96 | | static __inline UWORD32 CLZ(UWORD32 u4_word) |
97 | 987M | { |
98 | 987M | if(u4_word) |
99 | 920M | return(__builtin_clz(u4_word)); |
100 | 67.0M | else |
101 | 67.0M | return 31; |
102 | 987M | } Unexecuted instantiation: imvcd_api.c:CLZ Unexecuted instantiation: imvcd_api_utils.c:CLZ Unexecuted instantiation: imvcd_dpb_manager.c:CLZ Unexecuted instantiation: imvcd_error_handler.c:CLZ Unexecuted instantiation: imvcd_nalu_parser.c:CLZ Unexecuted instantiation: imvcd_slice_functions.c:CLZ Unexecuted instantiation: imvcd_utils.c:CLZ Unexecuted instantiation: ih264d_function_selector.c:CLZ Unexecuted instantiation: ih264d_function_selector_sse42.c:CLZ Unexecuted instantiation: ih264d_function_selector_ssse3.c:CLZ Unexecuted instantiation: ih264d_function_selector_avx2.c:CLZ Unexecuted instantiation: ih264_chroma_intra_pred_filters.c:CLZ Unexecuted instantiation: ih264_luma_intra_pred_filters.c:CLZ Unexecuted instantiation: ih264_chroma_intra_pred_filters_ssse3.c:CLZ Unexecuted instantiation: ih264_deblk_chroma_ssse3.c:CLZ Unexecuted instantiation: ih264_deblk_luma_ssse3.c:CLZ Unexecuted instantiation: ih264_inter_pred_filters_ssse3.c:CLZ Unexecuted instantiation: ih264_iquant_itrans_recon_dc_ssse3.c:CLZ Unexecuted instantiation: ih264_iquant_itrans_recon_sse42.c:CLZ Unexecuted instantiation: ih264_iquant_itrans_recon_ssse3.c:CLZ Unexecuted instantiation: ih264_luma_intra_pred_filters_ssse3.c:CLZ Unexecuted instantiation: ih264_padding_ssse3.c:CLZ Unexecuted instantiation: ih264_weighted_pred_sse42.c:CLZ Unexecuted instantiation: ih264_deblk_chroma_avx2.c:CLZ Unexecuted instantiation: ih264_deblk_luma_avx2.c:CLZ Unexecuted instantiation: ih264_iquant_itrans_recon_avx2.c:CLZ Unexecuted instantiation: ih264_weighted_pred_avx2.c:CLZ Unexecuted instantiation: ih264_inter_pred_filters_avx2.c:CLZ Unexecuted instantiation: ih264d_api.c:CLZ Unexecuted instantiation: ih264d_bitstrm.c:CLZ Line | Count | Source | 97 | 20.4M | { | 98 | 20.4M | if(u4_word) | 99 | 20.4M | return(__builtin_clz(u4_word)); | 100 | 0 | else | 101 | 0 | return 31; | 102 | 20.4M | } |
Unexecuted instantiation: ih264d_cabac_init_tables.c:CLZ Unexecuted instantiation: ih264d_compute_bs.c:CLZ Unexecuted instantiation: ih264d_deblocking.c:CLZ Unexecuted instantiation: ih264d_dpb_mgr.c:CLZ Unexecuted instantiation: ih264d_format_conv.c:CLZ Unexecuted instantiation: ih264d_function_selector_generic.c:CLZ Unexecuted instantiation: ih264d_inter_pred.c:CLZ Unexecuted instantiation: ih264d_mb_utils.c:CLZ Unexecuted instantiation: ih264d_mvpred.c:CLZ Unexecuted instantiation: ih264d_nal.c:CLZ ih264d_parse_bslice.c:CLZ Line | Count | Source | 97 | 583k | { | 98 | 583k | if(u4_word) | 99 | 577k | return(__builtin_clz(u4_word)); | 100 | 6.45k | else | 101 | 6.45k | return 31; | 102 | 583k | } |
Line | Count | Source | 97 | 24.1M | { | 98 | 24.1M | if(u4_word) | 99 | 24.1M | return(__builtin_clz(u4_word)); | 100 | 0 | else | 101 | 0 | return 31; | 102 | 24.1M | } |
Line | Count | Source | 97 | 10.7M | { | 98 | 10.7M | if(u4_word) | 99 | 10.3M | return(__builtin_clz(u4_word)); | 100 | 348k | else | 101 | 348k | return 31; | 102 | 10.7M | } |
Unexecuted instantiation: ih264d_parse_headers.c:CLZ ih264d_parse_islice.c:CLZ Line | Count | Source | 97 | 363k | { | 98 | 363k | if(u4_word) | 99 | 361k | return(__builtin_clz(u4_word)); | 100 | 1.57k | else | 101 | 1.57k | return 31; | 102 | 363k | } |
ih264d_parse_mb_header.c:CLZ Line | Count | Source | 97 | 18.2M | { | 98 | 18.2M | if(u4_word) | 99 | 18.2M | return(__builtin_clz(u4_word)); | 100 | 0 | else | 101 | 0 | return 31; | 102 | 18.2M | } |
ih264d_parse_pslice.c:CLZ Line | Count | Source | 97 | 613k | { | 98 | 613k | if(u4_word) | 99 | 587k | return(__builtin_clz(u4_word)); | 100 | 25.4k | else | 101 | 25.4k | return 31; | 102 | 613k | } |
Unexecuted instantiation: ih264d_parse_slice.c:CLZ Unexecuted instantiation: ih264d_process_bslice.c:CLZ ih264d_process_intra_mb.c:CLZ Line | Count | Source | 97 | 2.91M | { | 98 | 2.91M | if(u4_word) | 99 | 2.91M | return(__builtin_clz(u4_word)); | 100 | 0 | else | 101 | 0 | return 31; | 102 | 2.91M | } |
Unexecuted instantiation: ih264d_process_pslice.c:CLZ Unexecuted instantiation: ih264d_quant_scaling.c:CLZ Unexecuted instantiation: ih264d_sei.c:CLZ Unexecuted instantiation: ih264d_tables.c:CLZ Unexecuted instantiation: ih264d_thread_compute_bs.c:CLZ Unexecuted instantiation: ih264d_thread_parse_decode.c:CLZ Line | Count | Source | 97 | 717k | { | 98 | 717k | if(u4_word) | 99 | 717k | return(__builtin_clz(u4_word)); | 100 | 0 | else | 101 | 0 | return 31; | 102 | 717k | } |
Unexecuted instantiation: ih264d_vui.c:CLZ Unexecuted instantiation: ih264_deblk_edge_filters.c:CLZ Unexecuted instantiation: ih264_inter_pred_filters.c:CLZ Unexecuted instantiation: ih264_iquant_itrans_recon.c:CLZ Unexecuted instantiation: ih264_weighted_pred.c:CLZ Unexecuted instantiation: isvcd_api.c:CLZ Unexecuted instantiation: isvcd_nal.c:CLZ Unexecuted instantiation: isvcd_nal_parse.c:CLZ isvcd_parse_epslice.c:CLZ Line | Count | Source | 97 | 624k | { | 98 | 624k | if(u4_word) | 99 | 612k | return(__builtin_clz(u4_word)); | 100 | 11.1k | else | 101 | 11.1k | return 31; | 102 | 624k | } |
Unexecuted instantiation: isvcd_parse_headers.c:CLZ Unexecuted instantiation: isvcd_parse_slice.c:CLZ Unexecuted instantiation: isvcd_process_ebslice.c:CLZ Unexecuted instantiation: isvcd_process_epslice.c:CLZ Unexecuted instantiation: isvcd_thread_compute_bs.c:CLZ Unexecuted instantiation: isvcd_thread_parse_decode.c:CLZ Unexecuted instantiation: isvcd_utils.c:CLZ Unexecuted instantiation: isvcd_vui.c:CLZ Unexecuted instantiation: isvcd_ii_pred.c:CLZ Unexecuted instantiation: isvcd_intra_resamp.c:CLZ Unexecuted instantiation: isvcd_mode_mv_resamp.c:CLZ Unexecuted instantiation: isvcd_residual_resamp.c:CLZ Unexecuted instantiation: isvcd_function_selector.c:CLZ Unexecuted instantiation: isvcd_function_selector_sse42.c:CLZ Unexecuted instantiation: isvcd_intra_resamp_sse42.c:CLZ Unexecuted instantiation: isvcd_iquant_itrans_residual_recon_sse42.c:CLZ Unexecuted instantiation: isvcd_iquant_itrans_residual_sse42.c:CLZ Unexecuted instantiation: isvcd_iquant_itrans_sse42.c:CLZ Unexecuted instantiation: isvcd_pred_residual_recon_sse42.c:CLZ Unexecuted instantiation: isvcd_residual_resamp_sse42.c:CLZ Unexecuted instantiation: isvcd_cabac.c:CLZ Unexecuted instantiation: isvcd_cabac_init_tables.c:CLZ Unexecuted instantiation: isvcd_compute_bs.c:CLZ Unexecuted instantiation: isvcd_function_selector_generic.c:CLZ Unexecuted instantiation: isvcd_mb_utils.c:CLZ Line | Count | Source | 97 | 13.1k | { | 98 | 13.1k | if(u4_word) | 99 | 12.9k | return(__builtin_clz(u4_word)); | 100 | 255 | else | 101 | 255 | return 31; | 102 | 13.1k | } |
isvcd_parse_ebslice.c:CLZ Line | Count | Source | 97 | 82.5k | { | 98 | 82.5k | if(u4_word) | 99 | 80.2k | return(__builtin_clz(u4_word)); | 100 | 2.26k | else | 101 | 2.26k | return 31; | 102 | 82.5k | } |
isvcd_parse_eislice.c:CLZ Line | Count | Source | 97 | 309k | { | 98 | 309k | if(u4_word) | 99 | 307k | return(__builtin_clz(u4_word)); | 100 | 1.94k | else | 101 | 1.94k | return 31; | 102 | 309k | } |
Unexecuted instantiation: isvcd_iquant_itrans.c:CLZ Unexecuted instantiation: isvcd_iquant_itrans_residual.c:CLZ Unexecuted instantiation: isvcd_iquant_itrans_residual_recon.c:CLZ Unexecuted instantiation: isvcd_pred_residual_recon.c:CLZ Line | Count | Source | 97 | 5.30k | { | 98 | 5.30k | if(u4_word) | 99 | 5.30k | return(__builtin_clz(u4_word)); | 100 | 0 | else | 101 | 0 | return 31; | 102 | 5.30k | } |
Unexecuted instantiation: isvce_downscaler.c:CLZ Unexecuted instantiation: isvce_encode.c:CLZ Unexecuted instantiation: isvce_fmt_conv.c:CLZ Unexecuted instantiation: isvce_ibl_eval.c:CLZ Unexecuted instantiation: isvce_process.c:CLZ Unexecuted instantiation: isvce_rc_mem_interface.c:CLZ Line | Count | Source | 97 | 15.6M | { | 98 | 15.6M | if(u4_word) | 99 | 15.6M | return(__builtin_clz(u4_word)); | 100 | 18.4E | else | 101 | 18.4E | return 31; | 102 | 15.6M | } |
Unexecuted instantiation: isvce_downscaler_sse42.c:CLZ Unexecuted instantiation: isvce_function_selector.c:CLZ Line | Count | Source | 97 | 57.0k | { | 98 | 57.0k | if(u4_word) | 99 | 57.0k | return(__builtin_clz(u4_word)); | 100 | 0 | else | 101 | 0 | return 31; | 102 | 57.0k | } |
Unexecuted instantiation: isvc_intra_resample.c:CLZ Unexecuted instantiation: isvc_iquant_itrans_recon_sse42.c:CLZ Unexecuted instantiation: isvc_resi_trans_quant_sse42.c:CLZ Unexecuted instantiation: isvc_intra_resample_sse42.c:CLZ Line | Count | Source | 97 | 25.2M | { | 98 | 25.2M | if(u4_word) | 99 | 25.2M | return(__builtin_clz(u4_word)); | 100 | 0 | else | 101 | 0 | return 31; | 102 | 25.2M | } |
Unexecuted instantiation: ih264e_fmt_conv.c:CLZ Unexecuted instantiation: ih264e_sei.c:CLZ Line | Count | Source | 97 | 300M | { | 98 | 300M | if(u4_word) | 99 | 300M | return(__builtin_clz(u4_word)); | 100 | 0 | else | 101 | 0 | return 31; | 102 | 300M | } |
Line | Count | Source | 97 | 52.4M | { | 98 | 52.4M | if(u4_word) | 99 | 45.2M | return(__builtin_clz(u4_word)); | 100 | 7.19M | else | 101 | 7.19M | return 31; | 102 | 52.4M | } |
Unexecuted instantiation: isvce_cabac_init.c:CLZ Line | Count | Source | 97 | 177M | { | 98 | 177M | if(u4_word) | 99 | 140M | return(__builtin_clz(u4_word)); | 100 | 37.2M | else | 101 | 37.2M | return 31; | 102 | 177M | } |
Unexecuted instantiation: isvce_mc.c:CLZ Line | Count | Source | 97 | 5.33k | { | 98 | 5.33k | if(u4_word) | 99 | 5.33k | return(__builtin_clz(u4_word)); | 100 | 0 | else | 101 | 0 | return 31; | 102 | 5.33k | } |
Unexecuted instantiation: ih264e_half_pel_ssse3.c:CLZ Unexecuted instantiation: isvc_iquant_itrans_recon.c:CLZ Unexecuted instantiation: ih264e_cabac_init.c:CLZ Line | Count | Source | 97 | 76.0M | { | 98 | 76.0M | if(u4_word) | 99 | 55.9M | return(__builtin_clz(u4_word)); | 100 | 20.1M | else | 101 | 20.1M | return 31; | 102 | 76.0M | } |
Unexecuted instantiation: ih264e_half_pel.c:CLZ Line | Count | Source | 97 | 4.10k | { | 98 | 4.10k | if(u4_word) | 99 | 4.10k | return(__builtin_clz(u4_word)); | 100 | 0 | else | 101 | 0 | return 31; | 102 | 4.10k | } |
Line | Count | Source | 97 | 4.20k | { | 98 | 4.20k | if(u4_word) | 99 | 4.20k | return(__builtin_clz(u4_word)); | 100 | 0 | else | 101 | 0 | return 31; | 102 | 4.20k | } |
Unexecuted instantiation: ih264e_encode.c:CLZ Unexecuted instantiation: ih264e_process.c:CLZ Unexecuted instantiation: ih264e_function_selector.c:CLZ Unexecuted instantiation: ih264_resi_trans_quant_sse42.c:CLZ Line | Count | Source | 97 | 229M | { | 98 | 229M | if(u4_word) | 99 | 229M | return(__builtin_clz(u4_word)); | 100 | 0 | else | 101 | 0 | return 31; | 102 | 229M | } |
ih264e_cabac_encode.c:CLZ Line | Count | Source | 97 | 29.9M | { | 98 | 29.9M | if(u4_word) | 99 | 27.8M | return(__builtin_clz(u4_word)); | 100 | 2.03M | else | 101 | 2.03M | return 31; | 102 | 29.9M | } |
|
103 | | |
104 | | static __inline UWORD32 CTZ(UWORD32 u4_word) |
105 | 0 | { |
106 | 0 | if(0 == u4_word) |
107 | 0 | return 31; |
108 | 0 | else |
109 | 0 | { |
110 | 0 | unsigned int index; |
111 | 0 | index = __builtin_ctz(u4_word); |
112 | 0 | return (UWORD32)index; |
113 | 0 | } |
114 | 0 | } Unexecuted instantiation: imvcd_api.c:CTZ Unexecuted instantiation: imvcd_api_utils.c:CTZ Unexecuted instantiation: imvcd_dpb_manager.c:CTZ Unexecuted instantiation: imvcd_error_handler.c:CTZ Unexecuted instantiation: imvcd_nalu_parser.c:CTZ Unexecuted instantiation: imvcd_slice_functions.c:CTZ Unexecuted instantiation: imvcd_utils.c:CTZ Unexecuted instantiation: ih264d_function_selector.c:CTZ Unexecuted instantiation: ih264d_function_selector_sse42.c:CTZ Unexecuted instantiation: ih264d_function_selector_ssse3.c:CTZ Unexecuted instantiation: ih264d_function_selector_avx2.c:CTZ Unexecuted instantiation: ih264_chroma_intra_pred_filters.c:CTZ Unexecuted instantiation: ih264_luma_intra_pred_filters.c:CTZ Unexecuted instantiation: ih264_chroma_intra_pred_filters_ssse3.c:CTZ Unexecuted instantiation: ih264_deblk_chroma_ssse3.c:CTZ Unexecuted instantiation: ih264_deblk_luma_ssse3.c:CTZ Unexecuted instantiation: ih264_inter_pred_filters_ssse3.c:CTZ Unexecuted instantiation: ih264_iquant_itrans_recon_dc_ssse3.c:CTZ Unexecuted instantiation: ih264_iquant_itrans_recon_sse42.c:CTZ Unexecuted instantiation: ih264_iquant_itrans_recon_ssse3.c:CTZ Unexecuted instantiation: ih264_luma_intra_pred_filters_ssse3.c:CTZ Unexecuted instantiation: ih264_padding_ssse3.c:CTZ Unexecuted instantiation: ih264_weighted_pred_sse42.c:CTZ Unexecuted instantiation: ih264_deblk_chroma_avx2.c:CTZ Unexecuted instantiation: ih264_deblk_luma_avx2.c:CTZ Unexecuted instantiation: ih264_iquant_itrans_recon_avx2.c:CTZ Unexecuted instantiation: ih264_weighted_pred_avx2.c:CTZ Unexecuted instantiation: ih264_inter_pred_filters_avx2.c:CTZ Unexecuted instantiation: ih264d_api.c:CTZ Unexecuted instantiation: ih264d_bitstrm.c:CTZ Unexecuted instantiation: ih264d_cabac.c:CTZ Unexecuted instantiation: ih264d_cabac_init_tables.c:CTZ Unexecuted instantiation: ih264d_compute_bs.c:CTZ Unexecuted instantiation: ih264d_deblocking.c:CTZ Unexecuted instantiation: ih264d_dpb_mgr.c:CTZ Unexecuted instantiation: ih264d_format_conv.c:CTZ Unexecuted instantiation: ih264d_function_selector_generic.c:CTZ Unexecuted instantiation: ih264d_inter_pred.c:CTZ Unexecuted instantiation: ih264d_mb_utils.c:CTZ Unexecuted instantiation: ih264d_mvpred.c:CTZ Unexecuted instantiation: ih264d_nal.c:CTZ Unexecuted instantiation: ih264d_parse_bslice.c:CTZ Unexecuted instantiation: ih264d_parse_cabac.c:CTZ Unexecuted instantiation: ih264d_parse_cavlc.c:CTZ Unexecuted instantiation: ih264d_parse_headers.c:CTZ Unexecuted instantiation: ih264d_parse_islice.c:CTZ Unexecuted instantiation: ih264d_parse_mb_header.c:CTZ Unexecuted instantiation: ih264d_parse_pslice.c:CTZ Unexecuted instantiation: ih264d_parse_slice.c:CTZ Unexecuted instantiation: ih264d_process_bslice.c:CTZ Unexecuted instantiation: ih264d_process_intra_mb.c:CTZ Unexecuted instantiation: ih264d_process_pslice.c:CTZ Unexecuted instantiation: ih264d_quant_scaling.c:CTZ Unexecuted instantiation: ih264d_sei.c:CTZ Unexecuted instantiation: ih264d_tables.c:CTZ Unexecuted instantiation: ih264d_thread_compute_bs.c:CTZ Unexecuted instantiation: ih264d_thread_parse_decode.c:CTZ Unexecuted instantiation: ih264d_utils.c:CTZ Unexecuted instantiation: ih264d_vui.c:CTZ Unexecuted instantiation: ih264_deblk_edge_filters.c:CTZ Unexecuted instantiation: ih264_inter_pred_filters.c:CTZ Unexecuted instantiation: ih264_iquant_itrans_recon.c:CTZ Unexecuted instantiation: ih264_weighted_pred.c:CTZ Unexecuted instantiation: isvcd_api.c:CTZ Unexecuted instantiation: isvcd_nal.c:CTZ Unexecuted instantiation: isvcd_nal_parse.c:CTZ Unexecuted instantiation: isvcd_parse_epslice.c:CTZ Unexecuted instantiation: isvcd_parse_headers.c:CTZ Unexecuted instantiation: isvcd_parse_slice.c:CTZ Unexecuted instantiation: isvcd_process_ebslice.c:CTZ Unexecuted instantiation: isvcd_process_epslice.c:CTZ Unexecuted instantiation: isvcd_thread_compute_bs.c:CTZ Unexecuted instantiation: isvcd_thread_parse_decode.c:CTZ Unexecuted instantiation: isvcd_utils.c:CTZ Unexecuted instantiation: isvcd_vui.c:CTZ Unexecuted instantiation: isvcd_ii_pred.c:CTZ Unexecuted instantiation: isvcd_intra_resamp.c:CTZ Unexecuted instantiation: isvcd_mode_mv_resamp.c:CTZ Unexecuted instantiation: isvcd_residual_resamp.c:CTZ Unexecuted instantiation: isvcd_function_selector.c:CTZ Unexecuted instantiation: isvcd_function_selector_sse42.c:CTZ Unexecuted instantiation: isvcd_intra_resamp_sse42.c:CTZ Unexecuted instantiation: isvcd_iquant_itrans_residual_recon_sse42.c:CTZ Unexecuted instantiation: isvcd_iquant_itrans_residual_sse42.c:CTZ Unexecuted instantiation: isvcd_iquant_itrans_sse42.c:CTZ Unexecuted instantiation: isvcd_pred_residual_recon_sse42.c:CTZ Unexecuted instantiation: isvcd_residual_resamp_sse42.c:CTZ Unexecuted instantiation: isvcd_cabac.c:CTZ Unexecuted instantiation: isvcd_cabac_init_tables.c:CTZ Unexecuted instantiation: isvcd_compute_bs.c:CTZ Unexecuted instantiation: isvcd_function_selector_generic.c:CTZ Unexecuted instantiation: isvcd_mb_utils.c:CTZ Unexecuted instantiation: isvcd_parse_cavlc.c:CTZ Unexecuted instantiation: isvcd_parse_ebslice.c:CTZ Unexecuted instantiation: isvcd_parse_eislice.c:CTZ Unexecuted instantiation: isvcd_iquant_itrans.c:CTZ Unexecuted instantiation: isvcd_iquant_itrans_residual.c:CTZ Unexecuted instantiation: isvcd_iquant_itrans_residual_recon.c:CTZ Unexecuted instantiation: isvcd_pred_residual_recon.c:CTZ Unexecuted instantiation: isvce_api.c:CTZ Unexecuted instantiation: isvce_downscaler.c:CTZ Unexecuted instantiation: isvce_encode.c:CTZ Unexecuted instantiation: isvce_fmt_conv.c:CTZ Unexecuted instantiation: isvce_ibl_eval.c:CTZ Unexecuted instantiation: isvce_process.c:CTZ Unexecuted instantiation: isvce_rc_mem_interface.c:CTZ Unexecuted instantiation: isvce_sub_pic_rc.c:CTZ Unexecuted instantiation: isvce_downscaler_sse42.c:CTZ Unexecuted instantiation: isvce_function_selector.c:CTZ Unexecuted instantiation: ih264_list.c:CTZ Unexecuted instantiation: isvc_intra_resample.c:CTZ Unexecuted instantiation: isvc_iquant_itrans_recon_sse42.c:CTZ Unexecuted instantiation: isvc_resi_trans_quant_sse42.c:CTZ Unexecuted instantiation: isvc_intra_resample_sse42.c:CTZ Unexecuted instantiation: ih264e_bitstream.c:CTZ Unexecuted instantiation: ih264e_fmt_conv.c:CTZ Unexecuted instantiation: ih264e_sei.c:CTZ Unexecuted instantiation: isvce_cabac.c:CTZ Unexecuted instantiation: isvce_cabac_encode.c:CTZ Unexecuted instantiation: isvce_cabac_init.c:CTZ Unexecuted instantiation: isvce_core_coding.c:CTZ Unexecuted instantiation: isvce_mc.c:CTZ Unexecuted instantiation: isvce_me.c:CTZ Unexecuted instantiation: ih264e_half_pel_ssse3.c:CTZ Unexecuted instantiation: isvc_iquant_itrans_recon.c:CTZ Unexecuted instantiation: ih264e_cabac_init.c:CTZ Unexecuted instantiation: ih264e_core_coding.c:CTZ Unexecuted instantiation: ih264e_half_pel.c:CTZ Unexecuted instantiation: ih264e_me.c:CTZ Unexecuted instantiation: ih264e_api.c:CTZ Unexecuted instantiation: ih264e_encode.c:CTZ Unexecuted instantiation: ih264e_process.c:CTZ Unexecuted instantiation: ih264e_function_selector.c:CTZ Unexecuted instantiation: ih264_resi_trans_quant_sse42.c:CTZ Unexecuted instantiation: ih264e_cabac.c:CTZ Unexecuted instantiation: ih264e_cabac_encode.c:CTZ |
115 | | |
116 | 72.4M | #define DATA_SYNC() __sync_synchronize() |
117 | | |
118 | | |
119 | | |
120 | | //#define INLINE __inline |
121 | | #define INLINE inline |
122 | | |
123 | | #define PREFETCH_ENABLE 1 |
124 | | |
125 | | #if PREFETCH_ENABLE |
126 | | #define PREFETCH(ptr, type) _mm_prefetch(ptr, type); |
127 | | #else |
128 | | #define PREFETCH(ptr, type) |
129 | | #endif |
130 | | |
131 | | #define MEM_ALIGN8 __attribute__ ((aligned (8))) |
132 | | #define MEM_ALIGN16 __attribute__ ((aligned (16))) |
133 | | #define MEM_ALIGN32 __attribute__ ((aligned (32))) |
134 | | |
135 | | #endif /* _IH264_PLATFORM_MACROS_H_ */ |