mirror of https://github.com/FFmpeg/FFmpeg.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
106 lines
4.3 KiB
106 lines
4.3 KiB
/*
 * BlackFin DSPUTILS COMMON OPTIMIZATIONS HEADER
 *
 * Copyright (C) 2007 Marc Hoffman <mmh@pleasantst.com>
 *
 * This file is part of Libav.
 *
 * Libav is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * Libav is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with Libav; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
|
|
|
|
|
#ifndef AVCODEC_BFIN_DSPUTIL_BFIN_H |
|
#define AVCODEC_BFIN_DSPUTIL_BFIN_H |
|
|
|
#include <stdint.h> |
|
|
|
#include "config.h" |
|
|
|
/*
 * Section-placement attributes used by the declarations in this header.
 *
 * When the compiler defines __FDPIC__ and CONFIG_SRAM (expected to come from
 * config.h) evaluates to non-zero, attribute_l1_text expands to the GCC
 * attribute `l1_text` and attribute_l1_data_b to the GCC attribute
 * `l1_data_B`.  In every other configuration both macros expand to nothing,
 * so declarations that carry them are still valid C.
 */
#if defined(__FDPIC__) && CONFIG_SRAM
#define attribute_l1_text   __attribute__((l1_text))
#define attribute_l1_data_b __attribute__((l1_data_B))
#else
#define attribute_l1_text
#define attribute_l1_data_b
#endif
|
|
|
void ff_bfin_idct (int16_t *block) attribute_l1_text; |
|
void ff_bfin_fdct (int16_t *block) attribute_l1_text; |
|
void ff_bfin_add_pixels_clamped (const int16_t *block, uint8_t *dest, int line_size) attribute_l1_text; |
|
void ff_bfin_put_pixels_clamped (const int16_t *block, uint8_t *dest, int line_size) attribute_l1_text; |
|
void ff_bfin_diff_pixels (int16_t *block, const uint8_t *s1, const uint8_t *s2, int stride) attribute_l1_text; |
|
void ff_bfin_get_pixels (int16_t *restrict block, const uint8_t *pixels, int line_size) attribute_l1_text; |
|
int ff_bfin_pix_norm1 (uint8_t * pix, int line_size) attribute_l1_text; |
|
int ff_bfin_z_sad8x8 (uint8_t *blk1, uint8_t *blk2, int dsz, int line_size, int h) attribute_l1_text; |
|
int ff_bfin_z_sad16x16 (uint8_t *blk1, uint8_t *blk2, int dsz, int line_size, int h) attribute_l1_text; |
|
|
|
void ff_bfin_z_put_pixels16_xy2 (uint8_t *block, const uint8_t *s0, int dest_size, int line_size, int h) attribute_l1_text; |
|
void ff_bfin_z_put_pixels8_xy2 (uint8_t *block, const uint8_t *s0, int dest_size, int line_size, int h) attribute_l1_text; |
|
void ff_bfin_put_pixels16_xy2_nornd (uint8_t *block, const uint8_t *s0, int line_size, int h) attribute_l1_text; |
|
void ff_bfin_put_pixels8_xy2_nornd (uint8_t *block, const uint8_t *s0, int line_size, int h) attribute_l1_text; |
|
|
|
|
|
int ff_bfin_pix_sum (uint8_t *p, int stride) attribute_l1_text; |
|
|
|
void ff_bfin_put_pixels8uc (uint8_t *block, const uint8_t *s0, const uint8_t *s1, int dest_size, int line_size, int h) attribute_l1_text; |
|
void ff_bfin_put_pixels16uc (uint8_t *block, const uint8_t *s0, const uint8_t *s1, int dest_size, int line_size, int h) attribute_l1_text; |
|
void ff_bfin_put_pixels8uc_nornd (uint8_t *block, const uint8_t *s0, const uint8_t *s1, int line_size, int h) attribute_l1_text; |
|
void ff_bfin_put_pixels16uc_nornd (uint8_t *block, const uint8_t *s0, const uint8_t *s1, int line_size, int h) attribute_l1_text; |
|
|
|
int ff_bfin_sse4 (void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h) attribute_l1_text; |
|
int ff_bfin_sse8 (void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h) attribute_l1_text; |
|
int ff_bfin_sse16 (void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h) attribute_l1_text; |
|
|
|
|
|
/*
 * Optional profiling helpers, compiled in only when BFIN_PROFILE is defined.
 *
 * Intended pattern, as implied by the macros: call bfprof() once per
 * profiled iteration and bracket each measured region with
 * PROF(label, slot) ... EPROF().  PROF opens a brace scope that EPROF
 * closes, so the two must always be used as a pair in the same function.
 *
 * The profiling code calls read_time(), av_log() and atexit().  None of
 * them is declared by the includes visible in this header, so the including
 * file must make them available before enabling BFIN_PROFILE.
 *
 * All state is `static`: every translation unit that includes this header
 * with BFIN_PROFILE defined keeps its own independent counters.
 */
#ifdef BFIN_PROFILE

static double      Telem[16];      /* accumulated read_time() deltas, one per slot */
static const char *TelemNames[16]; /* label last used for each slot; NULL if never used */
static int         TelemCnt;       /* number of bfprof() calls so far */

/*
 * Begin timing slot `e` under label `lab`.  Opens a scope that must be
 * closed by EPROF().  No range check is done on `e`; it must be 0..15.
 */
#define PROF(lab,e) { int xx_e = (e); const char *xx_lab = (lab); uint64_t xx_t0 = read_time();

/* End timing: add the read_time() delta to the slot and remember its label. */
#define EPROF() xx_t0 = read_time()-xx_t0; Telem[xx_e] = Telem[xx_e] + xx_t0; TelemNames[xx_e] = xx_lab; }

/*
 * Exit handler: for every labelled slot, logs at AV_LOG_DEBUG level the
 * accumulated time averaged over the bfprof() call count, plus that average
 * divided by 64 (NOTE(review): presumably "per element of an 8x8 block" --
 * confirm).  A final "total" line sums all labelled slots.
 *
 * It is only registered from bfprof(), which increments TelemCnt, so the
 * divisions by TelemCnt see a value of at least 1 on that path.
 */
static void prof_report (void)
{
    int i;
    double s = 0;

    for (i = 0; i < 16; i++) {
        if (TelemNames[i]) {
            double v = Telem[i] / TelemCnt;

            av_log (NULL, AV_LOG_DEBUG, "%-20s: %12.4f\t%12.4f\n", TelemNames[i], v, v/64);
            s = s + Telem[i];
        }
    }
    av_log (NULL, AV_LOG_DEBUG, "%-20s: %12.4f\t%12.4f\n%20.4f\t%d\n",
            "total", s/TelemCnt, s/TelemCnt/64, s, TelemCnt);
}

/*
 * Count one profiled iteration.  The first call also registers
 * prof_report() with atexit() so the summary is emitted at program exit.
 */
static void bfprof (void)
{
    static int init;

    if (!init) {
        atexit (prof_report);
        init = 1;
    }
    TelemCnt++;
}

#else

/* Profiling disabled: all three hooks expand to nothing. */
#define PROF(a,b)
#define EPROF()
#define bfprof()

#endif
|
|
|
#endif /* AVCODEC_BFIN_DSPUTIL_BFIN_H */
|
|
|