/* pHash, the open source perceptual hash library Copyright (C) 2009 Aetilius, Inc. All rights reserved. This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program. If not, see . Evan Klinger - eklinger@phash.org D Grant Starkweather - dstarkweather@phash.org */ #ifndef _AUDIO_PHASH_H #define _AUDIO_PHASH_H #include #include #include #include #include #include "pHash.h" extern "C" { #include "ph_fft.h" } /* /brief count number of samples in file * * /param filename - path and file name of audio file * /param sr - sample rate conversion * /param channels - channels number conversion * /return int count of number of sampels, negative for error */ int ph_count_samples(const char *filename, int sr,int channels); /* /brief read audio * * /param filename - path and name of audio file to read * /param sr - sample rate conversion * /param channels - nb channels to convert to (always 1) unused * /param buf - preallocated buffer * /param buflen - (in/out) param for buf length * /param nbsecs - float value for duration (in secs) to read from file * /return float* - float pointer to start of buffer - one channel of audio, NULL if error */ float* ph_readaudio(const char *filename, int sr, int channels, float *sigbuf, int &buflen, const float nbsecs = 0); /* /brief audio hash calculation * purpose: hash calculation for each frame in the buffer. * Each value is computed from successive overlapping frames of the input buffer. * The value is based on the bark scale values of the frame fft spectrum. The value * computed from temporal and spectral differences on the bark scale. * * /param buf - pointer to start of buffer * /param N - length of buffer * /param sr - sample rate on which to base the audiohash * /param nb_frames - (out) number of frames in audio buf and length of audiohash buffer returned * /return uint32 pointer to audio hash, NULL for error */ uint32_t* ph_audiohash(float *buf, int nbbuf, const int sr, int &nbframes); DP **ph_audio_hashes(char *files[], int count, int sr = 8000, int channels = 1, int threads = 0); /* /brief bit count set bits in 32bit variable * /param n * /return int number of bits set to 1, negative if error */ int ph_bitcount(uint32_t n); /* /brief compare 2 hash blocks * /param ptr_blockA - pointer to the first block * /param ptr_blockB - pointer to the second block * /param block_size - length of both blocks to compare * /return double bit error rate (ber) from comparing two blocks, neg for error */ double ph_compare_blocks(const uint32_t *ptr_blockA,const uint32_t *ptr_blockB, const int block_size); /* /brief distance function between two hashes * * /param hash_a - first hash * /param Na - length of first hash * /param hash_b - second hash * /param Nb - length of second hash * /param threshold - threshold value to compare successive blocks, 0.25, 0.30, 0.35 * /param block_size - length of block_size, 256 * /param Nc - (out) length of confidence score vector * /return double - ptr to confidence score vector */ double* ph_audio_distance_ber(uint32_t *hash_a , const int Na, uint32_t *hash_b, const int Nb, const float threshold, const int block_size, int &Nc); #endif