-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathlib.h
56 lines (30 loc) · 1.5 KB
/
lib.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
#ifndef NYUMAYA_AUDIO_RECOGNITION_H
#define NYUMAYA_AUDIO_RECOGNITION_H
#include <cstddef>
#include <cstdint>
#include <string>
//Opaque implementation types. They are only forward-declared here and are
//used in this header exclusively through pointers, which serve as handles.
class AudioRecognitionImpl;
class FeatureExtractor;
class SpeakerVerificationImpl;
extern "C"
{
//Return the library version as a NUL-terminated string with static storage.
//The caller must not modify or free the returned pointer.
//NOTE(review): this is a non-inline function definition inside a header, so
//including the header from more than one translation unit produces duplicate
//definitions at link time; consider moving the body into a source file.
const char* GetVersionString()
{
    static const char kVersion[] = "0.3.4";
    return kVersion;
}
//Audio Recognition
//Create an audio recognition object and return an opaque handle to it.
//@param modelPath Path of the model to use, as a C string
//@return Handle to pass as impl to the functions taking an AudioRecognitionImpl*
//NOTE(review): the value returned on failure and the way the handle is
//released are not visible in this header - confirm against the implementation.
AudioRecognitionImpl* create_audio_recognition(const char* modelPath);
//Input mel features and get the index of the detected label if one is recognized
//@param impl Audio recognition handle
//@param data Mel features as uint8_t values; not written through (pointer to const)
//@param mel_length Number of mel features in data
//@return Index of the detected label
//NOTE(review): uint8_t is unsigned; confirm whether the feature values are
//meant to be interpreted as signed. The value returned when nothing is
//recognized is not specified in this header - confirm.
int RunDetection(AudioRecognitionImpl*impl,const uint8_t* const data,const int mel_length);
//Input mel features and get the raw probabilities of the labels
//@param impl Audio recognition handle
//@param data Mel features as uint8_t values; not written through (pointer to const)
//@param mel_length Presumably the number of mel features in data - TODO confirm
//@return Pointer to the raw label probabilities, stored as uint8_t values
//NOTE(review): the length and scaling of the returned buffer, and who owns or
//frees it, are not visible in this header - confirm before use.
uint8_t*RunRawDetection(AudioRecognitionImpl*impl,const uint8_t* const data,const int mel_length);
//Set the sensitivity of an audio recognition handle.
//@param impl Audio recognition handle
//@param sens New sensitivity value
//NOTE(review): the valid range of sens and its effect on detection are not
//documented in this header - confirm against the implementation.
void SetSensitivity(AudioRecognitionImpl*impl,float sens);
//Query the input data size of an audio recognition handle.
//@param impl Audio recognition handle
//@return Input data size as a size_t
//NOTE(review): presumably the number of mel feature values expected per
//detection call; the unit is not stated in this header - confirm.
size_t GetInputDataSize(AudioRecognitionImpl*impl);
//Speaker Verification
//Create a speaker verification object and return an opaque handle to it.
//@param modelPath Path of the model to use, as a C string
//@return Handle to pass as impl to the functions taking a SpeakerVerificationImpl*
//NOTE(review): the value returned on failure and the way the handle is
//released are not visible in this header - confirm against the implementation.
SpeakerVerificationImpl* create_speaker_verification(const char*modelPath);
//Run speaker verification on the given input data.
//@param impl Speaker verification handle
//@param data Input values as uint8_t; not written through (pointer to const)
//@param array_length Presumably the number of elements in data - TODO confirm
//@return Pointer to uint8_t result data
//NOTE(review): the meaning, length and ownership of the returned buffer are
//not visible in this header - confirm before use.
uint8_t* VerifySpeaker(SpeakerVerificationImpl*impl,const uint8_t* const data,const int array_length);
//Feature Extractor
//Create a feature extractor object and return an opaque handle to it.
//All parameters have default values, so the function can be called with no
//arguments from C++. Default arguments are a C++ feature; callers that bind to
//the C symbol directly have to pass every argument explicitly.
//@param nfft FFT size (default 512)
//@param melcount Number of mel features (default 40)
//@param sample_rate Sample rate (default 16000; presumably Hz - confirm)
//@param lowerf Lower frequency bound (default 20; presumably Hz - confirm)
//@param upperf Upper frequency bound (default 8000; presumably Hz - confirm)
//@param window_len Window length (default 0.03; presumably seconds - confirm)
//@param shift Window shift (default 0.01; presumably seconds - confirm)
//@return Handle to pass as impl to the functions taking a FeatureExtractor*
//NOTE(review): how the handle is released is not visible in this header.
FeatureExtractor* create_feature_extractor(size_t nfft=512,size_t melcount = 40,size_t sample_rate=16000,
size_t lowerf=20, size_t upperf=8000,float window_len=0.03,float shift=0.01);
//Convert a PCM signal to mel features.
//@param impl Feature extractor handle
//@param pcm Input samples as int16_t; not written through (pointer to const)
//@param len Length of pcm (presumably in samples - confirm)
//@param result Output buffer of uint8_t values supplied by the caller
//@param gain Gain value (presumably applied to the signal - confirm)
//@return int result
//NOTE(review): the required capacity of result and the meaning of the return
//value are not visible in this header - confirm against the implementation.
int signal_to_mel(FeatureExtractor*impl,const int16_t * const pcm, size_t len,uint8_t*result,float gain);
//Query the mel count of a feature extractor handle.
//@param impl Feature extractor handle
//@return Mel count as a size_t (presumably the melcount the extractor was
//created with - confirm)
size_t get_melcount(FeatureExtractor*impl);
//Print the mel filter of a feature extractor handle.
//@param impl Feature extractor handle
//NOTE(review): the output destination and format are not visible in this
//header - presumably standard output, intended for debugging; confirm.
void print_mel_filter(FeatureExtractor*impl);
}
#endif