Alejandro Acuña
2024-08-12 1876e65234c20209001178705cfa50d8f9ded67a
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
// VoiceActivityDetector.cpp: implementation of the VoiceActivityDetector class.
//
//////////////////////////////////////////////////////////////////////
 
#include "VoiceActivityDetector.h"
#include "AudioSample.h"
 
//////////////////////////////////////////////////////////////////////
// Construction/Destruction
//////////////////////////////////////////////////////////////////////
 
// Constructs a detector with detection switched on, labels its tracer with a
// per-instance sub-facility name of the form "VAD:<address of this object>",
// and then loads the trace mask through SetTraceLevel().
VoiceActivityDetector::VoiceActivityDetector()
{
    EnableDetection();
    char subFacilityName[100];
    // %p is the only printf conversion defined for pointer arguments. The
    // previous "%x" expects an unsigned int: passing a pointer there is
    // undefined behaviour and loses the upper half of the address wherever
    // pointers are wider than int. The 100-byte buffer remains far larger
    // than "VAD:" plus any printed address.
    sprintf(subFacilityName, "VAD:%p", static_cast<void *>(this));
    tracer.SetSubFacilityName(subFacilityName);
    SetTraceLevel();
}
 
// Destructor: performs no explicit cleanup; the body is intentionally empty.
VoiceActivityDetector::~VoiceActivityDetector()
{
}
 
int
VoiceActivityDetector::SetTraceLevel()
{
    long SystemMask = 0;
    if ((SystemMask = GetRegKeyLong(HKEY_CURRENT_USER, "Software\\Cisco Systems\\MTC\\Tracing", "AllComponents", 0x0)) == 0)
    {
        SystemMask = GetRegKeyLong(HKEY_CURRENT_USER, "Software\\Cisco Systems\\MTC\\Tracing", "VAD", 0x100000);
    }
    tracer.SetSystemMask(SystemMask);
    return 0;
}
 
int
VoiceActivityDetector::EnableDetection()
{
    enabled = true;
    return 0;
}
 
int
VoiceActivityDetector::DisableDetection()
{
    enabled = false;
    return 0;
}
 
int
VoiceActivityDetector::TransformStarted()
{
    return vad.Initialize();
}
 
int
VoiceActivityDetector::TransformAudioSamples(std::vector<std::pair<AudioSample *, AudioSource *> > &data, AudioSample **ppAudioSample)
{
    AudioSample *inSample = data[0].first;
    int result = 0;
    *ppAudioSample = inSample;
    inSample->AddRef(this);
    if (enabled)
    {
        int numSamples = inSample->DataSize() / 2;
        if (vad.IsSilence((short *)(inSample->Data()), numSamples))
        {
            // silence period
            // vad assumes 8kHz 16bit PCM mono input
            inSample->SetDataSize(0);
            inSample->SetSilenceDuration(numSamples/8);
            tracer.tracef(DET, "Silence : %dms\n", numSamples/8);
        }
        else
        {
            tracer.tracef(DET, "Speech : %dms\n", numSamples/8);
        }
    }
    else
    {
        tracer.tracef(DET, "Disabled\n");
    }
    return result;
}