-
-
Notifications
You must be signed in to change notification settings - Fork 75
/
test.py
92 lines (69 loc) · 2.63 KB
/
test.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
import os
import cPickle
import numpy as np
from scipy.io.wavfile import read
from featureextraction import extract_features
#from speakerfeatures import extract_features
import warnings
warnings.filterwarnings("ignore")
import time
"""
#path to training data
source = "development_set/"
modelpath = "speaker_models/"
test_file = "development_set_test.txt"
file_paths = open(test_file,'r')
"""
# Directory holding the audio files to test. It is joined to file names by
# plain string concatenation further down, so the trailing slash is required.
source = "SampleData/"

# Directory holding the trained speaker models, one "<speaker>.gmm" pickle each.
modelpath = "Speakers_models/"

# Every *.gmm file found in the model directory is one candidate speaker.
gmm_files = [os.path.join(modelpath, fname)
             for fname in os.listdir(modelpath)
             if fname.endswith('.gmm')]


def _load_model(fname):
    """Unpickle the model stored in `fname` and close the file afterwards."""
    # NOTE(review): unpickling can execute arbitrary code, so only model
    # files produced by a trusted training run should be placed in modelpath.
    # NOTE(review): text mode 'r' is kept from the original; pickle files are
    # normally opened in binary mode -- confirm how the training script
    # writes them before switching to 'rb'.
    with open(fname, 'r') as handle:
        return cPickle.load(handle)


# Load the per-speaker models; models[i] belongs to speakers[i].
models = [_load_model(fname) for fname in gmm_files]

# Speaker name = model file name with the directory and ".gmm" removed.
speakers = [os.path.basename(fname).split(".gmm")[0] for fname in gmm_files]

# Running totals for the batch-test mode: misidentified files / files tested.
error = 0
total_sample = 0.0
def _say(*parts):
    """Print `parts` on one line, separated by single spaces.

    Produces the same text as the Python 2 statement `print a, b, ...` for
    the values used in this script, while remaining valid syntax for a
    Python 3 parser as well.
    """
    print(" ".join(str(part) for part in parts))


def _identify_speaker(path):
    """Return the name of the speaker whose model scores `path` highest.

    `path` is a file name relative to `source`. The audio is read, turned
    into a feature matrix by `extract_features`, and scored against every
    loaded model; the speaker of the best-scoring model is returned.
    Raises ValueError (from np.argmax) when no models are loaded.
    """
    sr, audio = read(source + path)
    vector = extract_features(audio, sr)

    # One total score per model. np.array(...).sum() collapses whatever
    # score() returns (a scalar or an array) to a single number --
    # presumably log-likelihoods; confirm against the model class used.
    log_likelihood = np.array(
        [np.array(gmm.score(vector)).sum() for gmm in models])

    winner = np.argmax(log_likelihood)
    return speakers[winner]


_say("Do you want to Test a Single Audio: Press '1' or The complete Test Audio Sample: Press '0' ?")
take = int(raw_input().strip())

if take == 1:
    # Single-file mode: identify one file named by the user.
    _say("Enter the File name from Test Audio Sample Collection :")
    path = raw_input().strip()
    _say("Testing Audio : ", path)
    _say("\tdetected as - ", _identify_speaker(path))
    time.sleep(1.0)

elif take == 0:
    # Batch mode: identify every file listed (one per line) in test_file and
    # report how many were attributed to the wrong speaker.
    test_file = "testSamplePath.txt"

    # The context manager closes the list file even if a sample fails.
    with open(test_file, 'r') as file_paths:
        for path in file_paths:
            path = path.strip()
            if not path:
                # A blank line is not a sample; without this guard it would
                # be counted and then crash the WAV reader.
                continue

            total_sample += 1.0
            _say("Testing Audio : ", path)
            detected = _identify_speaker(path)
            _say("\tdetected as - ", detected)

            # The expected speaker is the part of the listed path that
            # precedes the first underscore.
            checker_name = path.split("_")[0]
            if detected != checker_name:
                error += 1
            time.sleep(1.0)

    _say(error, total_sample)
    if total_sample:
        accuracy = ((total_sample - error) / total_sample) * 100
        _say("The Accuracy Percentage for the current testing Performance with MFCC + GMM is : ", accuracy, "%")
    else:
        # An empty list used to end in ZeroDivisionError here.
        _say("No test samples were listed in", test_file)

_say("Hurrey ! Speaker identified. Mission Accomplished Successfully. ")