runMode_3.py

import numpy
from tensorflow import keras
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense, Dropout, Activation
from tensorflow.keras.optimizers import SGD
import math
import VQ

from sklearn import preprocessing
from sklearn.decomposition import PCA

from sklearn.preprocessing import OneHotEncoder
from VQ import Features
import glob
import sys
from tensorflow.keras.models import model_from_json
import _pickle
import os
import json
import matplotlib.pyplot as plt
import numpy as np
from matplotlib import cm
from scipy.io import wavfile
import librosa


class Train(object):
	"""docstring for Train"""
	frame_size = 0.032
	frame_shift = 0.016
	mapping = {}

	def __init__(self,frame_size, frame_shift):
		# self.num_speakers = num_speakers
		Train.frame_size = frame_size
		Train.frame_shift = frame_shift
		self.featuresObj = Features(frame_size,frame_shift)
		self.model = Sequential()
		self.pca = PCA(n_components='mle', whiten = True) 


	def Pca(self, X_train):	
		self.pca.fit(X_train)
		X_train = self.pca.transform(X_train)
		# self.pca = pca
		return X_train


	def encodeY(self, y_train):
		y_train = numpy.reshape(y_train, (y_train.shape[0], 1))
		enc = OneHotEncoder()
		y_train =enc.fit_transform(y_train).toarray()
		return y_train


	def train(self, directory, epochs = 60, activation_fn = 'glorot_normal'):
		train_data = self.featuresObj.load_data(directory)
		X_train = train_data[0]
		y_train = train_data[1]
		# print X_train.shape

		X_train = self.Pca(X_train)
		y_train = self.encodeY(y_train)
		# print y_train
		# print X_train.shape
		# print y_train.shape
		# print 
		self.model.add(Dense(64, input_dim=X_train.shape[1] , init=activation_fn))
		self.model.add(Activation('tanh'))
		self.model.add(Dropout(0.5))

		self.model.add(Dense(self.featuresObj.num_speakers, init=activation_fn))
		self.model.add(Activation('softmax'))

		sgd = SGD(lr=0.1, decay=1e-6, momentum=0.9, nesterov=True)
		self.model.compile(loss='categorical_crossentropy',
					  optimizer=sgd,
					  metrics=['accuracy'])

		self.model.fit(X_train, y_train, nb_epoch=epochs, validation_split= 0.2, batch_size=32)
		self.mapping = self.featuresObj.mapping

	
	def test(self, testdirec, model, pca):
		# pca = self.train()
		num_speakers = filecount(testdirec)
		testdirec = testdirec + "/"
		files = glob.glob(testdirec + "*.wav")
		tot_positives = 0
		speaker_no = 0

		while (speaker_no < num_speakers):
			speaker_no += 1
			filename = testdirec + str(speaker_no) + ".wav"
			print (filename)
			print

			flag = self.testFile(filename, model, pca, speaker_no-1)
			if flag:
				tot_positives +=1

		print ("total number of correct answers = " + str(tot_positives))
		print 
		# print
		return tot_positives


	def testFile(self, filename, model, pca, phone_number, mapping):
		test_data = self.featuresObj.getFeaturesFromWave(filename)  ### frames by features(34)
		X_test = test_data
		X_test = pca.transform(X_test)
		modelNN = model.predict(X_test)

		sumRows = numpy.sum(modelNN, axis=0)
		sumRows /= modelNN.shape[0]
		print (sumRows)
		print
		index = numpy.argmax(sumRows)
		print (sumRows[index])
		print (mapping)
		user_id = mapping[str(index+1)]
		print (user_id)
		print (phone_number)
		try:
			if int(phone_number)==int(user_id):
				if sumRows[index]<0.4:
					print (' true but less than 0.4' )
					print
				return True
			else:
				return False	
		except Exception :
			print ("Something went wrong. Try entering a new phone number without characters")
			raise Exception
		

### counts number of directories in the given directory

def fcount(path):
	count = 0
	for f in os.listdir(path):
		child = os.path.join(path, f)
		if os.path.isdir(child):
			count +=1
	return count

def filecount(path):
	count = 0
	for f in os.listdir(path):
		child = os.path.join(path, f)
		if os.path.isfile(child):
			count +=1
	return count


if __name__ == "__main__":
	num_args = len(sys.argv)

	if num_args < 3:
		print ("""Enter task to be performed :
				python runMode_3.py train /path to train directory  for training
				python runMode_3.py test phone_number /path to test file for test
				Enter directory name as well as test file name with it
				""")
		rate, sig = librosa.load('./' + 'b.wav')
		mfcc_feat = librosa.feature.mfcc(rate,sig)

		ig, ax = plt.subplots()
		mfcc_data= np.swapaxes(mfcc_feat, 0 ,1)
		cax = ax.imshow(mfcc_data, interpolation='nearest', cmap=cm.coolwarm, origin='lower', aspect='auto')
		ax.set_title('MFCC')
		#Showing mfcc_data
		plt.show()
		#Showing mfcc_feat
		plt.plot(mfcc_feat)
		plt.show()

	elif num_args >= 3:
		if sys.argv[1] == 'train':
			# direc = raw_input('Please Enter Input directory for training: ')
			direc = sys.argv[2]
			print (direc)
			print (type(direc))
			speakers = int(fcount(direc))

			t = Train(frame_size=0.032, frame_shift=0.016)
			t.train(direc, 20)
			json_string = t.model.to_json()
			open('my_model_architecture.json', 'w').write(json_string)
			t.model.save_weights('my_model_weights.h5', overwrite = True)
			
			with open('my_dumped_pca.pkl', 'wb') as fid:
				cPickle.dump(t.pca, fid)

			fid.close()
			with open('dictionary.json', 'w') as f:
				json.dump(t.mapping, f)

			f.close()
			print ("model is saved Finally")

		elif sys.argv[1] == 'test' :
			# testdirec = raw_input('Please enter Input directory or file for testing: ')
			testdirec = sys.argv[3]
			if os.path.isdir(testdirec):
				flag = True
			else:
				flag = False
			
			t = Train(frame_size=0.032, frame_shift=0.016)

			model = model_from_json(open('my_model_architecture.json').read())
			model.load_weights('my_model_weights.h5')

			with open('my_dumped_pca.pkl', 'rb') as fid:
				pca_loaded = cPickle.load(fid)

			fid.close()
			with open('dictionary.json', 'r') as f:
				try:
					mapping = json.load(f)
				except ValueError:
					mapping = {}

			print (mapping)
			f.close()

			sgd = SGD(lr=0.1, decay=1e-6, momentum=0.9, nesterov=True)
			model.compile(loss='categorical_crossentropy',
						  optimizer=sgd,
						  metrics=['accuracy'])
			print ("model is read ")
			if flag:
				tot_positives = t.test(testdirec, model, pca_loaded)
				print (tot_positives)
			else:
				# phone_number = raw_input('Please enter phone number for current user:')
				phone_number = sys.argv[2]
				true = t.testFile(testdirec, model, pca_loaded, phone_number, mapping)
				print (true)
				print
		else:
			print ('wrong argument entered: Please enter "train" or "test"')
	else:
		print ("enter one argument whether to train or test")

	sys.exit(0)