the-assignment/classifier/feature_extraction/feature_extractor.py

# import essentia.standard
import essentia
from essentia.standard import (MonoLoader, Windowing, Spectrum, MFCC,
	ZeroCrossingRate, SpectralCentroidTime, RollOff, Flux, Envelope,
	FlatnessSFX, LogAttackTime, StrongDecay, FlatnessDB, HFC,
	SpectralComplexity, FrameGenerator, YamlOutput)

# Disable annoying info level logging
essentia.log.infoActive = False

class bcolors:
	BLUE = '\033[94m'
	GREEN = '\033[92m'
	YELLOW = '\033[93m'
	RED = '\033[91m'
	ENDC = '\033[0m'

def extractFeatures(audioPath, outputPath, sampleRate):
	# Loads the audio file specified
	loader = MonoLoader(filename = audioPath, sampleRate = sampleRate)
	audio = loader()

	# Sets up the functions that will be used
	# TODO check if zero phase windowing is something we might want
	window = Windowing(normalized = False, size = 6144, type = 'hamming',
		zeroPhase = False)
	spectrum = Spectrum()
	mfcc = MFCC(inputSize = 6144, sampleRate = sampleRate)
	zcr = ZeroCrossingRate()
	sc = SpectralCentroidTime(sampleRate = sampleRate)
	sr = RollOff(sampleRate = sampleRate)
	sf = Flux()
	env = Envelope(attackTime = 2, releaseTime = 300, sampleRate = sampleRate)
	flat = FlatnessSFX()
	logAtt = LogAttackTime(sampleRate = sampleRate)
	strDec = StrongDecay(sampleRate = sampleRate)
	flatDB = FlatnessDB()
	hfc = HFC(sampleRate = sampleRate)
	spcComp = SpectralComplexity(sampleRate = sampleRate, magnitudeThreshold = 2)

	# Creates a pool to collect the values of the features
	pool = essentia.Pool()

	# Slices the signal into frames
	for frame in FrameGenerator(audio, frameSize = 6144, hopSize = 3072,
		startFromZero = True , validFrameThresholdRatio = 0.7):
		# Applies a window function to the frame
		windowedFrame = window(frame)

		# Computes time domain features
		frameZCR = zcr(windowedFrame)
		frameSC = sc(windowedFrame)
		frameEFlatness = flat(env(windowedFrame))
		frameLogAtt = logAtt(env(windowedFrame))[1]
		frameStrDec = strDec(windowedFrame)

		# Computes spectral features
		frameSpectrum = spectrum(windowedFrame)
		frameSR = sr(frameSpectrum)
		frameSF = sf(frameSpectrum)
		frameSEFlatness = flat(env(frameSpectrum))
		frameSLogAtt = logAtt(env(frameSpectrum))[1]
		frameSStrDec = strDec(frameSpectrum)
		frameSFlat = flatDB(frameSpectrum)
		frameHFC = hfc(frameSpectrum)
		frameSComp = spcComp(frameSpectrum)

		# Computes cepstral features
		# Discards the bands
		mfcc_coeffs = mfcc(frameSpectrum)[1]

		# Adds the values to the pool
		pool.add('ZCR', frameZCR)
		pool.add('SC', frameSC)
		pool.add('Flat', frameEFlatness)
		pool.add('LAtt', frameLogAtt)
		pool.add('SDec', frameStrDec)

		pool.add('SR', frameSR)
		pool.add('SF', frameSF)
		pool.add('SEFlat', frameSEFlatness)
		pool.add('SFlat', frameSFlat)
		pool.add('SLAtt', frameSLogAtt)
		pool.add('SSDec', frameSStrDec)
		pool.add('HFC', frameHFC)
		pool.add('SComp', frameSComp)

		for index, coef in enumerate(mfcc_coeffs):
			pool.add('mfcc' + str(index), coef)

	YamlOutput(filename = outputPath, format = 'json', writeVersion = False)(pool)

# Prints a nice message to let the user know the module was imported
print(bcolors.BLUE + 'feature_extractor loaded' + bcolors.ENDC)

# Enables executing the module as a standalone script
if __name__ == "__main__":
	import sys
	extractFeatures(sys.argv[1], sys.argv[2], int(sys.argv[3]))
Move feature extraction to separate folder, Init batch_feature_extractor 6 years ago			`# import essentia.standard`
Init feature_extractor 6 years ago			`import essentia`
Move feature extraction to separate folder, Init batch_feature_extractor 6 years ago			`from essentia.standard import (MonoLoader, Windowing, Spectrum, MFCC,`
Add more features 6 years ago			`ZeroCrossingRate, SpectralCentroidTime, RollOff, Flux, Envelope,`
Init k-Fold Cross Validation, Add test script, Remove LPC features, Minor fixes 6 years ago			`FlatnessSFX, LogAttackTime, StrongDecay, FlatnessDB, HFC,`
Add more features 6 years ago			`SpectralComplexity, FrameGenerator, YamlOutput)`
Move feature extraction to separate folder, Init batch_feature_extractor 6 years ago
			`# Disable annoying info level logging`
			`essentia.log.infoActive = False`
Init feature_extractor 6 years ago
Init k-Fold Cross Validation, Add test script, Remove LPC features, Minor fixes 6 years ago			`class bcolors:`
			`BLUE = '\033[94m'`
			`GREEN = '\033[92m'`
			`YELLOW = '\033[93m'`
			`RED = '\033[91m'`
			`ENDC = '\033[0m'`

Init feature_extractor 6 years ago			`def extractFeatures(audioPath, outputPath, sampleRate):`
			`# Loads the audio file specified`
Move feature extraction to separate folder, Init batch_feature_extractor 6 years ago			`loader = MonoLoader(filename = audioPath, sampleRate = sampleRate)`
Init feature_extractor 6 years ago			`audio = loader()`

			`# Sets up the functions that will be used`
			`# TODO check if zero phase windowing is something we might want`
			`window = Windowing(normalized = False, size = 6144, type = 'hamming',`
			`zeroPhase = False)`
			`spectrum = Spectrum()`
			`mfcc = MFCC(inputSize = 6144, sampleRate = sampleRate)`
			`zcr = ZeroCrossingRate()`
			`sc = SpectralCentroidTime(sampleRate = sampleRate)`
			`sr = RollOff(sampleRate = sampleRate)`
			`sf = Flux()`
Add more features 6 years ago			`env = Envelope(attackTime = 2, releaseTime = 300, sampleRate = sampleRate)`
			`flat = FlatnessSFX()`
			`logAtt = LogAttackTime(sampleRate = sampleRate)`
			`strDec = StrongDecay(sampleRate = sampleRate)`
			`flatDB = FlatnessDB()`
			`hfc = HFC(sampleRate = sampleRate)`
			`spcComp = SpectralComplexity(sampleRate = sampleRate, magnitudeThreshold = 2)`
Init feature_extractor 6 years ago
			`# Creates a pool to collect the values of the features`
			`pool = essentia.Pool()`

			`# Slices the signal into frames`
			`for frame in FrameGenerator(audio, frameSize = 6144, hopSize = 3072,`
			`startFromZero = True , validFrameThresholdRatio = 0.7):`
			`# Applies a window function to the frame`
			`windowedFrame = window(frame)`

			`# Computes time domain features`
			`frameZCR = zcr(windowedFrame)`
			`frameSC = sc(windowedFrame)`
Add more features 6 years ago			`frameEFlatness = flat(env(windowedFrame))`
			`frameLogAtt = logAtt(env(windowedFrame))[1]`
			`frameStrDec = strDec(windowedFrame)`
Init feature_extractor 6 years ago
			`# Computes spectral features`
			`frameSpectrum = spectrum(windowedFrame)`
			`frameSR = sr(frameSpectrum)`
			`frameSF = sf(frameSpectrum)`
Add more features 6 years ago			`frameSEFlatness = flat(env(frameSpectrum))`
			`frameSLogAtt = logAtt(env(frameSpectrum))[1]`
			`frameSStrDec = strDec(frameSpectrum)`
			`frameSFlat = flatDB(frameSpectrum)`
			`frameHFC = hfc(frameSpectrum)`
			`frameSComp = spcComp(frameSpectrum)`

Init models training, Other minor fixes 6 years ago			`# Computes cepstral features`
Init feature_extractor 6 years ago			`# Discards the bands`
			`mfcc_coeffs = mfcc(frameSpectrum)[1]`

			`# Adds the values to the pool`
			`pool.add('ZCR', frameZCR)`
			`pool.add('SC', frameSC)`
Add more features 6 years ago			`pool.add('Flat', frameEFlatness)`
			`pool.add('LAtt', frameLogAtt)`
			`pool.add('SDec', frameStrDec)`

Init feature_extractor 6 years ago			`pool.add('SR', frameSR)`
			`pool.add('SF', frameSF)`
Add more features 6 years ago			`pool.add('SEFlat', frameSEFlatness)`
			`pool.add('SFlat', frameSFlat)`
			`pool.add('SLAtt', frameSLogAtt)`
			`pool.add('SSDec', frameSStrDec)`
			`pool.add('HFC', frameHFC)`
			`pool.add('SComp', frameSComp)`

			`for index, coef in enumerate(mfcc_coeffs):`
			`pool.add('mfcc' + str(index), coef)`
Init feature_extractor 6 years ago
			`YamlOutput(filename = outputPath, format = 'json', writeVersion = False)(pool)`

			`# Prints a nice message to let the user know the module was imported`
Init k-Fold Cross Validation, Add test script, Remove LPC features, Minor fixes 6 years ago			`print(bcolors.BLUE + 'feature_extractor loaded' + bcolors.ENDC)`
Init feature_extractor 6 years ago
			`# Enables executing the module as a standalone script`
			`if __name__ == "__main__":`
			`import sys`
			`extractFeatures(sys.argv[1], sys.argv[2], int(sys.argv[3]))`