import parselmouth as pm from pysndfile import sndio as snd def pitch_array(sample_file='outputs/audio/sunflowers-Victoria-180-normal-870.aiff'): samples, samplerate, _ = snd.read(sample_file) sample_sound = pm.Sound(values=samples,sampling_frequency=samplerate) sample_pitch = sample_sound.to_pitch() return sample_pitch.to_matrix().as_array() def intensity_array(sample_file='outputs/audio/sunflowers-Victoria-180-normal-870.aiff'): sample_file='outputs/audio/sunflowers-Victoria-180-normal-870.aiff' samples, samplerate, _ = snd.read(sample_file) sample_sound = pm.Sound(values=samples,sampling_frequency=samplerate) sample_intensity = sample_sound.to_mfcc() sample_intensity.as_array().shape return sample_pitch.to_matrix().as_array() def compute_mfcc(sample_file='outputs/audio/sunflowers-Victoria-180-normal-870.aiff'): # sample_file='outputs/audio/sunflowers-Victoria-180-normal-870.aiff' samples, samplerate, _ = snd.read(sample_file) sample_sound = pm.Sound(values=samples,sampling_frequency=samplerate) sample_mfcc = sample_sound.to_mfcc() # sample_mfcc.to_array().shape return sample_mfcc.to_array() # sunflowers_vic_180_norm = pitch_array('outputs/audio/sunflowers-Victoria-180-normal-870.aiff') # sunflowers_fred_180_norm = pitch_array('outputs/audio/sunflowers-Fred-180-normal-6515.aiff') # sunflowers_vic_180_norm_mfcc = compute_mfcc('outputs/audio/sunflowers-Victoria-180-normal-870.aiff') fred_180_norm_mfcc = compute_mfcc('outputs/audio/sunflowers-Fred-180-normal-6515.aiff') alex_mfcc = compute_mfcc('outputs/audio/sunflowers-Alex-180-normal-4763.aiff') # # sunflowers_vic_180_norm.shape # # sunflowers_fred_180_norm.shape # alex_mfcc.shape # sunflowers_vic_180_norm_mfcc.shape # sunflowers_fred_180_norm_mfcc.shape from speech_spectrum import generate_aiff_spectrogram vic_spec = generate_aiff_spectrogram('outputs/audio/sunflowers-Victoria-180-normal-870.aiff') alex_spec = generate_aiff_spectrogram('outputs/audio/sunflowers-Alex-180-normal-4763.aiff') alex150spec = generate_aiff_spectrogram('outputs/audio/sunflowers-Alex-150-normal-589.aiff') vic_spec.shape alex_spec.shape alex150spec.shape alex_mfcc.shape fred_180_norm_mfcc.shape # pm.SoundFileFormat # pm.Pitch.get_number_of_frames()