# feature_extraction.py

from pathlib import Path  # For locating the .wav files inside the input folder
import os
import argparse
from parsel_process import *
import pandas as pd

def add_filpath(filepath):
    """Return ``filepath`` exactly as it was passed in."""
    return filepath

if __name__ == "__main__":
    # Command-line entry point.
    #
    # Positional arguments: samplingRate (int), filePath (a .wav file or a
    # folder that is searched recursively for .wav files) and writePath (used
    # to build the output CSV name and also passed to analyse_mfcc).
    # Every optional flag selects one group of extraction functions from
    # ``function_dic``. One row per audio file is collected and the table is
    # written to a CSV file at the end.
    parser = argparse.ArgumentParser(
        description="Provide the sampling rate and file path and features to be extracted"
    )
    parser.add_argument(
        "samplingRate", type=int,
        help="desired sample rate for the file to be read with",
    )
    parser.add_argument(
        "filePath", type=str,
        help="path to the file (including '.wav extension), or folder containing the files, audio files must be in .wav format",
    )
    parser.add_argument(
        "writePath", type=str,
        help="file to append result to, default is a new file in the current location",
    )
    parser.add_argument(
        "--formants", action="store_true",
        help="extract 4 formants",
    )
    parser.add_argument(
        "--ZCR", action="store_true",
        help="extract zero crossing rate",
    )
    parser.add_argument(
        "--harmonics", action="store_true",
        help="extract harmonics",
    )
    parser.add_argument(
        "--rate_of_speech", action="store_true",
        help="extract number of syllables, words and pauses",
    )
    parser.add_argument(
        "--loudness", action="store_true",
        help="extract max intensity and intensity",
    )
    parser.add_argument(
        "--pitch_features", action="store_true",
        help="extract pitch, shimmer, jitter and pitch range",
    )
    parser.add_argument(
        "--spectral_features", action="store_true",
        help="extract spectral slope, mfcc and mean spectral roll off",
    )
    parser.add_argument(
        "--energy", action="store_true",
        help="extract energy",
    )

    args = parser.parse_args()

    SAMPLING_RATE = args.samplingRate
    PATH = args.filePath
    WRITE_PATH = args.writePath

    # Maps each command-line flag to the extraction functions it enables.
    # "formants" lists the same function four times: it is called once per
    # formant number (1..4).
    function_dic = {
        "formants": [analyse_formants, analyse_formants, analyse_formants, analyse_formants],
        "ZCR": [analyse_zero_crossing],
        "harmonics": [analyse_harmonics],
        "rate_of_speech": [get_number_sylls, get_number_words, pauses],
        "loudness": [get_max_intensity, analyse_intensity],
        "pitch_features": [analyse_pitch, analyse_pitch_range, analyse_shimmer, analyse_jitter],
        "spectral_features": [spectral_slope, analyse_mfcc, mean_spectral_rolloff],
        "energy": [get_energy],
    }

    # A path counts as a single audio file only when its extension is .wav and
    # it is not a directory; a plain substring test would misclassify folders
    # whose name merely contains ".wav". Folder contents are processed in
    # sorted (lexicographic) path order.
    source = Path(PATH)
    if source.suffix.lower() == ".wav" and not source.is_dir():
        pathlist = [PATH]
    else:
        pathlist = sorted(source.glob("**/*.wav"))
    if not pathlist:
        raise ValueError("The filepath must be a .wav file or a folder containing .wav files")

    # Only look at the feature flags. Scanning every parsed argument for
    # ``== True`` would also pick up samplingRate when it equals 1.
    selected_features = [name for name in function_dic if getattr(args, name)]

    # Column name -> list of per-file values; every column must end up with
    # exactly one entry per file for the DataFrame to be built.
    dic = {"filepath": [], "duration": []}
    for path in pathlist:
        filename_ext = os.path.basename(os.path.normpath(path))
        # Keeps everything before the first dot of the file name.
        dic["filepath"].append(filename_ext.split(".", 1)[0])

        # NOTE(review): ``librosa`` is not imported in this file directly; it
        # is presumably re-exported by ``from parsel_process import *`` - confirm.
        # The duration is measured on the signal as loaded with librosa's
        # default settings (SAMPLING_RATE is not passed here).
        y, s = librosa.load(path)
        y = librosa.to_mono(y)
        dic["duration"].append(librosa.get_duration(y=y, sr=s))

        for feature in selected_features:
            funcs = function_dic[feature]
            if feature == "formants":
                # Formant extractors take (formant_number, path). The four
                # results are stored together as one list in a single column.
                # They must not also fall through to the generic call below,
                # which would invoke them with the wrong arguments and add
                # extra entries to the column.
                formant_values = [
                    func(number, str(path))
                    for number, func in enumerate(funcs, start=1)
                ]
                dic.setdefault(funcs[-1].__name__, []).append(formant_values)
                continue

            for func in funcs:
                if func.__name__ == "analyse_mfcc":
                    # analyse_mfcc additionally receives the write path.
                    value = func(str(path), WRITE_PATH, SAMPLING_RATE)
                else:
                    value = func(str(path), SAMPLING_RATE)
                dic.setdefault(func.__name__, []).append(value)

    # WRITE_PATH has always been used as a plain prefix of "features.csv".
    # When it names an existing directory, join it properly so that "out"
    # yields "out/features.csv" instead of "outfeatures.csv".
    if os.path.isdir(WRITE_PATH):
        output_file = os.path.join(WRITE_PATH, "features.csv")
    else:
        output_file = f"{WRITE_PATH}features.csv"
    pd.DataFrame(dic).to_csv(output_file, index=False)