data_aquisition.py

from __future__ import unicode_literals
import youtube_dl
from moviepy.video.io.ffmpeg_tools import ffmpeg_extract_subclip
import csv
import ast
import os
import os.path
import argparse

#Class definitions

em_class = { '/m/03j1ly':'Emergency vehicle',
        '/m/04qvtq':'Police car(siren)',
        '/m/012n7d':'Ambulance(siren)',
        '/m/012ndj':'Fire engine, fire truck(siren)',
        '/m/03kmc9':'Siren',
            '/m/0dgbq'  :'Civil defense siren',
        '/m/030rvx' :'Buzzer',
        '/m/01y3hg' :'Smoke detector, smoke alarm',
        '/m/0c3f7m' :'Fire alarm',    
}
non_em_class = {'/m/07pbtc8':'Walk, footsteps',
        '/m/0gy1t2s':'Bicycle bell',
        '/m/03m9d0z':'Wind',
        '/t/dd00092':'Wind noise(microphone)',
        '/m/0jb2l'  :'Thunderstorm',
        '/m/0ngt1'  :'Thunder',
        '/m/06mb1'  :'Rain',
        '/m/0j2kx'  :'Waterfall',
        ##can probably exclude this
        '/m/028v0c' :'Silence',
        '/m/096m7z' :'Noise',
        '/m/06_y0by':'Environmental noise',
        '/m/07rgkc5':'Static',
        '/m/0chx_'  :'White noise',
        '/m/06bz3'  :'Radio',        
        #could be noise classes those listed above
        
        ###not sure about this '/m/07yv9'  :'Vehicle',
        ###not sure about this '/m/012f08' :'Moto vehicle(road)',
        '/m/0k4j'   :'Car',
        '/m/0912c9' :'Vehicle horn, car horn, honking',
        '/m/07rknqz':'Skidding',
        '/m/0h9mv'  :'Tire squeal',
        '/t/dd00134':'Car passing by',
        '/m/07r04'  :'Truck',
        '/m/05x_td' :'Air horn,truck horn',
        '/m0/4_sv'  :'Motorcycle',
         '/m/0btp2'  :'Traffic noise, roadway noise',
        '/m/0195fx' :'Subway, metro, underground',
        '/m/0199g'  :'Bicycle',
        '/m/06_fw'  :'Skateboard',
        
                    
}


def prepare_data(args):
    '''
    Prepares data in the 2 created sub-folders, 'emergency' and 'nonEmergency'
    '''
    base_download_path = str(args.download_dir)

    em_download_path = os.path.join(base_download_path, 'emergency')
    nonem_download_path = os.path.join(base_download_path, 'nonEmergency')

    base_save_path = str(args.save_dir)

    em_files_path = os.path.join(base_save_path, 'emergency')
    nonem_files_path = os.path.join(base_save_path, 'nonEmergency')

    ##################################
    os.chdir(base_download_path)

    # mention the name of the .csv file
    with open(args.csv_filename) as csvfile:   # Also use other csv audioset files too extract all the data available in these categories
        readCSV = csv.reader(csvfile,delimiter=',')
        count=0
        em_c=0
        non_em_c=0
        
        for row in readCSV:
            if(count<3):
                count=count+1
            else:
                v_id = row[0]
                #v_start = ast.literal_eval(row[1])
                #v_end = ast.literal_eval(row[2])
                v_start = float(row[1])
                v_end  = float(row[2])
                labels_list = row[3:]
                
                labels_id = []
                for labels in labels_list:
                    if labels == '':
                        break
                    else:
                        labels = labels.replace('\"','')
                        labels = labels.strip()
                        labels_id.append(labels)
                
                v_class = []
                for labels in labels_id:
                    v_class.extend(labels.split(","))

                flg1=0
                flg2=0
                
                ##Excluding videos present in both EM and non-EM
                if(set(v_class)&set(em_class.keys())!=set([])):
                    flg1=1
                if(set(v_class)&set(non_em_class.keys())!=set([])):
                    flg2=1

                if flg1==1 and flg2==1:
                    continue

                elif flg1==1:
                    print (v_id,v_start,v_end,'em')
                    ydl_opts = {
                            'format': 'bestaudio/best',
                        'ignoreerrors':'True',
                            'postprocessors': [{
                                'key': 'FFmpegExtractAudio',
                                'preferredcodec': 'wav',
                                'preferredquality': '192',
                            }],
                            'outtmpl':'emergency/%(id)s.%(ext)s',    
                    }

                    with youtube_dl.YoutubeDL(ydl_opts) as ydl:
                            ydl.download(['http://www.youtube.com/watch?v='+row[0]])

                    input_file = em_download_path+v_id+'.wav'
                    print(input_file)
                    # break
                    if(os.path.exists(input_file)):
                        print ('#############################################')
                        em_c = em_c +1
                        output_file = os.path.join(em_files_path, str(em_c)+'.wav')
                        print (output_file)
                        ffmpeg_extract_subclip(input_file,v_start,v_end,targetname=output_file)
                        os.remove(input_file)
                        
                elif flg2==1:
                    print (v_id,v_start,v_end,'Non-em')
                    ydl_opts = {
                            'format': 'bestaudio/best',
                        'ignoreerrors':'True',
                            'postprocessors': [{
                                'key': 'FFmpegExtractAudio',
                                'preferredcodec': 'wav',
                                'preferredquality': '192',
                            }],
                            'outtmpl':'nonEmergency/%(id)s.%(ext)s',    
                    }

                    with youtube_dl.YoutubeDL(ydl_opts) as ydl:
                            ydl.download(['http://www.youtube.com/watch?v='+row[0]])
                    
                    input_file = nonem_download_path+v_id+'.wav'
                    
                    if(os.path.exists(input_file)):
                        print ('#############################################')
                        non_em_c = non_em_c+1
                        output_file = os.path.join(nonem_files_path, str(non_em_c)+'.wav')
                        print (output_file)
                        ffmpeg_extract_subclip(input_file,v_start,v_end,targetname=output_file) 
                        os.remove(input_file)

if __name__ == "__main__":
    parser = argparse.ArgumentParser()

    parser.add_help
    parser.add_argument('--download_dir', help='Path to save the downloaded files', default=None)
    parser.add_argument('--save_dir', help='Path to save the extracted audio files', default=None)
    parser.add_argument('--csv_filename', help='Name of the AudioSet csv file (eval_segments.csv/balanced_train_segments.csv)', default=None)

    args = parser.parse_args()

    # Check needed, default values are None
    if args.download_dir is None or args.save_dir is None or args.csv_filename is None:
        raise ValueError("Need to specify Download and Save directories")

    prepare_data(args)