File size: 1,887 Bytes
15ac91d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
import argparse
import csv
import os

from utilities import create_folder


def dcase2017task4(args):
    """Create black list. Black list is a list of audio ids that will be 
    skipped in training. 
    """

    # Augments & parameters
    workspace = args.workspace
    
    # Black list from DCASE 2017 Task 4
    test_weak_csv = 'metadata/black_list/groundtruth_weak_label_testing_set.csv'
    evaluation_weak_csv = 'metadata/black_list/groundtruth_weak_label_evaluation_set.csv'
    
    black_list_csv = os.path.join(workspace, 'black_list', 'dcase2017task4.csv')
    create_folder(os.path.dirname(black_list_csv))
    
    def get_id_sets(csv_path):
        with open(csv_path, 'r') as fr:
            reader = csv.reader(fr, delimiter='\t')
            lines = list(reader)
         
        ids_set = [] 
        
        for line in lines:
            """line: ['-5QrBL6MzLg_60.000_70.000.wav', '60.000', '70.000', 'Train horn']"""
            ids_set.append(line[0][0 : 11])
            
        ids_set = list(set(ids_set))
        return ids_set
        
    test_ids_set = get_id_sets(test_weak_csv)
    evaluation_ids_set = get_id_sets(evaluation_weak_csv)
    
    full_ids_set = test_ids_set + evaluation_ids_set
    
    # Write black list
    fw = open(black_list_csv, 'w')
    
    for id in full_ids_set:
        fw.write('{}\n'.format(id))
        
    print('Write black list to {}'.format(black_list_csv))
    

if __name__ == '__main__':
    parser = argparse.ArgumentParser(description='')
    subparsers = parser.add_subparsers(dest='mode')

    parser_dcase2017task4 = subparsers.add_parser('dcase2017task4')
    parser_dcase2017task4.add_argument('--workspace', type=str, required=True)
        
    args = parser.parse_args()

    if args.mode == 'dcase2017task4':
        dcase2017task4(args)
        
    else:
        raise Exception('Error argument!')