# Copyright (c) 2021 Binbin Zhang(binbzha@qq.com) # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. import argparse import json def load_label_and_score(keyword, label_file, score_file): # utt_id : score list score_table = {} with open(score_file, 'r', encoding='utf8') as fin: for line in fin: arr = line.strip().split() # key = utt_id key = arr[0] # scores is a list str_list = arr[1: ] scores = list(map(float, str_list)) score_table[key] = scores keyword_table = {} filler_table = {} filler_duration = 0.0 # label_file = data.list with open(label_file, 'r', encoding='utf8') as fin: for line in fin: obj = json.loads(line.strip()) assert 'key' in obj assert 'txt' in obj assert 'duration' in obj key = obj['key'] # txt is label index = obj['txt'] duration = obj['duration'] assert key in score_table # txt == keyword , correct if index == keyword: keyword_table[key] = score_table[key] else: # false filler_table[key] = score_table[key] filler_duration += duration return keyword_table, filler_table, filler_duration if __name__ == '__main__': parser = argparse.ArgumentParser(description='compute det curve') parser.add_argument('--test_data', required=True, help='label file') parser.add_argument('--keyword', type=int, default=0, help='score file') parser.add_argument('--score_file', required=True, help='score file') parser.add_argument('--step', type=float, default=0.01, help='score file') parser.add_argument('--stats_file', required=True, help='false reject/alarm stats file') args = parser.parse_args() # 'window_shift' is used to skip the frames after triggered window_shift = 50 keyword_table, filler_table, filler_duration = load_label_and_score( args.keyword, args.test_data, args.score_file) print('Filler total duration Hours: {}'.format(filler_duration / 3600.0)) # print('keyword_table.size = ', len(keyword_table)) # print('filler_table.size = ', len(filler_table)) # print('filler_duration = ', filler_duration) with open(args.stats_file, 'w', encoding='utf8') as fout: threshold = 0.0 while threshold <= 1.0: num_false_reject = 0 # transverse the all keyword_table for key, score_list in keyword_table.items(): # computer positive test sample, use the max score of list. score = max(score_list) if float(score) < threshold: num_false_reject += 1 num_false_alarm = 0 # transverse the all filler_table for key, score_list in filler_table.items(): i = 0 while i < len(score_list): if score_list[i] >= threshold: num_false_alarm += 1 i += 1 else: i += window_shift if len(keyword_table) != 0 : false_reject_rate = num_false_reject / len(keyword_table) num_false_alarm = max(num_false_alarm, 1e-6) if filler_duration != 0: false_alarm_per_hour = num_false_alarm / (filler_duration / 3600.0) fout.write('{:.6f} {:.6f} {:.6f}\n'.format(threshold, false_alarm_per_hour, false_reject_rate)) threshold += args.step