tensorflow/examples/speech_commands/accuracy_utils.py - platform/external/tensorflow - Git at Google

 # Copyright 2019 The TensorFlow Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 # ==============================================================================
 ''' utils for getting accuracy statistics'''
 from __future__ import absolute_import
 from __future__ import division
 from __future__ import print_function

 import tensorflow as tf
 import numpy as np


 class StreamingAccuracyStats(object):
   """Get streaming accuracy statistics every time a new command is founded.

     Attributes:
       _how_many_gt: How many ground truths.
       _how_many_gt_matched: How many ground truths have been matched.
       _how_many_fp: How many commands have been fired as false positive.
       _how_many_c: How many commands have been fired correctly.
       _how_many_w: How many commands have been fired wrongly.
       _gt_occurence: A list to record which commands and when it occurs in the
         input audio stream.
       _previous_c: A variable to record the last status of _how_many_c.
       _previous_w: A variable to record the last status of _how_many_w.
       _previous_fp: A variable to record the last status of _how_many_fp.
       """

   def __init__(self):
     """Init StreamingAccuracyStats with void or zero values."""
     self._how_many_gt = 0
     self._how_many_gt_matched = 0
     self._how_many_fp = 0
     self._how_many_c = 0
     self._how_many_w = 0
     self._gt_occurence = []
     self._previous_c = 0
     self._previous_w = 0
     self._previous_fp = 0

   def read_ground_truth_file(self, file_name):
     """Load a list of 1.ground truth and 2.start timestamp pair and store it in
     time order."""
     with open(file_name, 'r') as f:
       for line in f:
         line_split = line.strip().split(',')
         if len(line_split) != 2:
           continue
         timestamp = round(float(line_split[1]))
         label = line_split[0]
         self._gt_occurence.append([label, timestamp])
     self._gt_occurence = sorted(self._gt_occurence,
                                           key=lambda item: item[1])

   def delta(self):
     """Compute delta of StreamingAccuracyStats against last status and get what
     the recognition state is this time"""
     fp_delta = self._how_many_fp - self._previous_fp
     w_delta = self._how_many_w - self._previous_w
     c_delta = self._how_many_c - self._previous_c
     if fp_delta == 1:
       recognition_state = "(False Positive)"
     elif c_delta == 1:
       recognition_state = "(Correct)"
     elif w_delta == 1:
       recognition_state = "(Wrong)"
     else:
       raise ValueError("Unexpected state in statistics")
     # Update the previous status
     self._previous_c = self._how_many_c
     self._previous_w = self._how_many_w
     self._previous_fp = self._how_many_fp
     return recognition_state

   def calculate_accuracy_stats(self, found_words, up_to_time_ms,
                                time_tolerance_ms):
     """Calculate accuracy statistics when a new commands is founded

     Given ground truth and corresponding predictions founded by
     model, figure out how many were correct. Take a tolerance time, so that only
     predictions up to a point in time are considered.

     Args:
         found_words: A list of all founded commands up to now.
         up_to_time_ms: End timestamp of this audio piece.
         time_tolerance_ms: The tolerance milliseconds before and after
           up_to_time_ms to match a ground truth.
     """
     if up_to_time_ms == -1:
       latest_possible_time = np.inf
     else:
       latest_possible_time = up_to_time_ms + time_tolerance_ms
     self._how_many_gt = 0
     for ground_truth in self._gt_occurence:
       ground_truth_time = ground_truth[1]
       if ground_truth_time > latest_possible_time:
         break
       self._how_many_gt += 1
     self._how_many_fp = 0
     self._how_many_c = 0
     self._how_many_w = 0
     has_gt_matched = []
     for found_word in found_words:
       found_label = found_word[0]
       found_time = found_word[1]
       earliest_time = found_time - time_tolerance_ms
       latest_time = found_time + time_tolerance_ms
       has_matched_been_found = False
       for ground_truth in self._gt_occurence:
         ground_truth_time = ground_truth[1]
         if (ground_truth_time > latest_time or ground_truth_time >
             latest_possible_time):
           break
         if ground_truth_time < earliest_time:
           continue
         ground_truth_label = ground_truth[0]
         if (ground_truth_label == found_label and has_gt_matched.count(
             ground_truth_time) == 0):
           self._how_many_c += 1
         else:
           self._how_many_w += 1
         has_gt_matched.append(ground_truth_time)
         has_matched_been_found = True
         break
       if not has_matched_been_found:
         self._how_many_fp += 1
     self._how_many_gt_matched = len(has_gt_matched)

   def print_accuracy_stats(self):
     """Write a human-readable description of the statistics to stdout."""
     if self._how_many_gt == 0:
       tf.logging.info('No ground truth yet, {}false positives'.format(
         self._how_many_fp))
     else:
       any_match_percentage = self._how_many_gt_matched / self._how_many_gt * 100
       correct_match_percentage = self._how_many_c / self._how_many_gt * 100
       wrong_match_percentage = self._how_many_w / self._how_many_gt * 100
       false_positive_percentage = self._how_many_fp / self._how_many_gt * 100
       tf.logging.info('{:.1f}% matched, {:.1f}% correct, {:.1f}% wrong, '
                    '{:.1f}% false positive'.format(any_match_percentage,
                                                    correct_match_percentage,
                                                    wrong_match_percentage,
                                                    false_positive_percentage))
	# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
	#
	# Licensed under the Apache License, Version 2.0 (the "License");
	# you may not use this file except in compliance with the License.
	# You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.
	# ==============================================================================
	''' utils for getting accuracy statistics'''
	from __future__ import absolute_import
	from __future__ import division
	from __future__ import print_function

	import tensorflow as tf
	import numpy as np


	class StreamingAccuracyStats(object):
	"""Get streaming accuracy statistics every time a new command is founded.

	Attributes:
	_how_many_gt: How many ground truths.
	_how_many_gt_matched: How many ground truths have been matched.
	_how_many_fp: How many commands have been fired as false positive.
	_how_many_c: How many commands have been fired correctly.
	_how_many_w: How many commands have been fired wrongly.
	_gt_occurence: A list to record which commands and when it occurs in the
	input audio stream.
	_previous_c: A variable to record the last status of _how_many_c.
	_previous_w: A variable to record the last status of _how_many_w.
	_previous_fp: A variable to record the last status of _how_many_fp.
	"""

	def __init__(self):
	"""Init StreamingAccuracyStats with void or zero values."""
	self._how_many_gt = 0
	self._how_many_gt_matched = 0
	self._how_many_fp = 0
	self._how_many_c = 0
	self._how_many_w = 0
	self._gt_occurence = []
	self._previous_c = 0
	self._previous_w = 0
	self._previous_fp = 0

	def read_ground_truth_file(self, file_name):
	"""Load a list of 1.ground truth and 2.start timestamp pair and store it in
	time order."""
	with open(file_name, 'r') as f:
	for line in f:
	line_split = line.strip().split(',')
	if len(line_split) != 2:
	continue
	timestamp = round(float(line_split[1]))
	label = line_split[0]
	self._gt_occurence.append([label, timestamp])
	self._gt_occurence = sorted(self._gt_occurence,
	key=lambda item: item[1])

	def delta(self):
	"""Compute delta of StreamingAccuracyStats against last status and get what
	the recognition state is this time"""
	fp_delta = self._how_many_fp - self._previous_fp
	w_delta = self._how_many_w - self._previous_w
	c_delta = self._how_many_c - self._previous_c
	if fp_delta == 1:
	recognition_state = "(False Positive)"
	elif c_delta == 1:
	recognition_state = "(Correct)"
	elif w_delta == 1:
	recognition_state = "(Wrong)"
	else:
	raise ValueError("Unexpected state in statistics")
	# Update the previous status
	self._previous_c = self._how_many_c
	self._previous_w = self._how_many_w
	self._previous_fp = self._how_many_fp
	return recognition_state

	def calculate_accuracy_stats(self, found_words, up_to_time_ms,
	time_tolerance_ms):
	"""Calculate accuracy statistics when a new commands is founded

	Given ground truth and corresponding predictions founded by
	model, figure out how many were correct. Take a tolerance time, so that only
	predictions up to a point in time are considered.

	Args:
	found_words: A list of all founded commands up to now.
	up_to_time_ms: End timestamp of this audio piece.
	time_tolerance_ms: The tolerance milliseconds before and after
	up_to_time_ms to match a ground truth.
	"""
	if up_to_time_ms == -1:
	latest_possible_time = np.inf
	else:
	latest_possible_time = up_to_time_ms + time_tolerance_ms
	self._how_many_gt = 0
	for ground_truth in self._gt_occurence:
	ground_truth_time = ground_truth[1]
	if ground_truth_time > latest_possible_time:
	break
	self._how_many_gt += 1
	self._how_many_fp = 0
	self._how_many_c = 0
	self._how_many_w = 0
	has_gt_matched = []
	for found_word in found_words:
	found_label = found_word[0]
	found_time = found_word[1]
	earliest_time = found_time - time_tolerance_ms
	latest_time = found_time + time_tolerance_ms
	has_matched_been_found = False
	for ground_truth in self._gt_occurence:
	ground_truth_time = ground_truth[1]
	if (ground_truth_time > latest_time or ground_truth_time >
	latest_possible_time):
	break
	if ground_truth_time < earliest_time:
	continue
	ground_truth_label = ground_truth[0]
	if (ground_truth_label == found_label and has_gt_matched.count(
	ground_truth_time) == 0):
	self._how_many_c += 1
	else:
	self._how_many_w += 1
	has_gt_matched.append(ground_truth_time)
	has_matched_been_found = True
	break
	if not has_matched_been_found:
	self._how_many_fp += 1
	self._how_many_gt_matched = len(has_gt_matched)

	def print_accuracy_stats(self):
	"""Write a human-readable description of the statistics to stdout."""
	if self._how_many_gt == 0:
	tf.logging.info('No ground truth yet, {}false positives'.format(
	self._how_many_fp))
	else:
	any_match_percentage = self._how_many_gt_matched / self._how_many_gt * 100
	correct_match_percentage = self._how_many_c / self._how_many_gt * 100
	wrong_match_percentage = self._how_many_w / self._how_many_gt * 100
	false_positive_percentage = self._how_many_fp / self._how_many_gt * 100
	tf.logging.info('{:.1f}% matched, {:.1f}% correct, {:.1f}% wrong, '
	'{:.1f}% false positive'.format(any_match_percentage,
	correct_match_percentage,
	wrong_match_percentage,
	false_positive_percentage))