From 1a129d9cc5c62f04dafe5ad532825c18951bdbb3 Mon Sep 17 00:00:00 2001 From: Peter van Lunteren Date: Sun, 23 Jun 2024 12:14:12 +0200 Subject: [PATCH] added smoothing feature --- classification_utils/inference_lib.py | 608 ++++++++------------------ 1 file changed, 175 insertions(+), 433 deletions(-) diff --git a/classification_utils/inference_lib.py b/classification_utils/inference_lib.py index fbe73c3e..b9c2dadb 100755 --- a/classification_utils/inference_lib.py +++ b/classification_utils/inference_lib.py @@ -1,16 +1,21 @@ # library of inference functions to be used for classifying MD crops # Created by Peter van Lunteren -# Latest edit by Peter van Lunteren on 6 Jun 2024 +# Latest edit by Peter van Lunteren on 23 Jun 2024 -# # import packages -import json +# import packages +import io import os +import json +import datetime +import contextlib from tqdm import tqdm from PIL import Image -from collections import defaultdict -from cameratraps.megadetector.detection.video_utils import frame_results_to_video_results -from cameratraps.megadetector.utils.ct_utils import is_list_sorted +from collections import defaultdict from EcoAssist.smooth_params import * +from megadetector.data_management import read_exif +from megadetector.data_management import cct_json_utils +from megadetector.data_management.read_exif import parse_exif_datetime_string +from cameratraps.megadetector.detection.video_utils import frame_results_to_video_results # MAIN FUNCTION different workflow for videos than for images def classify_MD_json(json_path, @@ -45,9 +50,9 @@ def classify_MD_json(json_path, # convert frame results to video results frame_results_to_video_results(input_file = frame_level_json, - output_file = video_level_json) + output_file = video_level_json) frame_results_to_video_results(input_file = frame_level_json_original, - output_file = video_level_json_original) + output_file = video_level_json_original) # remove unnecessary jsons if os.path.isfile(frame_level_json_original): @@ 
-171,7 +176,7 @@ def convert_detections_to_classification(json_path, # update prgressbar pbar.update(1) - # # write unaltered json for timelapse + # write unaltered json for timelapse json_path_unaltered = os.path.splitext(json_path)[0] + "_original" + os.path.splitext(json_path)[1] data['classification_categories'] = {v: k for k, v in inverted_cls_label_map.items()} data['forbidden_classes'] = forbidden_classes @@ -180,10 +185,18 @@ def convert_detections_to_classification(json_path, # smooth results if user specified json_to_rewrite = json_path_unaltered - if smooth_bool and json_path.endswith("image_recognition_file.json"): - json_path_smooth = os.path.splitext(json_path)[0] + "_smooth" + os.path.splitext(json_path)[1] - smooth_json(json_path_unaltered, json_path_smooth) - json_to_rewrite = json_path_smooth + if smooth_bool: + print("smoothing") + + # image metadata will be read and sequences will be formed + if json_path.endswith("image_recognition_file.json"): + smooth_json_imgs(json_path_unaltered) + json_to_rewrite = os.path.splitext(json_path)[0] + "_original" + os.path.splitext(json_path)[1] + + # for videos it is a bit easier as we already know the sequences + # we just need average all predictions per video in the frames.json + if json_path.endswith("video_recognition_file.frames.json"): + smooth_json_video(json_path) # rewrite json to be used by EcoAssist with open(json_to_rewrite) as image_recognition_file_content: @@ -223,208 +236,39 @@ def convert_detections_to_classification(json_path, with open(json_path, "w") as json_file: json.dump(data, json_file, indent=1) -# check other predictions whitin an image or sequence and smooth results to minimise prediction errors -# Thanks Dan Morris (https://github.com/agentmorris/MegaDetector/blob/main/api/batch_processing/data_preparation/manage_local_batch.py) -def smooth_json(json_input_fpath, json_output_fpath): +# average predictions over multiple detections in images +# based on code written by Dan Morris' 
MegaDetector in /data_preparation/manage_local_batch.py +def smooth_json_imgs(json_input_fpath): + # init vars filename_base = os.path.normpath(os.path.dirname(json_input_fpath)) - classification_detection_files = [json_input_fpath] - overflow_folder_handling_enabled = False - - # check if user assigned other and non-other categories - global other_category_names - global non_other_category_names - other_category_names_assigned = False - non_other_category_names_assigned = False - if 'other_category_names' in vars() or 'other_category_names' in globals(): - other_category_names_assigned = True - if 'non_other_category_names' in vars() or 'non_other_category_names' in globals(): - non_other_category_names_assigned = True - - # if user has not assigned values to other_category_names and non_other_category_names themselves, we'll try to - # automatically distille the other category - if other_category_names_assigned == False or non_other_category_names_assigned == False: - with open(json_input_fpath,'r') as f: - d = json.load(f) - categories = list(d['classification_categories'].values()) - if 'other' not in categories: - other_category_names = [] - non_other_category_names = categories - print(f"Warning: category 'other' not present in json file. The variables other_category_names" - " and non_other_category_names also not assigned in EcoAssist\smooth_params.py. 
Will not" - " perform 'other'-smoothing, but will proceed with classification and sequence smoothing" - " as usual.") - else: - other_category_names = ['other'] - categories.remove('other') - non_other_category_names = categories - - smoothed_classification_files = [] - for final_output_path in classification_detection_files: - classifier_output_path = final_output_path - classifier_output_path_within_image_smoothing = classifier_output_path.replace( - '.json','_within_image_smoothing.json') - with open(classifier_output_path,'r') as f: - d = json.load(f) - category_name_to_id = {d['classification_categories'][k]:k for k in d['classification_categories']} - other_category_ids = [] - for s in other_category_names: - if s in category_name_to_id: - other_category_ids.append(category_name_to_id[s]) - else: - print('Warning: "other" category {} not present in file {}'.format( - s,classifier_output_path)) - n_other_classifications_changed = 0 - n_other_images_changed = 0 - n_detections_flipped = 0 - n_images_changed = 0 - - # Before we do anything else, get rid of everything but the top classification for each detection. 
- for im in d['images']: - if 'detections' not in im or im['detections'] is None or len(im['detections']) == 0: - continue - detections = im['detections'] - for det in detections: - if 'classifications' not in det or len(det['classifications']) == 0: - continue - classification_confidence_values = [c[1] for c in det['classifications']] - assert is_list_sorted(classification_confidence_values,reverse=True) - det['classifications'] = [det['classifications'][0]] - # ...for each detection in this image - # ...for each image - - for im in tqdm(d['images']): - if 'detections' not in im or im['detections'] is None or len(im['detections']) == 0: - continue - detections = im['detections'] - category_to_count = defaultdict(int) - for det in detections: - if ('classifications' in det) and (det['conf'] >= detection_confidence_threshold): - for c in det['classifications']: - if c[1] >= classification_confidence_threshold: - category_to_count[c[0]] += 1 - # ...for each classification - # ...if there are classifications for this detection - # ...for each detection - - if len(category_to_count) <= 1: - continue - category_to_count = {k: v for k, v in sorted(category_to_count.items(), - key=lambda item: item[1], - reverse=True)} - keys = list(category_to_count.keys()) - - # Handle a quirky special case: if the most common category is "other" and - # it's "tied" with the second-most-common category, swap them - if (len(keys) > 1) and \ - (keys[0] in other_category_ids) and \ - (keys[1] not in other_category_ids) and \ - (category_to_count[keys[0]] == category_to_count[keys[1]]): - keys[1], keys[0] = keys[0], keys[1] - - max_count = category_to_count[keys[0]] - # secondary_count = category_to_count[keys[1]] - # The 'secondary count' is the most common non-other class - secondary_count = 0 - for i_key in range(1,len(keys)): - if keys[i_key] not in other_category_ids: - secondary_count = category_to_count[keys[i_key]] - break - most_common_category = keys[0] - assert max_count >= 
secondary_count - - # If we have at least *min_detections_to_overwrite_other* in a category that isn't - # "other", change all "other" classifications to that category - if max_count >= min_detections_to_overwrite_other and \ - most_common_category not in other_category_ids: - other_change_made = False - for det in detections: - if ('classifications' in det) and (det['conf'] >= detection_overwrite_threshold): - for c in det['classifications']: - if c[1] >= classification_overwrite_threshold and \ - c[0] in other_category_ids: - n_other_classifications_changed += 1 - other_change_made = True - c[0] = most_common_category - # ...for each classification - # ...if there are classifications for this detection - # ...for each detection - - if other_change_made: - n_other_images_changed += 1 - # ...if we should overwrite all "other" classifications - - if max_count < min_detections_above_threshold: - continue - if secondary_count >= max_detections_secondary_class: - continue - - # At this point, we know we have a dominant category; change all other above-threshold - # classifications to that category. That category may have been "other", in which - # case we may have already made the relevant changes. 
- n_detections_flipped_this_image = 0 - for det in detections: - if ('classifications' in det) and (det['conf'] >= detection_overwrite_threshold): - for c in det['classifications']: - if c[1] >= classification_overwrite_threshold and \ - c[0] != most_common_category: - c[0] = most_common_category - n_detections_flipped += 1 - n_detections_flipped_this_image += 1 - # ...for each classification - # ...if there are classifications for this detection - # ...for each detection - - if n_detections_flipped_this_image > 0: - n_images_changed += 1 - # ...for each image - - print('Classification smoothing: changed {} detections on {} images'.format( - n_detections_flipped,n_images_changed)) - print('"Other" smoothing: changed {} detections on {} images'.format( - n_other_classifications_changed,n_other_images_changed)) - with open(classifier_output_path_within_image_smoothing,'w') as f: - json.dump(d,f,indent=1) - print('Wrote results to:\n{}'.format(classifier_output_path_within_image_smoothing)) - smoothed_classification_files.append(classifier_output_path_within_image_smoothing) - # ...for each file we want to smooth - - #% Read EXIF data from all images - from data_management import read_exif + + # read EXIF data from all images exif_options = read_exif.ReadExifOptions() exif_options.verbose = False - # exif_options.n_workers = default_workers_for_parallel_tasks - # exif_options.use_threads = parallelization_defaults_to_threads exif_options.processing_library = 'pil' exif_options.byte_handling = 'delete' exif_results_file = os.path.join(filename_base,'exif_data.json') if os.path.isfile(exif_results_file): - print('Reading EXIF results from {}'.format(exif_results_file)) with open(exif_results_file,'r') as f: exif_results = json.load(f) - else: + else: exif_results = read_exif.read_exif_from_folder(filename_base, - output_file=exif_results_file, - options=exif_options) + output_file=exif_results_file, + options=exif_options) - #% Prepare COCO-camera-traps-compatible image 
objects for EXIF results - import datetime - from data_management.read_exif import parse_exif_datetime_string - min_valid_timestamp_year = 2000 + # prepare COCO-camera-traps-compatible image objects for EXIF results + min_valid_timestamp_year = 1990 now = datetime.datetime.now() image_info = [] images_without_datetime = [] images_with_invalid_datetime = [] exif_datetime_tag = 'DateTimeOriginal' - for exif_result in tqdm(exif_results): - im = {} - - # By default we assume that each leaf-node folder is a location - if overflow_folder_handling_enabled: - im['location'] = relative_path_to_location(os.path.dirname(exif_result['file_name'])) - else: - im['location'] = os.path.dirname(exif_result['file_name']) + for exif_result in exif_results: + # collect info + im = {} + im['location'] = os.path.dirname(exif_result['file_name']) im['file_name'] = exif_result['file_name'] im['id'] = im['file_name'] if ('exif_tags' not in exif_result) or (exif_result['exif_tags'] is None) or \ @@ -439,16 +283,16 @@ def smooth_json(json_input_fpath, json_output_fpath): else: dt = exif_dt - # An image from the future (or within the last hour) is invalid + # an image from the future (or within the last hour) is invalid if (now - dt).total_seconds() <= 1*60*60: - print('Warning: datetime for {} is {}'.format( - im['file_name'],dt)) + print('Warning: an image from the future (or within the last hour) is invalid - datetime for {} is {}'.format( + im['file_name'], dt)) im['datetime'] = None images_with_invalid_datetime.append(im['file_name']) - # An image from before the dawn of time is also invalid + # an image from before the dawn of time is also invalid elif dt.year < min_valid_timestamp_year: - print('Warning: datetime for {} is {}'.format( + print('Warning: an image from before the dawn of time is also invalid - datetime for {} is {}'.format( im['file_name'],dt)) im['datetime'] = None images_with_invalid_datetime.append(im['file_name']) @@ -456,260 +300,158 @@ def 
smooth_json(json_input_fpath, json_output_fpath): else: im['datetime'] = dt image_info.append(im) - # ...for each exif image result - print('Parsed EXIF datetime information, unable to parse EXIF data from {} of {} images'.format( - len(images_without_datetime),len(exif_results))) + # assemble into sequences + dummy_stream = io.StringIO() + with contextlib.redirect_stdout(dummy_stream): + cct_json_utils.create_sequences(image_info) - #% Assemble into sequences - from data_management import cct_json_utils - print('Assembling images into sequences') - cct_json_utils.create_sequences(image_info) - - # Make a list of images appearing at each location + # make a list of images appearing at each location sequence_to_images = defaultdict(list) - for im in tqdm(image_info): + for im in image_info: sequence_to_images[im['seq_id']].append(im) all_sequences = list(sorted(sequence_to_images.keys())) - #% Load classification results - sequence_level_smoothing_input_file = smoothed_classification_files[0] + # write to file + sequence_level_smoothing_input_file = json_input_fpath with open(sequence_level_smoothing_input_file,'r') as f: d = json.load(f) - # Map each filename to classification results for that file + # map each filename to classification results for that file filename_to_results = {} - for im in tqdm(d['images']): + for im in d['images']: filename_to_results[im['file'].replace('\\','/')] = im - - #% Smooth classification results over sequences (prep) - classification_category_id_to_name = d['classification_categories'] - classification_category_name_to_id = {v: k for k, v in classification_category_id_to_name.items()} - class_names = list(classification_category_id_to_name.values()) - animal_detection_category = '1' - assert(d['detection_categories'][animal_detection_category] == 'animal') - other_category_ids = set([classification_category_name_to_id[s] for s in other_category_names]) - - # These are the only classes to which we're going to switch other 
classifications - category_names_to_smooth_to = set(non_other_category_names) - category_ids_to_smooth_to = set([classification_category_name_to_id[s] for s in category_names_to_smooth_to]) - assert all([s in class_names for s in category_names_to_smooth_to]) - #% Smooth classification results over sequences (supporting functions) - def results_for_sequence(images_this_sequence): - """ - Fetch MD results for every image in this sequence, based on the 'file_name' field - """ - results_this_sequence = [] - for im in images_this_sequence: - fn = im['file_name'] - results_this_image = filename_to_results[fn] - assert isinstance(results_this_image,dict) - results_this_sequence.append(results_this_image) - return results_this_sequence - - def top_classifications_for_sequence(images_this_sequence): - """ - Return all top-1 animal classifications for every detection in this - sequence, regardless of confidence - - May modify [images_this_sequence] (removing non-top-1 classifications) - """ + # link the classifications to each image of the sequence + def fetch_classifications_for_sequence(images_this_sequence): classifications_this_sequence = [] for im in images_this_sequence: fn = im['file_name'] - results_this_image = filename_to_results[fn] - if 'detections' in results_this_image: - if results_this_image['detections'] is None: - continue - else: + results_this_image = filename_to_results.get(fn, {}) + detections = results_this_image.get('detections') + if not detections: continue - for det in results_this_image['detections']: - - # Only process animal detections - if det['category'] != animal_detection_category: - continue - - # Only process detections with classification information - if 'classifications' not in det: - continue - - # We only care about top-1 classifications, remove everything else - if len(det['classifications']) > 1: - - # Make sure the list of classifications is already sorted by confidence - classification_confidence_values = [c[1] for c in 
det['classifications']] - assert is_list_sorted(classification_confidence_values,reverse=True) - - # ...and just keep the first one - det['classifications'] = [det['classifications'][0]] - - # Confidence values should be sorted within a detection; verify this, and ignore - top_classification = det['classifications'][0] - classifications_this_sequence.append(top_classification) - # ...for each detection in this image - # ...for each image in this sequence + for det in detections: + if det.get('category') == '1' and 'classifications' in det: + classifications_this_sequence.append(det['classifications']) return classifications_this_sequence - # ...top_classifications_for_sequence() - - def count_above_threshold_classifications(classifications_this_sequence): - """ - Given a list of classification objects (tuples), return a dict mapping - category IDs to the count of above-threshold classifications. - - This dict's keys will be sorted in descending order by frequency. - """ - - # Count above-threshold classifications in this sequence - category_to_count = defaultdict(int) - for c in classifications_this_sequence: - if c[1] >= classification_confidence_threshold: - category_to_count[c[0]] += 1 - - # Sort the dictionary in descending order by count - category_to_count = {k: v for k, v in sorted(category_to_count.items(), - key=lambda item: item[1], - reverse=True)} - - keys_sorted_by_frequency = list(category_to_count.keys()) - - # Handle a quirky special case: if the most common category is "other" and - # it's "tied" with the second-most-common category, swap them. 
- if len(other_category_names) > 0: - if (len(keys_sorted_by_frequency) > 1) and \ - (keys_sorted_by_frequency[0] in other_category_names) and \ - (keys_sorted_by_frequency[1] not in other_category_names) and \ - (category_to_count[keys_sorted_by_frequency[0]] == \ - category_to_count[keys_sorted_by_frequency[1]]): - keys_sorted_by_frequency[1], keys_sorted_by_frequency[0] = \ - keys_sorted_by_frequency[0], keys_sorted_by_frequency[1] - sorted_category_to_count = {} - for k in keys_sorted_by_frequency: - sorted_category_to_count[k] = category_to_count[k] - return sorted_category_to_count - # ...def count_above_threshold_classifications() - - def sort_images_by_time(images): - """ - Returns a copy of [images], sorted by the 'datetime' field (ascending). - """ - return sorted(images, key = lambda im: im['datetime']) - - def get_first_key_from_sorted_dictionary(di): - if len(di) == 0: - return None - return next(iter(di.items()))[0] - - def get_first_value_from_sorted_dictionary(di): - if len(di) == 0: - return None - return next(iter(di.items()))[1] - - #% Smooth classifications at the sequence level (main loop) - n_other_flips = 0 - n_classification_flips = 0 - n_unclassified_flips = 0 - - # Break if this token is contained in a filename (set to None for normal operation) - debug_fn = None - for i_sequence,seq_id in tqdm(enumerate(all_sequences),total=len(all_sequences)): + # group and smooth averages for all detections in a sequence + for _, seq_id in tqdm(enumerate(all_sequences),total=len(all_sequences)): images_this_sequence = sequence_to_images[seq_id] + + # link the classifications to the images of the sequence + classifications_this_sequence = fetch_classifications_for_sequence(images_this_sequence) - # Count top-1 classifications in this sequence (regardless of confidence) - classifications_this_sequence = top_classifications_for_sequence(images_this_sequence) - - # Handy debugging code for looking at the numbers for a particular sequence + # group all 
# for videos we don't need to read exif data because we will average the results per video
def smooth_json_video(json_path):
    """Smooth classification results per video.

    Reads the frame-level results json that sits next to *json_path*
    ("video_recognition_file.frames_original.json"), averages the
    classification confidences per class over all frames of each video,
    keeps only the highest-scoring class per video, writes the smoothed
    results back to the same frames file, and removes unclassified animal
    detections for videos that do have classified frames.

    Args:
        json_path: path to the video-level recognition json; only its
            directory is used to locate the frames json.
    """

    # locate the frame-level results file that accompanies json_path
    json_path_frames = os.path.join(os.path.dirname(json_path),
                                    "video_recognition_file.frames_original.json")

    # gather all classification confidences per class and per video:
    # videos_dict maps video dirname -> {category_id: [conf, conf, ...]}
    videos_dict = defaultdict(dict)
    with open(json_path_frames, "r") as json_file:
        d = json.load(json_file)
    for im in d['images']:
        video_fn = os.path.dirname(im['file'])
        # 'detections' may be absent or None (MD convention for failures)
        for det in im.get('detections') or []:
            for cat_idx, conf in det.get('classifications', []):
                videos_dict[video_fn].setdefault(cat_idx, []).append(conf)

    # average the confidences per class and keep only the highest-scoring
    # class per video
    smoothed_confs_dict = {}
    for video, aggregated_confs in videos_dict.items():
        averaged = [[cat_idx, round(sum(confs) / len(confs), 5)]
                    for cat_idx, confs in aggregated_confs.items()]
        # aggregated_confs is never empty here (an entry is only created when
        # a classification is seen), so 'averaged' has at least one item and
        # the top class is always well-defined — no stale/undefined fallback
        smoothed_confs_dict[video] = [sorted(averaged, key=lambda x: x[1], reverse=True)[0]]

    # loop through the json one last time to replace the classifications and
    # remove unidentified animals
    for im in d['images']:
        video_fn = os.path.dirname(im['file'])
        if 'detections' not in im:
            continue
        new_detections = []
        for det in im['detections'] or []:
            if det['category'] == '1':
                if 'classifications' in det:
                    # because we select the best frame based on confidence, we
                    # want the frame with the clearest animal (i.e., the highest
                    # detection confidence) to have a slightly better confidence
                    # than the other frames; therefore we take the weighted
                    # average of the two confidence scores
                    top_cat, top_conf = smoothed_confs_dict[video_fn][0]
                    ave_conf = round(((top_conf * 29) + det['conf']) / 30, 5)
                    det['classifications'] = [[top_cat, ave_conf]]
                    new_detections.append(det)
                elif video_fn in smoothed_confs_dict:
                    # unidentified animal in a video that also has frames good
                    # enough for a classification: skip it, the classified
                    # frames are better
                    continue
                else:
                    # unidentified animal without any frame that is good enough
                    # for a classification: keep it
                    new_detections.append(det)
            else:
                # persons and vehicles are kept untouched
                new_detections.append(det)

        # replace with the filtered detections
        im['detections'] = new_detections

    # write smoothed classification results back to the frames file
    with open(json_path_frames, 'w') as f:
        json.dump(d, f, indent=1)