release code base

2024-02-20 16:31:21 +01:00 · 2024-02-20 16:31:21 +01:00 · efbd43fed1
commit efbd43fed1
70 changed files with 4923 additions and 0 deletions
--- a/src/utils/dvd_codebase/data/analysis_utils.py
+++ b/src/utils/dvd_codebase/data/analysis_utils.py
@ -0,0 +1,282 @@
+"""
+Copyright (c) Facebook, Inc. and its affiliates.
+All rights reserved.
+This source code is licensed under the license found in the
+LICENSE file in the root directory of this source tree.
+"""
+
+import glob, json, pdb
+from tqdm import tqdm
+import pandas as pd
+import copy, os
+
+def get_question_type(template, prior_template):
+    last_node_type = template['nodes'][-1]['type']
+    text = template['text'][0].lower()
+    if 'same set of activities' in text: 
+        qtype = 'compare action set'
+    elif 'same sequence of activities' in text:
+        qtype = 'compare action sequence'
+    elif 'frequently' in text:
+        qtype = 'compare int'
+    elif 'how many times' in text:
+        qtype = 'action count'
+    elif 'how many' in text or 'what number' in text:
+        qtype = 'obj count'
+    elif 'is there' in text: 
+        qtype = 'obj exist'
+    elif 'what color' in text or 'what material' in text or 'what shape' in text or 'what size' in text:
+        qtype = 'attr query'
+    elif 'what type of action' in text or 'what is the' in text or 'what types of action' in text:
+        qtype = 'action query'
+    else:
+        assert 'what about' in text
+        qtype = get_question_type(prior_template, None)
+    return qtype
+
+def get_question_subtype(template, prior_template):
+    last_node_type = template['nodes'][-1]['type']
+    text = template['text'][0].lower()
+    if 'same set of activities' in text: 
+        if 'how many' in text:
+            qtype = 'compare action set (count)'
+        else:
+            qtype = 'compare action set (exist)'
+    elif 'same sequence of activities' in text:
+        if 'how many' in text:
+            qtype = 'compare action seq (count)'
+        else:
+            qtype = 'compare action seq (exist)'
+    elif 'frequently' in text:
+        if 'as frequently' in text:
+            qtype = 'compare int (equal)'
+        elif 'less frequently' in text:
+            qtype = 'compare int (less)'
+        elif 'more frequently' in text:
+            qtype = 'compare int (more)'
+    elif 'how many times' in text:
+        qtype = 'action count'
+    elif 'how many' in text or 'what number' in text:
+        qtype = 'obj count'
+    elif 'is there' in text: 
+        qtype = 'obj exist'
+    elif 'what color' in text or 'what about its color' in text: 
+        qtype = 'attr query (color)'
+    elif 'what material' in text or 'what about its material'in text: 
+        qtype = 'attr query (material)'
+    elif 'what shape' in text or 'what about its shape' in text: 
+        qtype = 'attr query (shape)'
+    elif 'what size' in text or 'what about its size' in text: 
+        qtype = 'attr query (size)'
+    elif 'what type of action' in text or 'what is the' in text or 'what types of action' in text:
+        if '<o>' in text:
+            qtype = 'action query (by order)'
+        elif '<f>' in text:
+            qtype = 'ation query (by freq)'
+        else:
+            qtype = 'action query (all actions)'
+    else:
+        assert 'what about' in text
+        assert 'color' not in text and 'size' not in text and \
+                'shape' not in text and 'material' not in text
+        qtype = get_question_subtype(prior_template, None)
+    return qtype
+
+def get_question_complexity(turn, template_fn):
+    template = turn['template']
+    interval_type = template['interval_type']
+    last_node_type = template['nodes'][-1]['type']
+    second_last_node_type = template['nodes'][-2]['type']
+
+    if interval_type == 'none': 
+        return 'none'
+    elif interval_type == 'atomic': 
+        if 'one_hop' in template_fn:
+            return 'atomic (spatial)'
+        else:
+            return 'atomic (non-spatial)'
+        #return 'atomic'
+    elif interval_type == 'compositional':
+        return 'compositional'
+
+def get_accuracies_by_type(all_types, models, all_answers, all_results, output_file):
+    types = sorted(set(all_types))
+    accuracies = {} 
+    for t in types:
+        accuracies[t] = []
+        for model in models:
+            nb_corrects = 0 
+            count = 0
+            results = all_results[model]
+            for a_idx, a in enumerate(all_answers):
+                curr_type = all_types[a_idx]
+                if curr_type != t: continue
+                pred = results[a_idx]
+                if str(pred) == str(a):
+                    nb_corrects += 1 
+                count += 1 
+            acc = nb_corrects/count 
+            accuracies[t].append(acc)  
+    df = copy.deepcopy(accuracies)
+    df['model'] = models
+    df = pd.DataFrame(data=df, columns=['model'] + list(accuracies.keys()))
+    df.to_csv(output_file)
+    return types, accuracies, df
+
+def get_transfer_accuracies(all_types, models, all_answers, all_results, output_file, is_video_update=False, is_all=False): 
+    accuracies = []
+    for model in models:
+        results = all_results[model]
+        nb_corrects = 0 
+        count = 0 
+        for a_idx, a in enumerate(all_answers):
+            if is_all:
+                is_single_turn = True
+                for k,v in all_types.items():
+                    if v[a_idx] != 'none':
+                        is_single_turn = False 
+                        break
+                if is_single_turn: continue 
+            else:
+                curr_type = all_types[a_idx]
+                if is_video_update:
+                    if curr_type != 'video_update': continue
+                else:
+                    if curr_type != 'yes': continue
+            prior_pred_a = results[a_idx-1]
+            prior_gt_a = all_answers[a_idx-1]
+            if str(prior_pred_a) != str(prior_gt_a): continue  
+            pred_a = results[a_idx]
+            gt_a = all_answers[a_idx]
+            if str(pred_a) == str(gt_a):
+                nb_corrects += 1 
+            count += 1 
+        if count == 0:
+            acc = 0
+        else:
+            #pdb.set_trace()
+            acc = nb_corrects/count 
+        accuracies.append(acc)
+    df = {}
+    df['accuracies'] = accuracies
+    df['model'] = models
+    df = pd.DataFrame(data=df, columns=['model', 'accuracies'])
+    df.to_csv(output_file)
+    return df 
+
+def get_start_end_time(period):
+    start, end = period
+    if start is None:
+        start = 0
+    else:
+        start = start[-1]
+    if end is None:
+        end = 301
+    else:
+        end = end[-1]
+    return start, end 
+
+def get_period_size(period):
+    if period is None:
+        return 0
+    start, end = get_start_end_time(period)
+    return end - start
+
+def get_overlap_period(curr_period, last_period, ratio=False):
+    if curr_period is None:
+        return -1 
+    if last_period is None:
+        return 0 
+    s1, e1 = get_start_end_time(curr_period)
+    s2, e2 = get_start_end_time(last_period)
+    if s2<e1 and s1<e2:
+        if ratio:
+            return get_period_ratio_bin((min(e1,e2)-max(s1,s2))/(e2-s2))
+        else:
+            return (min(e1,e2)-max(s1,s2))
+    else:
+        return 0 
+
+def get_period_distance(curr_period, last_period, point='start'):
+    if curr_period is None:
+        return -1 
+    if last_period is None: 
+        return -1 
+    s1, e1 = get_start_end_time(curr_period)
+    s2, e2 = get_start_end_time(last_period)
+    if point == 'start': 
+        return abs(s1-s2)
+    elif point == 'end':
+        return abs(e1-e2) 
+
+def get_period_ratio_bin(ratio):
+    if ratio == 0:
+        return 0
+    for n in range(0,10):
+        if ratio*10>n:
+            bin = n
+        else:
+            break
+    return bin 
+
+def get_obj_turn_dist(used_objects, dependencies, template, turn_idx):
+    all_dists = [0]
+    
+    if dependencies['object'] != 'none':
+        if dependencies['object'] == 'earlier_unique':
+            obj_id = str(template['earlier_unique_obj'])
+            if obj_id not in used_objects:
+                pdb.set_trace()
+            turn_dist = turn_idx - used_objects[obj_id]['original_turn'] + 1
+            all_dists.append(turn_dist)
+        
+    if dependencies['temporal'] != 'none':
+        if 'earlier_unique' in dependencies['temporal']:
+            obj_id = str(template['temporal_obj_id'])
+            if obj_id not in used_objects:
+                pdb.set_trace()
+            turn_dist = turn_idx - used_objects[obj_id]['original_turn'] + 1
+            all_dists.append(turn_dist)
+        
+    return max(all_dists)
+
+def get_stats(dials):
+    videos = set()
+    questions = set()
+    for dial in dials: 
+        for turn in dial:
+            question = turn['question']
+            video = '{}-{}'.format(turn['split'], turn['image_filename'])
+            videos.add(video)
+            questions.add(question)
+    print('# videos: {}'.format(len(videos)))
+    print("# dialogues: {}".format(len(dials)))
+    print("# unique questions: {}".format(len(questions)))
+    output = {
+        '#videos': len(videos),
+        '#dialogues': len(dials),
+        '#unique questions': len(questions)
+    }
+    return output 
+
+def find_video_end_range(end_time):
+    ranges = [0, 30, 60, 90, 120, 150, 180, 210, 240, 270]
+    if end_time is None: 
+        return 9
+    for idx, r in enumerate(ranges):
+        if end_time[-1] > r:
+            curr_r = idx 
+        else:
+            return curr_r
+    return 9
+
+def find_video_start_range(start_time):
+    ranges = [400, 270, 240, 210, 180, 150, 120, 90, 60, 30]
+    if start_time is None: 
+        return 0
+    for idx, r in enumerate(ranges):
+        if start_time[-1] <= r:
+            curr_r = 9-idx 
+        else:
+            return curr_r
+    return 0