# SplitQA.py

from config import *
from Executors.conjunction import Conjunction
from Executors.simple_search import SimpleSearch
from Executors.composition import Composition


class SplitQA():
    def __init__(self):
        """Create the executors and load the split points for the evaluation set.

        Reads the split-points JSON and the matching ComplexWebQuestions JSON
        (both located through ``config``) and inner-joins the ``answers``
        column of the latter onto the split points by ``ID``. The joined
        frame is stored in ``self.split_points``.
        """
        self.Executors = [Composition(), Conjunction(), SimpleSearch()]

        ##################################
        # calculate split points
        split_points_path = config.split_points_dir + config.EVALUATION_SET + '.json'
        with open(split_points_path, 'r') as infile:
            self.split_points = pd.DataFrame(json.load(infile))

        ## Appending data from original complexwebquestions
        questions_path = (config.complexwebquestions_dir + 'ComplexWebQuestions_'
                          + config.EVALUATION_SET + '.json')
        with open(questions_path, 'r') as infile:
            complexwebquestions = pd.DataFrame(json.load(infile))

        self.split_points = self.split_points.merge(
            complexwebquestions[['answers', 'ID']], on='ID', how='inner')
        # If the split points already carried an 'answers' column, merge's
        # default suffixes name the incoming one 'answers_y'; rename it back.
        # When there was no clash this rename is a no-op.
        self.split_points.rename(columns={'answers_y': 'answers'}, inplace=True)

    def run_executors(self):
        """Run both executor waves over the split points and save the results.

        Steps:
          1. Collect the first-wave questions from every executor and print a
             warning for each one that is missing from the RC answer cache.
          2. Let every executor process the first-wave answers, then the
             second-wave answers, replacing ``self.split_points`` with the
             frame each executor returns.
          3. Write ``self.split_points`` to ``final_results_<EVALUATION_SET>``
             as both ``.csv`` and ``.json`` under ``config.data_dir``.
        """
        ##################################
        # generate webanswer first batch
        question_list = []
        for executor in self.Executors:
            question_list += executor.gen_webanswer_first_wave(self.split_points)

        # dropping duplicate questions; an empty list yields a frame with no
        # 'question' column to deduplicate on, so it is left as is
        if question_list:
            question_list = (pd.DataFrame(question_list)
                             .drop_duplicates(subset=['question'])
                             # 'records' is the full name of the orientation;
                             # abbreviations such as 'rows' are rejected by
                             # recent pandas releases
                             .to_dict(orient='records'))

        # Loading RC answers
        # --- Insert an alternative RC model here ---
        with open(config.rc_answer_cache_dir + config.EVALUATION_SET + '.json', 'r') as infile:
            webanswer_dict = json.load(infile)

        # used as dataframes in the executors..
        webanswer_dict = {key: pd.DataFrame(value) for key, value in webanswer_dict.items()}

        for question in question_list:
            if question['question'] not in webanswer_dict:
                print('Warning!!! RC cache is missing the following question: ' + question['question'])

        ##################################
        # run executors
        print('Running executors - first wave')
        for executor in self.Executors:
            print('Executor: ' + executor.name)
            exec_res = executor.proc_webanswer_wave_results(self.split_points, webanswer_dict)
            self.split_points = exec_res['split_points']

        print('Running executors - second wave (second stage of composition questions)')
        ##################################
        # run executors - second wave
        # (answers are looked up in the same cached webanswer_dict)
        for executor in self.Executors:
            print('Executor: ' + executor.name)
            exec_res = executor.proc_webanswer_second_wave_results(self.split_points, webanswer_dict)
            self.split_points = exec_res['split_points']

        results_path = config.data_dir + 'final_results' + '_' + config.EVALUATION_SET
        print('saving results in ' + results_path)

        self.split_points.to_csv(results_path + '.csv', encoding="utf-8", index=False)
        with open(results_path + '.json', 'w') as outfile:
            json.dump(self.split_points.to_dict(orient='records'), outfile)

    def gen_predictions_file(self):
        """Write one predicted answer per question to a JSON predictions file.

        For each row of ``self.split_points`` the highest RC confidence of
        the split strategy named by ``comp`` (conjunction, otherwise
        composition) is compared, after a constant bonus, with the highest
        SimpQA confidence; the first span of the winning strategy becomes the
        answer. When that span cannot be read (missing column, empty or
        non-indexable span list) the answer is the empty string.

        The list of ``{'ID', 'answer'}`` records is written to
        ``predictions_<EVALUATION_SET>.json`` under ``config.data_dir``.
        """
        def best_conf(confs):
            # -100 stands in for "this strategy produced no RC confidence"
            if confs is not None and len(confs) > 0:
                return max(confs)
            return -100

        predictions = []
        for _, q in self.split_points.iterrows():
            # constant bonuses favour the split strategies over SimpQA
            conjunction_rc_conf = best_conf(q['SplitQA_conjunction_rc_conf']) + 1.0
            composition_rc_conf = best_conf(q['SplitQA_composition_rc_conf']) + 2.0
            SimpQA_rc_conf = best_conf(q['SimpQA_rc_conf'])

            try:
                if q['comp'] == 'conjunction':
                    split_conf = conjunction_rc_conf
                    split_spans = 'SplitQA_conjunction_spans'
                else:
                    split_conf = composition_rc_conf
                    split_spans = 'SplitQA_composition_spans'

                if split_conf >= SimpQA_rc_conf:
                    answer = q[split_spans][0]
                else:
                    answer = q['SimpQA_spans'][0]
            except (KeyError, IndexError, TypeError):
                # No usable span for the chosen strategy: emit an empty
                # answer. Only lookup failures are handled here, so that
                # KeyboardInterrupt / SystemExit are no longer swallowed.
                answer = ''

            predictions.append({'ID': q['ID'], 'answer': answer})

        results_path = config.data_dir + 'predictions_' + config.EVALUATION_SET
        print('saving predictions file ' + results_path)
        with open(results_path + '.json', 'w') as outfile:
            json.dump(predictions, outfile, sort_keys=True, indent=4)

    def compute_final_results(self):
        comp = 0
        comp_count = 0
        conj = 0
        comj_count = 0
        SplitQA_P1_sum = 0
        SplitQA_oracle_P1_sum = 0
        SimpQA_P1_sum = 0
        only_comp_count = 0
        only_comp_count_right = 0
        only_search_count = 0
        only_search_count_right = 0
        we_chose_comp = 0
        we_chose_simp = 0
        both_count = 0
        for ind, q in self.split_points.iterrows():
            conjunction_rc_conf = -100
            composition_rc_conf = -100
            SimpQA_rc_conf = -100
            if q['SplitQA_conjunction_rc_conf'] is not None and len(q['SplitQA_conjunction_rc_conf']) > 0:
                conjunction_rc_conf = max(q['SplitQA_conjunction_rc_conf'])
            if q['SplitQA_composition_rc_conf'] is not None and len(q['SplitQA_composition_rc_conf']) > 0:
                composition_rc_conf = max(q['SplitQA_composition_rc_conf'])
            if q['SimpQA_rc_conf'] is not None and len(q['SimpQA_rc_conf']) > 0:
                SimpQA_rc_conf = max(q['SimpQA_rc_conf'])
        
            # constant normalization - (a bit ugly i know, will be learned in future work...)
            conjunction_rc_conf += 1.0
            composition_rc_conf += 2.0
        
            SimpQA_P1 = (q['SimpQA_MRR']==1)*100.0
            SplitQA_conj_P1 = (q['SplitQA_conjunction_MRR']==1)*100.0
            SplitQA_comp_P1 = (q['SplitQA_composition_MRR']==1)*100.0
        
            SimpQA_P1_sum += SimpQA_P1
        
            if q['comp'] == 'conjunction':
                if conjunction_rc_conf >= SimpQA_rc_conf:
                    we_chose_comp += 1
                    SplitQA_P1_sum += SplitQA_conj_P1
                else:
                    we_chose_simp += 1
                    SplitQA_P1_sum += SimpQA_P1
            else:
                if composition_rc_conf >= SimpQA_rc_conf:
                    we_chose_comp += 1
                    SplitQA_P1_sum += SplitQA_comp_P1
                else:
                    SplitQA_P1_sum += SimpQA_P1
                    we_chose_simp += 1
        
            SplitQA_oracle_P1_sum += max(SimpQA_P1, SplitQA_conj_P1, SplitQA_comp_P1)
        
            if (q['SimpQA_MRR'] == 1 and q['SplitQA_composition_MRR'] == 1) or \
                    (q['SimpQA_MRR'] == 1 and q['SplitQA_conjunction_MRR'] == 1):
                both_count += 1
        
            if q['comp'] == 'composition':
                if q['SimpQA_MRR'] < 1 and q['SplitQA_composition_MRR'] == 1:
                    if composition_rc_conf > SimpQA_rc_conf:
                        comp += 1
                        only_comp_count_right += 1
                    only_comp_count += 1
                    comp_count += 1
                if q['SimpQA_MRR'] == 1 and q['SplitQA_composition_MRR'] < 1:
                    if composition_rc_conf < SimpQA_rc_conf:
                        comp += 1
                        only_search_count_right += 1
                    only_search_count += 1
                    comp_count += 1
            else:
                if q['SimpQA_MRR'] < 1 and q['SplitQA_conjunction_MRR'] == 1:
                    if conjunction_rc_conf > SimpQA_rc_conf:
                        only_comp_count_right += 1
                        conj += 1
                    comj_count += 1
                    only_comp_count += 1
                if q['SimpQA_MRR'] == 1 and q['SplitQA_conjunction_MRR'] < 1:
                    if conjunction_rc_conf < SimpQA_rc_conf:
                        conj += 1
                        only_search_count_right += 1
                    only_search_count += 1
                    comj_count += 1
        
        print('SplitQA-composition RC conf accuracy: ' + str(float(comp) / comp_count))
        print('SplitQA-conjunction RC conf accuracy: ' + str(float(conj) / comj_count))
        print('number of only Compositionality : ' + str(only_comp_count))
        print('number of only Compositionality that we got right: ' + str(only_comp_count_right))
        print('number of only Search : ' + str(only_search_count))
        print('number of only Search that we got right: ' + str(only_search_count_right))
        print('number of both ( at same time): ' + str(both_count))
        print('compositionality portion: ' + str(float(we_chose_comp) / (we_chose_comp + we_chose_simp)))
        print('SimpQA: ' + str(float(SimpQA_P1_sum) / len(self.split_points)))
        print('SplitQA ' + str(float(SplitQA_P1_sum) / len(self.split_points)))
        print('SplitQAOracle ' + str(float(SplitQA_oracle_P1_sum) / len(self.split_points)))