From 7a2041d10afc1d2c92b09cd01b83d13606ddd8e6 Mon Sep 17 00:00:00 2001 From: Andrew Tavis Date: Wed, 12 Jan 2022 14:09:03 +0100 Subject: [PATCH] #95 update data update json totals and text differences --- Data/update_data.py | 33 +++++++++++++++++++++++++++++++++ Data/updated_data.txt | 6 ------ 2 files changed, 33 insertions(+), 6 deletions(-) delete mode 100644 Data/updated_data.txt diff --git a/Data/update_data.py b/Data/update_data.py index c4868fdb..c252a721 100644 --- a/Data/update_data.py +++ b/Data/update_data.py @@ -99,6 +99,8 @@ queries_to_run = list({q for sub in queries_to_run_lists for q in sub}) +data_added_dict = {} + for q in tqdm(queries_to_run[:1], desc="Data updated", unit="dirs",): target_type = q.split("/")[1] query_name = "query" + target_type.title() + ".sparql" @@ -132,3 +134,34 @@ ["python", f"./{q.split('/')[0]}/{q.split('/')[1]}/format_{q.split('/')[1]}"], shell=True, ) + + with open( + f"./../Keyboards/LanguageKeyboards/{q.split('/')[0]}/{q.split('/')[1]}.json" + ) as f: + new_keyboard_data = json.load(f) + + data_added_dict[q.split("/")[0]][q.split("/")[1]] = ( + len(new_keyboard_data) - current_data[q.split("/")[0]][q.split("/")[1]] + ) + + current_data[q.split("/")[0]][q.split("/")[1]] = len(new_keyboard_data) + +# Update total_data.json +with open("./total_data.json", "w", encoding="utf-8",) as f: + json.dump(current_data, f, ensure_ascii=False, indent=2) + +# Update data_updates.txt +data_added_string = """""" +for l in data_added_dict: + data_added_string += f"\n{l}" + for w in word_types: + if data_added_dict[l][w] == 0: + pass + elif data_added_dict[l][w] == 1: # remove the s for label + data_added_string += f"{data_added_dict[l][w]} {w[:-1]}," + else: + data_added_string += f"{data_added_dict[l][w]} {w}," + data_added_string = data_added_string[:-1] # remove the last comma + +with open("data_updates.txt", "w+") as f: + f.writelines(data_added_string) diff --git a/Data/updated_data.txt b/Data/updated_data.txt deleted file mode 100644 index fa3e0768..00000000 --- a/Data/updated_data.txt +++ /dev/null @@ -1,6 +0,0 @@ -- French (New): 15,710 nouns, 1,241 verbs (mostly infinitives), 67,609 translations -- German: 401 nouns, 78 verbs, corrected many prepositions -- Portuguese (New): 4,530 nouns, 188 verbs, 67,609 translations -- Russian (New): 194,389 nouns, 11 verbs, 12 prepositions, 67,609 translations -- Spanish: 180 nouns, 22 verbs -- Swedish (New): 41,102 nouns, 4,133 verbs, 67,609 translations