-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy path2023-05-01--norovirus.py
74 lines (66 loc) · 2.43 KB
/
2023-05-01--norovirus.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
group_I = 0
group_II = 0
group_IV = 0
group_IX = 0
group_I_II = 0
group_II_IV = 0
group_I_II_IX = 0
group_any = 0
with open("prevalence-data/cdc-nors-outbreak-data.tsv") as inf:
cols = None
for line in inf:
row = line.strip().split("\t")
if not cols:
cols = row
continue
etiologies = set(row[cols.index("Etiology")].split("; "))
etiologies = set(x.replace(" unknown", "").replace(" other", "")
for x in etiologies
if "Norovirus" in x)
if len(etiologies) > 1 and "Norovirus" in etiologies:
etiologies.remove("Norovirus")
genotype = row[cols.index("Serotype or Genotype")]
if not any("Norovirus" in etiology for etiology in etiologies):
continue
group_any += 1
if len(etiologies) == 1:
if list(etiologies) == ['Norovirus Genogroup I']:
group_I += 1
elif list(etiologies) == ['Norovirus Genogroup II']:
group_II += 1
elif list(etiologies) == ['Norovirus Genogroup IV']:
group_IV += 1
elif list(etiologies) == ['Norovirus Genogroup IX']:
group_IX += 1
elif list(etiologies) == ['Norovirus']:
pass
else:
raise Exception(etiologies)
elif len(etiologies) == 2:
if etiologies == set(('Norovirus Genogroup I',
'Norovirus Genogroup II')):
group_I_II += 1
elif etiologies == set(('Norovirus Genogroup II',
'Norovirus Genogroup IV')):
group_II_IV += 1
else:
raise Exception(etiologies)
elif len(etiologies) == 3:
if etiologies == set(('Norovirus Genogroup I',
'Norovirus Genogroup II',
'Norovirus Genogroup IX')):
group_I_II_IX += 1
else:
raise Exception(etiologies)
else:
raise Exception(etiologies)
#print ("%s\t%s" % (";".join(etiologies), genotype))
#print (etiologies)
print("I\t%s" % (group_I))
print("II\t%s" % (group_II))
print("IV\t%s" % (group_IV))
print("IX\t%s" % (group_IX))
print("I+II\t%s" % (group_I_II))
print("II+IV\t%s" % (group_II_IV))
print("I+II+IX\t%s" % (group_I_II_IX))
print(group_any)