-
Notifications
You must be signed in to change notification settings - Fork 1
/
go-process-participants.py
87 lines (78 loc) · 2.8 KB
/
go-process-participants.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
import pronto, six, csv
from sys import *
# Build the ChEBI -> item-id lookup from the tab-separated file 'chebi.tab'.
# Every row is read through its 'item' column (a URL-like string whose last
# '/'-separated segment is kept) and its 'ch' column (appended to 'CHEBI:').
qs = {}       # 'CHEBI:<ch>' -> item id taken from the first row seen for it
dups = set()  # 'CHEBI:<ch>' ids that occurred on more than one row

# The context manager closes the file as soon as it has been consumed; the
# original handed an anonymous open() result to the reader and never closed it.
with open('chebi.tab', 'r') as chebi_file:
    reader = csv.DictReader(chebi_file, delimiter='\t')
    for item in reader:
        iturl = item.get('item')
        # Keep only what follows the last '/' (the whole string if none).
        qit = iturl.rsplit('/', 1)[-1]
        chid = 'CHEBI:' + item.get('ch')
        if chid in qs:
            # Ambiguous mapping: record it and keep the first item id.
            dups.add(chid)
        else:
            qs[chid] = qit
# Build the GO-id -> item-id lookup from the tab-separated file 'goid.tab'.
# Every row is read through its 'goid' column (used as the key) and its
# 'item' column (a URL-like string whose last '/'-separated segment is kept).
efs = {}  # GO id -> item id taken from the first row seen for that GO id

# The context manager closes the file as soon as it has been consumed; the
# original handed an anonymous open() result to the reader and never closed it.
with open('goid.tab', 'r') as goid_file:
    reader = csv.DictReader(goid_file, delimiter='\t')
    for item in reader:
        go = item.get('goid')
        iturl = item.get('item')
        # Keep only what follows the last '/' (the whole string if none).
        it = iturl.rsplit('/', 1)[-1]
        if go in efs:
            # A GO id listed more than once: report it on stdout and keep
            # the mapping from the first row.
            print('============= {}'.format(go))
        else:
            efs[go] = it
# NOTE(review): neither `ignore` nor `secondary` is referenced by the rest of
# the visible script. The values look like bare ChEBI numbers, and `secondary`
# presumably maps a secondary id to its primary id -- confirm before relying
# on either. '425228' appears both in `ignore` and as a key of `secondary`.
ignore = {'425228', '144646', '27941'}

# The original literal listed the keys '3736' and '578003' twice (with
# identical values); the repeats are dropped, the resulting dict is the same.
secondary = {
    '365419': '64090',
    '12800': '46570',
    '24036': '72010',
    '425228': '29484',
    '578003': '65172',
    '22318': '134249',
    '30410': '42121',
    '3736': '48947',
    '593038': '49537',
    '198346': '41688',
    '22473': '32988',
    '3669': '16822',
    '23008': '16646',
}

# Relation names of interest (previously kept as a bare string literal, which
# is an executed no-op statement rather than a comment):
#   has_input
#   has_intermediate
#   has_output
#   has_participant
#   has_primary_input
#   has_primary_input_or_output
#   has_primary_output
# Walk the GO ontology and, for every biological-process term that has a
# known item id (`efs`) and an 'intersection_of' definition, print one pair of
# pipe-separated statement lines per chemical participant whose ChEBI id maps
# unambiguously to an item id (`qs`, excluding `dups`).
#
# NOTE(review): the printed lines look like QuickStatements commands (P527 /
# P361 statements with a P3831 / P2868 role qualifier and an S248 reference)
# -- confirm against whatever consumes this output.

# Role item used as the qualifier value, keyed by the relation name that
# starts a 'has_*' clause. Relations that share a role are listed explicitly.
role_by_relation = {
    'has_output': 'Q542929',
    'has_primary_output': 'Q542929',
    'has_input': 'Q45342565',
    'has_primary_input': 'Q45342565',
    'has_intermediate': 'Q7458208',
    'has_participant': 'Q75232720',
    'has_primary_input_or_output': 'Q75232720',
}

ont = pronto.Ontology('/home/ralf/go-ontology/src/ontology/go-edit.obo')
for term in ont.terms.values():
    goid = term.id
    if not goid.startswith('GO:'):
        continue
    goit = efs.get(goid)
    if goit is None:
        # No item id known for this GO term.
        continue
    ix = term.other.get('intersection_of')
    if ix is None:
        continue
    ns = term.other.get('namespace')
    # A term without a namespace entry is skipped; the original indexed the
    # missing value and raised TypeError.
    if not ns or ns[0] != 'biological_process':
        continue
    for cstr in ix:
        if not cstr.startswith('has_'):
            continue
        # A clause is read as '<relation> <chebi id> ...'; anything shorter
        # cannot name a participant (the original raised IndexError here).
        parts = cstr.split()
        if len(parts) < 2:
            continue
        relation, chid = parts[0], parts[1]
        if chid in dups:
            # The ChEBI id maps to several items; do not guess.
            continue
        chit = qs.get(chid)
        if chit is None:
            continue
        role = role_by_relation.get(relation)
        if role is None:
            # A 'has_*' relation this script does not translate.
            continue
        # Process -> chemical, qualified with the chemical's role.
        print('{}|P527|{}|P3831|{}|S248|Q75154902'.format(goit, chit, role))
        # NOTE(review): the original carried a disabled
        # print('-{}|P361|{}'.format(chit, goit)) ahead of each P361 line --
        # presumably to retract an older unqualified statement; restore it
        # here if that is still needed.
        # Chemical -> process. The has_intermediate branch used to emit the
        # qualifier 'P12868' here, a typo for the 'P2868' used by every other
        # branch.
        print('{}|P361|{}|P2868|{}|S248|Q75154902'.format(chit, goit, role))
"""
"""