-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathreference_data.py
More file actions
94 lines (77 loc) · 6.69 KB
/
reference_data.py
File metadata and controls
94 lines (77 loc) · 6.69 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
class ReferenceData:
    """
    Header/metadata rows describing the columns of the reference data table.

    Every ROW_n is a list of 49 strings. Element 0 is the label of the row
    itself ("Short name", "Long name", ...); elements 1-48 describe the 48
    data columns, so index i refers to the same column in every row
    (e.g. ROW_1[5] == "G" and ROW_2[5] == "Glycine").

    There is no ROW_7: the validator in this module notes that it is
    intentionally omitted because it holds the current date.

    Runs of identical values are written as list repetition so the column
    grouping is visible; the counts in each row must always sum to 49.
    """

    # Short column names.
    # NOTE(review): "AvergaeIntLength" looks like a typo for
    # "AverageIntLength"; it is kept unchanged because consumers may match
    # on the exact header text -- confirm before renaming.
    ROW_1 = [
        "Short name", "Mass", "pI", "Charge", "NumResidues",
        "G", "A", "L", "M", "F", "W", "K", "Q", "E", "S",
        "P", "V", "I", "C", "Y", "H", "R", "N", "D", "T",
        "ncont", "scont", "FoldIndex",
        "NumberIntrons", "AvergaeIntLength", "FirstIntLength", "GCcontent",
        "IntronContaining", "Intronless",
        "rRNA", "protein_coding", "ncRNA", "snoRNA", "tRNA", "pseudogene",
        "snRNA",
        "Chromosome1", "Chromosome2", "Chromosome3", "Mitochondria",
        "Abs_telomere", "Abs_centromere", "Rel_telomere", "Rel_centromere",
    ]

    # Human-readable column names, index-aligned with ROW_1.
    ROW_2 = [
        "Long name",
        "Molecular weight (kDa)",
        "Isoelectric point (predicted pH)",
        "Charge",
        "Number of amino acids",
        "Glycine", "Alanine", "Leucine", "Methionine", "Phenylalanine",
        "Tryptophan", "Lysine", "Glutamine", "Glutamic acid", "Serine",
        "Proline", "Valine", "Isoleucine", "Cysteine", "Tyrosine",
        "Histidine", "Arginine", "Asparagine", "Aspartic acid", "Threonine",
        "Nitrogen content", "Sulphur content", "Fold Index",
        "Number of introns", "Average intron length",
        "Length of first intron", "GC contents of first intron",
        "Intron-containing genes", "Intron-less genes",
        "rRNA", "protein_coding", "ncRNA", "snoRNA", "tRNA", "pseudogene",
        "snRNA",
        "Chromosome 1", "Chromosome 2", "Chromosome 3", "Mitochondria",
        "Abs. distance from telomere", "Abs. distance from centromere",
        "Relative distance from telomere",
        "Relative distance from centromere",
    ]

    # Scale of measurement per column.
    ROW_3 = (
        ["Scale of measurement"]
        + ["Metric"] * 31   # Mass .. GCcontent
        + ["Binary"] * 13   # IntronContaining .. Mitochondria
        + ["Metric"] * 4    # telomere/centromere distances
    )

    # Feature group per column.
    ROW_4 = (
        ["Group"]
        + ["Protein Features"] * 27     # Mass .. FoldIndex
        + ["Gene Features"] * 6         # NumberIntrons .. Intronless
        + ["Transcript Features"] * 7   # rRNA .. snRNA
        + ["Gene Features"] * 8         # Chromosome1 .. Rel_centromere
    )

    # Data source per column; only FoldIndex cites a publication.
    ROW_5 = (
        ["Source"]
        + ["Pombase"] * 26              # Mass .. scont
        + [
            "Prilusky J, Felder CE, Zeev-Ben-Mordehai T, Rydberg EH, Man O, "
            "Beckmann JS, Silman I, Sussman JL. 2005. FoldIndex: a simple tool "
            "to predict whether a given protein sequence is intrinsically "
            "unfolded. Bioinformatics 21(16): 3435-3438"
        ]                               # FoldIndex
        + ["Pombase"] * 21              # NumberIntrons .. Rel_centromere
    )

    # Author initials per column.
    ROW_6 = (
        ["Author"]
        + ["DB"] * 4        # Mass .. NumResidues
        + ["DB/VP"] * 22    # G .. scont
        + ["DB"] * 22       # FoldIndex .. Rel_centromere
    )

    # Link per column; every column currently points at the same URL.
    ROW_8 = ["Link"] + ["http://www.pombase.org"] * 48
def main(reference=None):
    """
    Validate that every reference-data row has the same length as ROW_1.

    One line is printed per compared row. A mismatch line includes both
    lengths so the offending row can be fixed without re-counting by hand.
    NOTE: Row 7 is intentionally omitted as it is the current date.

    Args:
        reference: Object exposing ROW_1..ROW_6 and ROW_8 as sized
            attributes. Defaults to ``ReferenceData`` when omitted.

    Returns:
        0 if every row matches the length of ROW_1, otherwise 1, so the
        value can be used directly as a process exit status.
    """
    if reference is None:
        reference = ReferenceData

    expected = len(reference.ROW_1)
    exit_status = 0
    # ROW_7 is deliberately absent from this list (see docstring).
    for row_name in ("ROW_2", "ROW_3", "ROW_4", "ROW_5", "ROW_6", "ROW_8"):
        actual = len(getattr(reference, row_name))
        if actual == expected:
            print(f"The lengths of ROW_1 and {row_name} match.")
        else:
            exit_status = 1
            print(
                f"The lengths of ROW_1 {expected} and {row_name} {actual} "
                "do not match."
            )
    return exit_status


# Run the validation when executed as a script and report the outcome
# through the process exit status (0 = all rows match, 1 = mismatch).
if __name__ == "__main__":
    raise SystemExit(main())