%load_ext autoreload
%autoreload 2
The autoreload extension is already loaded. To reload it, use: %reload_ext autoreload
%pylab inline
Populating the interactive namespace from numpy and matplotlib
WARNING: pylab import has clobbered these variables: ['clf', 'grid'] `%matplotlib` prevents importing * from pylab and numpy
import dammit
from dammit.model import CRBL
reload(dammit)
<module 'dammit' from 'dammit/__init__.pyc'>
import seaborn as sns
import pandas as pd
from sklearn import svm
from sklearn import preprocessing
from sklearn.naive_bayes import GaussianNB
import numpy as np
# Plot styling: seaborn 'ticks' theme plus two cubehelix colormaps
# (a "blue" and a "red" one that differ only in start hue and rotation).
sns.set_style('ticks')
blue_ct_cmap = sns.cubehelix_palette(
    10, start=.5, rot=-.3, light=1, dark=.4, as_cmap=True)
red_ct_cmap = sns.cubehelix_palette(
    10, start=1.5, rot=-.5, light=1, dark=.4, as_cmap=True)

# Preview ten evenly spaced entries (indices 0..255) from each colormap.
_swatch_idx = np.linspace(0, 255, 10, dtype=int)
for _cmap in (blue_ct_cmap, red_ct_cmap):
    sns.palplot(_cmap.colors[_swatch_idx])
def get_grid(mins, maxs, clf, resolution=1000):
    """Evaluate ``clf.predict`` on a square 2-D grid.

    Both axes cover the same interval ``[mins, maxs]``, sampled at
    ``resolution`` evenly spaced points, so the classifier is queried at
    ``resolution ** 2`` locations.

    Parameters
    ----------
    mins, maxs : scalar
        Lower and upper bound used for both the x and the y axis.
    clf : object
        Anything exposing ``predict(X)`` where ``X`` is an array with one
        row per grid point and two columns (x, y); it must return one value
        per row.
    resolution : int, optional
        Number of samples per axis (default 1000).

    Returns
    -------
    xx, yy, Z : numpy.ndarray
        The ``np.meshgrid`` coordinate arrays and the predictions reshaped
        to the same ``(resolution, resolution)`` shape.
    """
    axis = np.linspace(mins, maxs, resolution)
    xx, yy = np.meshgrid(axis, axis)
    # One row per grid point: column 0 is x, column 1 is y.
    grid_points = np.c_[xx.ravel(), yy.ravel()]
    Z = np.asarray(clf.predict(grid_points)).reshape(xx.shape)
    return xx, yy, Z
def scale_evalue(col, zero_value=1e-256):
    """Return ``-log10`` of a Series of E-values.

    Exact zeros cannot be log-transformed, so they are first replaced by
    ``zero_value``. The input Series is left untouched; a new Series is
    returned.

    Parameters
    ----------
    col : pandas.Series
        E-values to transform.
    zero_value : float, optional
        Stand-in for entries equal to ``0.0`` (default ``1e-256``, which
        maps to ``256.0``).

    Returns
    -------
    pandas.Series
        ``-np.log10`` of the zero-substituted values, same index as ``col``.
    """
    # NOTE(review): nonzero E-values smaller than ``zero_value`` end up with a
    # larger score than an exact zero -- confirm that ordering is intended.
    # ``where`` keeps entries satisfying the condition and substitutes the rest.
    nonzero = col.where(col != 0.0, zero_value)
    return -np.log10(nonzero)
# Column layout shared by both toy alignment tables.
_ALN_COLUMNS = [u'E', u'EG2', u'q_aln_len', u'q_len', u'q_name', u'q_start',
                u'q_strand', u's_aln_len', u's_len', u's_name', u's_start',
                u's_strand', u'score', u'bitscore']

# Toy alignments with tr_A* sequences as queries and pr_B* sequences as
# subjects; one row per hit.
test_aln_A = pd.DataFrame(
    [[0.0, 0.0, 200, 2000, 'tr_Aa', 200, '+', 70, 70, 'pr_Ba', 0, '+', 200, 200.0],
     [1e-100, 1e-100, 200, 2000, 'tr_Aa', 200, '+', 70, 70, 'pr_Bb', 0, '+', 200, 200.0],
     [0.0, 0.0, 200, 2000, 'tr_Ab', 200, '+', 70, 70, 'pr_Ba', 0, '+', 200, 200.0],
     [0.0, 0.0, 200, 2000, 'tr_Ac', 200, '+', 70, 70, 'pr_Bc', 0, '+', 200, 200.0]],
    columns=_ALN_COLUMNS)

# The opposite direction: pr_B* sequences as queries, tr_A* as subjects.
test_aln_B = pd.DataFrame(
    [[0.0, 0.0, 200, 2000, 'pr_Ba', 200, '+', 70, 70, 'tr_Aa', 0, '+', 200, 200.0],
     [0.0, 0.0, 200, 2000, 'pr_Ba', 200, '+', 70, 70, 'tr_Ac', 0, '+', 200, 200.0],
     [1e-100, 1e-100, 200, 2000, 'pr_Ba', 200, '+', 70, 70, 'tr_Ab', 0, '+', 200, 200.0],
     [0.0, 0.0, 200, 2000, 'pr_Bb', 200, '+', 70, 70, 'tr_Aa', 0, '+', 200, 200.0]],
    columns=_ALN_COLUMNS)
# Call CRBL.reciprocal_best_hits on the two toy alignment tables; as a bare
# expression, its return value is what the notebook displays.
CRBL.reciprocal_best_hits(test_aln_A, test_aln_B)
E | EG2_x | q_aln_len | q_len | q_name | q_start_x | q_strand_x | s_aln_len_x | s_len_x | s_start_x | ... | s_len | s_name | q_start_y | q_strand_y | s_aln_len_y | s_len_y | s_start_y | s_strand_y | score_y | bitscore_y | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 0 | 0 | 200 | 2000 | tr_Aa | 200 | + | 70 | 70 | 0 | ... | 2000 | pr_Ba | 200 | + | 70 | 70 | 0 | + | 200 | 200 |
1 rows × 26 columns
# NOTE(review): bh_df is first assigned further down in this file, so this
# expression only works once that later cell has been executed.
bh_df.columns
Index([u'E', u'EG2', u'q_aln_len', u'q_len', u'q_name', u'q_start', u'q_strand', u's_aln_len', u's_len', u's_name', u's_start', u's_strand', u'score', u'bitscore', u'RBH'], dtype='object')
# Load the reciprocal-best-hit table from CSV and put its E-values on the
# -log10 scale (a copy is passed so the transform never sees the live column).
rbh_df = pd.read_csv('pom.500.fa.dammit/pom.500.fa.transdecoder.pep.rbhx.pep.fa.csv')
rbh_df['E'] = scale_evalue(rbh_df['E'].copy())

# Gather every frame yielded by maf_to_df_iter into a single DataFrame.
bh_df = pd.concat(list(dammit.parsers.maf_to_df_iter('pom.500.fa.dammit/pom.500.fa.x.pep.fa.maf')))
bh_df['E'] = scale_evalue(bh_df['E'].copy())

# Flag the rows whose index label also occurs in rbh_df's index. A boolean
# mask is used so labels missing from bh_df are simply ignored.
# NOTE(review): this matches on row labels, not on q_name/s_name -- confirm
# that the two frames really share a meaningful index.
bh_df['RBH'] = False
bh_df.loc[bh_df.index.isin(rbh_df.index), 'RBH'] = True

# Sort descending by (q_name, E), keep the first row per q_name, and show
# only those flagged as RBH.
bh_df.sort_values(by=['q_name', 'E'], ascending=False).drop_duplicates(subset='q_name').query('RBH == True')
E | EG2 | q_aln_len | q_len | q_name | q_start | q_strand | s_aln_len | s_len | s_name | s_start | s_strand | score | bitscore | RBH | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
172 | 51.920819 | 1.400000e-44 | 210 | 2270 | SPAPJ695.02_74452_76721_-1_SPAPJ695.02_I_prote... | 811 | + | 70 | 70 | SPAPJ695.02_SPAPJ695.02_I_Schizosaccharomyces | 0 | + | 385 | 205.442170 | True |
168 | 99.431798 | 3.900000e-86 | 351 | 587 | SPAPJ695.01c_77480_78066_-1_SPAPJ695.01c_I_pro... | 135 | + | 117 | 117 | SPAPJ695.01c_SPAPJ695.01c_I_S. | 0 | + | 647 | 343.501215 | True |
54 | 114.154902 | 1.600000e-101 | 399 | 747 | SPAC977.18_31140_32345_-1_SPAC977.18_I_protein... | 158 | + | 133 | 133 | SPAC977.18_SPAC977.18_I_conserved | 0 | + | 744 | 394.614678 | True |
167 | 256.000000 | 0.000000e+00 | 1794 | 3603 | SPAC977.17_66219_69821_1_SPAC977.17_I_protein_... | 924 | + | 598 | 598 | SPAC977.17_SPAC977.17_I_MIP | 0 | + | 3447 | 1818.941394 | True |
153 | 256.000000 | 0.000000e+00 | 1773 | 2421 | SPAC977.16c_64559_66980_-1_dak2_I_protein_codi... | 300 | + | 591 | 591 | SPAC977.16c_dak2_I_dihydroxyacetone | 0 | + | 3254 | 1717.241410 | True |
160 | 237.920819 | 4.400000e-212 | 741 | 902 | SPAC977.15_62961_63862_1_SPAC977.15_I_protein_... | 28 | + | 247 | 247 | SPAC977.15_SPAC977.15_I_dienelactone | 0 | + | 1441 | 761.893894 | True |
159 | 282.522879 | 3.100000e-258 | 975 | 1294 | SPAC977.14c_59614_60907_-1_SPAC977.14c_I_prote... | 215 | + | 325 | 325 | SPAC750.01_SPAC750.01_I_aldo_keto | 0 | + | 1732 | 915.234284 | True |
155 | 320.886260 | 8.100000e-293 | 1068 | 1364 | SPAC977.12_56373_57736_1_SPAC977.12_I_protein_... | 119 | + | 356 | 356 | SPAC977.12_SPAC977.12_I_L-asparaginase | 0 | + | 1950 | 1030.107841 | True |
157 | 290.420216 | 2.900000e-264 | 933 | 1250 | SPAC977.11_55059_56308_1_SPAC977.11_I_protein_... | 215 | + | 311 | 311 | SPAC977.11_SPAC977.11_I_CRCB | 0 | + | 1770 | 935.258115 | True |
82 | 256.000000 | 0.000000e+00 | 1404 | 2836 | SPAC977.10_50946_53858_1_sod2_I_protein_coding... | 1171 | + | 468 | 468 | SPAC977.10_sod2_I_plasma | 0 | + | 2609 | 1377.363226 | True |
85 | 298.721246 | 1.400000e-287 | 1713 | 2461 | SPAC977.09c_45875_48399_-1_SPAC977.09c_I_prote... | 413 | + | 570 | 623 | SPCC1450.09c_SPCC1450.09c_III_phospholipase | 51 | + | 1917 | 1012.718725 | True |
86 | 215.091515 | 8.000000e-191 | 708 | 825 | SPAC977.08_44644_45468_1_SPAC977.08_I_protein_... | 60 | + | 236 | 236 | SPAC977.08_SPAC977.08_I_short | 0 | + | 1307 | 691.283543 | True |
83 | 256.000000 | 0.000000e+00 | 1248 | 1251 | SPAC977.07c_42057_43307_-1_pfl6_I_protein_codi... | 0 | + | 416 | 416 | SPAC977.07c_pfl6_I_cell | 0 | + | 2357 | 1244.573610 | True |
91 | 176.356547 | 4.500000e-153 | 592 | 607 | SPAC977.06_39416_40072_1_SPAC977.06_I_protein_... | 15 | + | 198 | 230 | SPBC1348.07_SPBC1348.07_II_S. | 0 | + | 1069 | 565.871128 | True |
30 | 191.886057 | 2.100000e-166 | 612 | 615 | SPAC977.05c_35768_36382_-1_SPAC977.05c_I_prote... | 0 | + | 204 | 204 | SPAC977.05c_SPAC977.05c_I_conserved | 0 | + | 1153 | 610.134333 | True |
39 | 151.721246 | 3.000000e-133 | 501 | 681 | SPAC977.04_34298_34978_1_SPAC977.04_I_protein_... | 15 | + | 167 | 485 | SPAC750.02c_SPAC750.02c_I_transmembrane | 318 | + | 944 | 500.003263 | True |
46 | 133.795880 | 8.800000e-113 | 435 | 438 | SPAC977.03_33835_34272_1_SPAC977.03_I_protein_... | 0 | + | 145 | 145 | SPAC977.03_SPAC977.03_I_methyltransferase | 0 | + | 815 | 432.027626 | True |
44 | 124.337242 | 2.100000e-113 | 438 | 979 | SPAC977.02_32034_33012_1_SPAC977.02_I_protein_... | 196 | + | 146 | 146 | SPAC977.02_SPAC977.02_I_S. | 0 | + | 819 | 434.135398 | True |
20 | 296.698970 | 6.300000e-271 | 948 | 1306 | SPAC977.01_29764_31069_1_SPAC977.01_I_protein_... | 2 | + | 316 | 316 | SPAC977.01_SPAC977.01_I_S. | 0 | + | 1812 | 957.389718 | True |
361 | 305.744727 | 1.900000e-293 | 1038 | 2372 | SPAC5H10.13c_167766_170137_-1_gmh2_I_protein_c... | 287 | + | 346 | 346 | SPAC5H10.13c_gmh2_I_alpha-1 | 0 | + | 1954 | 1032.215613 | True |
348 | 256.000000 | 0.000000e+00 | 1113 | 2013 | SPAC5H10.12c_165814_167826_-1_SPAC5H10.12c_I_p... | 291 | + | 371 | 371 | SPAC5H10.12c_SPAC5H10.12c_I_acetylglucosaminyl... | 0 | + | 2132 | 1126.011453 | True |
349 | 295.769551 | 2.000000e-277 | 987 | 1766 | SPAC5H10.11_164570_166335_1_gmh1_I_protein_cod... | 158 | + | 329 | 329 | SPAC5H10.11_gmh1_I_alpha-1 | 0 | + | 1853 | 978.994378 | True |
347 | 256.000000 | 0.000000e+00 | 1176 | 1880 | SPAC5H10.10_162756_164635_1_SPAC5H10.10_I_prot... | 204 | + | 392 | 392 | SPAC5H10.10_SPAC5H10.10_I_NADPH | 0 | + | 2262 | 1194.514033 | True |
351 | 249.795880 | 5.800000e-221 | 801 | 846 | SPAC5H10.09c_160977_161822_-1_ecm31_I_protein_... | 42 | + | 267 | 267 | SPAC5H10.09c_ecm31_I_3-methyl-2-oxobutanoatehy... | 0 | + | 1497 | 791.402698 | True |
350 | 257.721246 | 1.500000e-232 | 849 | 1066 | SPAC5H10.08c_159880_160945_-1_pan6_I_protein_c... | 0 | + | 283 | 283 | SPAC5H10.08c_pan6_I_pantoate-beta-alanine | 0 | + | 1570 | 829.869531 | True |
343 | 73.468521 | 6.400000e-64 | 267 | 696 | SPAC5H10.07_158777_159472_1_SPAC5H10.07_I_prot... | 426 | + | 89 | 89 | SPAC5H10.07_SPAC5H10.07_I_Schizosaccharomyces | 0 | + | 507 | 269.729206 | True |
340 | 256.000000 | 0.000000e+00 | 1137 | 1878 | SPAC5H10.06c_156430_158307_-1_adh4_I_protein_c... | 620 | + | 379 | 379 | SPAC5H10.06c_adh4_I_alcohol | 0 | + | 2117 | 1118.107309 | True |
344 | 256.000000 | 0.000000e+00 | 1146 | 2514 | SPAC5H10.05c_153070_155583_-1_SPAC5H10.05c_I_p... | 317 | - | 382 | 382 | SPAC5H10.04_SPAC5H10.04_I_NADPH | 0 | + | 2203 | 1163.424400 | True |
339 | 256.000000 | 0.000000e+00 | 1146 | 2665 | SPAC5H10.04_152851_155515_1_SPAC5H10.04_I_prot... | 536 | + | 382 | 382 | SPAC5H10.04_SPAC5H10.04_I_NADPH | 0 | + | 2203 | 1163.424400 | True |
332 | 186.161151 | 9.100000e-179 | 657 | 3464 | SPAC5H10.03_149446_152909_1_SPAC5H10.03_I_prot... | 2467 | + | 219 | 219 | SPAC5H10.03_SPAC5H10.03_I_phosphoglycerate | 0 | + | 1231 | 651.235881 | True |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
412 | 256.000000 | 0.000000e+00 | 2577 | 3066 | SPAC13G6.12c_195940_199051_-1_chs1_I_protein_c... | 336 | + | 859 | 859 | SPAC13G6.12c_chs1_I_chitin | 0 | + | 4861 | 2564.038684 | True |
414 | 256.000000 | 0.000000e+00 | 1212 | 1279 | SPAC13G6.11c_194099_195626_-1_erg12_I_protein_... | 44 | + | 404 | 404 | SPAC13G6.11c_erg12_I_mevalonate | 0 | + | 2213 | 1168.693829 | True |
413 | 256.000000 | 0.000000e+00 | 1590 | 2126 | SPAC13G6.10c_191928_194053_-1_asl1_I_protein_c... | 165 | + | 530 | 530 | SPAC13G6.10c_asl1_I_cell | 0 | + | 2918 | 1540.188589 | True |
415 | 247.167491 | 4.600000e-232 | 822 | 1611 | SPAC13G6.09_190192_191947_1_SPAC13G6.09_I_prot... | 130 | + | 274 | 274 | SPAC13G6.09_SPAC13G6.09_I_SSU-rRNA | 0 | + | 1567 | 828.288702 | True |
405 | 256.000000 | 0.000000e+00 | 1605 | 2331 | SPAC13G6.08_187701_190031_1_SPAC13G6.08_I_prot... | 676 | + | 535 | 535 | SPAC13G6.08_SPAC13G6.08_I_Cdc20_Fizzy | 0 | + | 3041 | 1605.002568 | True |
406 | 209.455932 | 4.200000e-195 | 717 | 1370 | SPAC13G6.07c_186314_187683_-1_rps601_I_protein... | 120 | + | 239 | 239 | SPAC13G6.07c_rps601_I_40S | 0 | + | 1334 | 705.511002 | True |
404 | 256.000000 | 0.000000e+00 | 3093 | 4022 | SPAC13G6.06c_182337_186358_-1_gcv2_I_protein_c... | 287 | + | 1031 | 1031 | SPAC13G6.06c_gcv2_I_glycine | 0 | + | 5839 | 3079.388861 | True |
399 | 231.148742 | 4.100000e-208 | 759 | 996 | SPAC13G6.05c_180903_182254_-1_trs33_I_protein_... | 60 | + | 253 | 253 | SPAC13G6.05c_trs33_I_TRAPP | 0 | + | 1416 | 748.720321 | True |
402 | 73.187087 | 1.700000e-62 | 261 | 573 | SPAC13G6.04_180272_181069_1_tim8_I_protein_cod... | 151 | + | 87 | 87 | SPAC13G6.04_tim8_I_TIM22 | 0 | + | 498 | 264.986720 | True |
398 | 256.000000 | 0.000000e+00 | 2274 | 4139 | SPAC13G6.03_175890_180028_1_gpi7_I_protein_cod... | 1402 | + | 758 | 758 | SPAC13G6.03_gpi7_I_GPI | 0 | + | 4217 | 2224.687443 | True |
400 | 212.091515 | 1.300000e-201 | 756 | 1791 | SPAC13G6.02c_174865_176655_-1_rps101_I_protein... | 884 | + | 252 | 252 | SPAC13G6.02c_rps101_I_40S | 0 | + | 1375 | 727.115662 | True |
360 | 256.000000 | 0.000000e+00 | 3399 | 4213 | SPAC13G6.01c_170489_174701_-1_rad8_I_protein_c... | 328 | + | 1133 | 1133 | SPAC13G6.01c_rad8_I_ubiquitin-protein | 0 | + | 6393 | 3371.315239 | True |
203 | 60.823909 | 3.900000e-53 | 231 | 1469 | SPAC11D3.19_106893_108361_1_SPAC11D3.19_I_prot... | 72 | + | 77 | 77 | SPAC11D3.19_SPAC11D3.19_I_Schizosaccharomyces | 0 | + | 439 | 233.897088 | True |
325 | 256.000000 | 0.000000e+00 | 1494 | 2075 | SPAC11D3.18c_144819_146935_-1_SPAC11D3.18c_I_p... | 535 | + | 498 | 498 | SPAC11D3.18c_SPAC11D3.18c_I_plasma | 0 | + | 2761 | 1457.458550 | True |
324 | 256.000000 | 0.000000e+00 | 1755 | 3522 | SPAC11D3.17_141199_144768_1_SPAC11D3.17_I_prot... | 1428 | + | 585 | 585 | SPAC11D3.17_SPAC11D3.17_I_transcription | 0 | + | 3343 | 1764.139330 | True |
323 | 110.275724 | 7.800000e-102 | 393 | 1273 | SPAC11D3.16c_140381_141653_-1_SPAC11D3.16c_I_p... | 453 | + | 131 | 131 | SPAC11D3.16c_SPAC11D3.16c_I_Schizosaccharomyces | 0 | + | 746 | 395.668564 | True |
321 | 256.000000 | 0.000000e+00 | 3951 | 4227 | SPAC11D3.15_136139_140365_1_SPAC11D3.15_I_prot... | 192 | + | 1317 | 1317 | SPAC11D3.15_SPAC11D3.15_I_5-oxoprolinase | 0 | + | 7345 | 3872.964900 | True |
319 | 256.000000 | 0.000000e+00 | 3780 | 4547 | SPAC11D3.14c_131190_135736_-1_SPAC11D3.14c_I_p... | 635 | + | 1260 | 1260 | SPAC11D3.14c_SPAC11D3.14c_I_5-oxoprolinase | 0 | + | 7065 | 3725.420882 | True |
303 | 195.677781 | 2.100000e-179 | 666 | 1121 | SPAC11D3.13_130148_131268_1_hsp3104_I_protein_... | 181 | + | 222 | 222 | SPAC11D3.13_hsp3104_I_ThiJ | 0 | + | 1235 | 653.343653 | True |
299 | 256.000000 | 0.000000e+00 | 1071 | 2279 | SPAC11D3.11c_126951_129316_-1_SPAC11D3.11c_I_p... | 131 | + | 357 | 357 | SPAC11D3.11c_SPAC11D3.11c_I_zn(2)-C6 | 0 | + | 2078 | 1097.556535 | True |
315 | 307.193820 | 1.200000e-299 | 1026 | 4147 | SPAC11D3.10_124907_129053_1_SPAC11D3.10_I_prot... | 0 | - | 342 | 357 | SPAC11D3.11c_SPAC11D3.11c_I_zn(2)-C6 | 15 | + | 1993 | 1052.766387 | True |
285 | 256.000000 | 0.000000e+00 | 1182 | 1930 | SPAC11D3.09_122187_124116_1_SPAC11D3.09_I_prot... | 658 | + | 394 | 394 | SPAC11D3.09_SPAC11D3.09_I_agmatinase | 0 | + | 2219 | 1171.855487 | True |
295 | 272.619789 | 6.700000e-265 | 939 | 3465 | SPAC11D3.08c_120321_123785_-1_SPAC11D3.08c_I_p... | 2524 | - | 313 | 394 | SPAC11D3.09_SPAC11D3.09_I_agmatinase | 0 | + | 1774 | 937.365887 | True |
271 | 256.000000 | 0.000000e+00 | 1911 | 4256 | SPAC11D3.07c_116054_120309_-1_toe4_I_protein_c... | 201 | + | 637 | 637 | SPAC11D3.07c_toe4_I_transcription | 0 | + | 3600 | 1899.563661 | True |
272 | 256.000000 | 0.000000e+00 | 1365 | 1859 | SPAC11D3.06_116331_118189_1_SPAC11D3.06_I_prot... | 362 | + | 455 | 455 | SPAC11D3.06_SPAC11D3.06_I_MatE | 0 | + | 2482 | 1310.441475 | True |
253 | 310.045757 | 1.900000e-293 | 1536 | 2013 | SPAC11D3.05_113950_115962_1_mfs2_I_protein_cod... | 232 | + | 508 | 541 | SPBC530.02_SPBC530.02_II_transmembrane | 33 | + | 1954 | 1032.215613 | True |
257 | 104.142668 | 1.900000e-96 | 390 | 1865 | SPAC11D3.04c_112514_114445_-1_SPAC11D3.04c_I_p... | 1069 | + | 130 | 130 | SPAC11D3.04c_SPAC11D3.04c_I_polyketide | 0 | + | 712 | 377.752505 | True |
254 | 286.568636 | 2.200000e-265 | 906 | 1501 | SPAC11D3.03c_110904_112499_-1_SPAC11D3.03c_I_p... | 491 | + | 302 | 302 | SPAC11D3.03c_SPAC11D3.03c_I_conserved | 0 | + | 1777 | 938.946716 | True |
196 | 132.397940 | 1.800000e-115 | 450 | 627 | SPAC11D3.02c_109829_110455_-1_SPAC11D3.02c_I_p... | 174 | + | 150 | 150 | SPAC11D3.02c_SPAC11D3.02c_I_ELLA | 0 | + | 832 | 440.985656 | True |
202 | 67.853872 | 2.600000e-56 | 237 | 464 | SPAC11D3.01c_108732_109195_-1_SPAC11D3.01c_I_p... | 48 | + | 79 | 79 | SPAC11D3.01c_SPAC11D3.01c_I_conserved | 0 | + | 459 | 244.435946 | True |
82 rows × 15 columns
# Read the two alignment files (by their names: peptides against the
# database, and the database against the peptides) into one frame each,
# then compute the reciprocal best hits between them.
_read_maf = dammit.parsers.maf_to_df_iter
pep_x_db_df = pd.concat(
    list(_read_maf('pom.500.fa.dammit/pom.500.fa.transdecoder.pep.x.pep.fa.maf')))
db_x_pep_df = pd.concat(
    list(_read_maf('pom.500.fa.dammit/pep.fa.x.pom.500.fa.transdecoder.pep.maf')))
rbh_pep_df = CRBL.reciprocal_best_hits(pep_x_db_df, db_x_pep_df)
# Bare expression so the notebook renders the resulting table.
rbh_pep_df
E | EG2_x | q_aln_len | q_len | q_name | q_start_x | q_strand_x | s_aln_len_x | s_len_x | s_start_x | ... | s_len | s_name | q_start_y | q_strand_y | s_aln_len_y | s_len_y | s_start_y | s_strand_y | score_y | bitscore_y | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 0.000000e+00 | 0.000000e+00 | 1473 | 1474 | SPAC10F6.01c_1200916_1206090_-1_sir1_I_protein... | 0 | + | 1473 | 1473 | 0 | ... | 1473 | SPAC10F6.01c_sir1_I_sulfite | 0 | + | 1473 | 1474 | 0 | + | 7597 | 3356.382439 |
1 | 0.000000e+00 | 0.000000e+00 | 1168 | 1169 | SPAC10F6.02c_1206812_1210630_-1_prp22_I_protei... | 0 | + | 1168 | 1168 | 0 | ... | 1168 | SPAC10F6.02c_prp22_I_ATP-dependent | 0 | + | 1168 | 1169 | 0 | + | 6008 | 2655.044067 |
2 | 0.000000e+00 | 0.000000e+00 | 600 | 601 | SPAC10F6.03c_1211195_1213553_-1_cts1_I_protein... | 0 | + | 600 | 600 | 0 | ... | 600 | SPAC10F6.03c_cts1_I_CTP | 0 | + | 600 | 601 | 0 | + | 3123 | 1381.689000 |
3 | 1.500000e-275 | 1.100000e-234 | 351 | 352 | SPAC10F6.04_1213255_1216120_1_SPAC10F6.04_I_pr... | 0 | + | 351 | 351 | 0 | ... | 351 | SPAC10F6.04_SPAC10F6.04_I_RCC | 0 | + | 351 | 352 | 0 | + | 1889 | 837.037300 |
5 | 3.700000e-173 | 3.700000e-143 | 227 | 243 | SPAC10F6.05c_1214788_1217067_-1_ubc6_I_protein... | 15 | + | 227 | 227 | 0 | ... | 227 | SPAC10F6.05c_ubc6_I_ubiquitin | 0 | + | 227 | 243 | 15 | + | 1200 | 532.932745 |
6 | 1.600000e-184 | 3.000000e-153 | 257 | 258 | SPAC10F6.06_1217077_1218228_1_vip1_I_protein_c... | 0 | + | 257 | 257 | 0 | ... | 257 | SPAC10F6.06_vip1_I_RNA-binding | 0 | + | 257 | 258 | 0 | + | 1276 | 566.476934 |
7 | 1.400000e-142 | 1.600000e-115 | 188 | 189 | SPAC10F6.07c_1218321_1218887_-1_mug94_I_protei... | 0 | + | 188 | 188 | 0 | ... | 188 | SPAC10F6.07c_mug94_I_Schizosaccharomyces | 0 | + | 188 | 189 | 0 | + | 992 | 441.127596 |
8 | 2.100000e-249 | 1.600000e-212 | 341 | 358 | SPAC10F6.08c_1219667_1220847_-1_nht1_I_protein... | 16 | + | 341 | 341 | 0 | ... | 341 | SPAC10F6.08c_nht1_I_Ino80 | 0 | + | 341 | 358 | 16 | + | 1722 | 763.328358 |
9 | 0.000000e+00 | 0.000000e+00 | 908 | 916 | SPAC10F6.09c_1220969_1224862_-1_psm3_I_protein... | 8 | + | 908 | 1194 | 0 | ... | 1194 | SPAC10F6.09c_psm3_I_mitotic | 0 | + | 908 | 916 | 8 | + | 4532 | 2003.580608 |
10 | 3.400000e-57 | 8.700000e-40 | 79 | 96 | SPAC11D3.01c_108732_109195_-1_SPAC11D3.01c_I_p... | 16 | + | 79 | 79 | 0 | ... | 79 | SPAC11D3.01c_SPAC11D3.01c_I_conserved | 0 | + | 79 | 96 | 16 | + | 422 | 189.546179 |
11 | 9.200000e-110 | 3.700000e-86 | 150 | 151 | SPAC11D3.02c_109829_110455_-1_SPAC11D3.02c_I_p... | 0 | + | 150 | 150 | 0 | ... | 150 | SPAC11D3.02c_SPAC11D3.02c_I_ELLA | 0 | + | 150 | 151 | 0 | + | 771 | 343.584626 |
12 | 8.600000e-241 | 2.400000e-203 | 302 | 303 | SPAC11D3.03c_110904_112499_-1_SPAC11D3.03c_I_p... | 0 | + | 302 | 302 | 0 | ... | 302 | SPAC11D3.03c_SPAC11D3.03c_I_conserved | 0 | + | 302 | 303 | 0 | + | 1653 | 732.873766 |
13 | 3.200000e-92 | 1.300000e-70 | 130 | 131 | SPAC11D3.04c_112514_114445_-1_SPAC11D3.04c_I_p... | 0 | + | 130 | 130 | 0 | ... | 130 | SPAC11D3.04c_SPAC11D3.04c_I_polyketide | 0 | + | 130 | 131 | 0 | + | 654 | 291.944229 |
15 | 0.000000e+00 | 0.000000e+00 | 546 | 547 | SPAC11D3.05_113950_115962_1_mfs2_I_protein_cod... | 0 | + | 546 | 546 | 0 | ... | 546 | SPAC11D3.05_mfs2_I_MFS | 0 | + | 546 | 547 | 0 | + | 2905 | 1285.470142 |
16 | 0.000000e+00 | 5.700000e-290 | 455 | 456 | SPAC11D3.06_116331_118189_1_SPAC11D3.06_I_prot... | 0 | + | 455 | 455 | 0 | ... | 455 | SPAC11D3.06_SPAC11D3.06_I_MatE | 0 | + | 455 | 456 | 0 | + | 2305 | 1020.647597 |
18 | 0.000000e+00 | 0.000000e+00 | 637 | 638 | SPAC11D3.07c_116054_120309_-1_toe4_I_protein_c... | 0 | + | 637 | 637 | 0 | ... | 637 | SPAC11D3.07c_toe4_I_transcription | 0 | + | 637 | 638 | 0 | + | 3330 | 1473.052777 |
19 | 0.000000e+00 | 0.000000e+00 | 550 | 551 | SPAC11D3.08c_120321_123785_-1_SPAC11D3.08c_I_p... | 0 | + | 550 | 550 | 0 | ... | 550 | SPAC11D3.08c_SPAC11D3.08c_I_amino | 0 | + | 550 | 551 | 0 | + | 2833 | 1253.691437 |
21 | 2.000000e-298 | 1.100000e-255 | 394 | 395 | SPAC11D3.09_122187_124116_1_SPAC11D3.09_I_prot... | 0 | + | 394 | 394 | 0 | ... | 394 | SPAC11D3.09_SPAC11D3.09_I_agmatinase | 0 | + | 394 | 395 | 0 | + | 2047 | 906.773903 |
22 | 0.000000e+00 | 6.100000e-281 | 434 | 435 | SPAC11D3.10_124907_129053_1_SPAC11D3.10_I_prot... | 0 | + | 434 | 434 | 0 | ... | 434 | SPAC11D3.10_SPAC11D3.10_I_nifs | 0 | + | 434 | 435 | 0 | + | 2237 | 990.634376 |
24 | 1.100000e-281 | 3.800000e-240 | 357 | 358 | SPAC11D3.11c_126951_129316_-1_SPAC11D3.11c_I_p... | 0 | + | 357 | 357 | 0 | ... | 357 | SPAC11D3.11c_SPAC11D3.11c_I_zn(2)-C6 | 0 | + | 357 | 358 | 0 | + | 1930 | 855.133507 |
27 | 2.700000e-165 | 7.600000e-136 | 222 | 223 | SPAC11D3.13_130148_131268_1_hsp3104_I_protein_... | 0 | + | 222 | 222 | 0 | ... | 222 | SPAC11D3.13_hsp3104_I_ThiJ | 0 | + | 222 | 223 | 0 | + | 1145 | 508.657345 |
28 | 0.000000e+00 | 0.000000e+00 | 1260 | 1261 | SPAC11D3.14c_131190_135736_-1_SPAC11D3.14c_I_p... | 0 | + | 1260 | 1260 | 0 | ... | 1260 | SPAC11D3.14c_SPAC11D3.14c_I_5-oxoprolinase | 0 | + | 1260 | 1261 | 0 | + | 6526 | 2883.674197 |
29 | 0.000000e+00 | 0.000000e+00 | 1317 | 1318 | SPAC11D3.15_136139_140365_1_SPAC11D3.15_I_prot... | 0 | + | 1317 | 1317 | 0 | ... | 1317 | SPAC11D3.15_SPAC11D3.15_I_5-oxoprolinase | 0 | + | 1317 | 1318 | 0 | + | 6787 | 2998.872004 |
30 | 1.000000e-97 | 2.900000e-75 | 131 | 132 | SPAC11D3.16c_140381_141653_-1_SPAC11D3.16c_I_p... | 0 | + | 131 | 131 | 0 | ... | 131 | SPAC11D3.16c_SPAC11D3.16c_I_Schizosaccharomyces | 0 | + | 131 | 132 | 0 | + | 689 | 307.392211 |
31 | 0.000000e+00 | 0.000000e+00 | 585 | 586 | SPAC11D3.17_141199_144768_1_SPAC11D3.17_I_prot... | 0 | + | 585 | 585 | 0 | ... | 585 | SPAC11D3.17_SPAC11D3.17_I_transcription | 0 | + | 585 | 586 | 0 | + | 3105 | 1373.744323 |
32 | 0.000000e+00 | 0.000000e+00 | 498 | 499 | SPAC11D3.18c_144819_146935_-1_SPAC11D3.18c_I_p... | 0 | + | 498 | 498 | 0 | ... | 498 | SPAC11D3.18c_SPAC11D3.18c_I_plasma | 0 | + | 498 | 499 | 0 | + | 2554 | 1130.548953 |
33 | 0.000000e+00 | 0.000000e+00 | 542 | 543 | SPAC1296.01c_707948_710479_-1_SPAC1296.01c_I_p... | 0 | + | 542 | 542 | 0 | ... | 542 | SPAC1296.01c_SPAC1296.01c_I_phosphoacetylgluco... | 0 | + | 542 | 543 | 0 | + | 2745 | 1214.850797 |
34 | 5.300000e-122 | 4.700000e-97 | 164 | 165 | SPAC1296.02_711238_712354_1_cox4_I_protein_cod... | 0 | + | 164 | 164 | 0 | ... | 164 | SPAC1296.02_cox4_I_cytochrome | 0 | + | 164 | 165 | 0 | + | 853 | 379.777040 |
35 | 0.000000e+00 | 0.000000e+00 | 507 | 508 | SPAC1296.03c_712217_714070_-1_sxa2_I_protein_c... | 0 | + | 507 | 507 | 0 | ... | 507 | SPAC1296.03c_sxa2_I_serine | 0 | + | 507 | 508 | 0 | + | 2653 | 1174.244673 |
36 | 4.700000e-190 | 1.200000e-157 | 248 | 249 | SPAC1296.04_715377_716978_1_mug65_I_protein_co... | 0 | + | 248 | 248 | 0 | ... | 248 | SPAC1296.04_mug65_I_spore | 0 | + | 248 | 249 | 0 | + | 1309 | 581.042174 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
513 | 1.900000e-264 | 2.100000e-225 | 357 | 358 | SPAC821.05_988076_989866_1_tif38_I_protein_cod... | 0 | + | 357 | 357 | 0 | ... | 357 | SPAC821.05_tif38_I_translation | 0 | + | 357 | 358 | 0 | + | 1819 | 806.141336 |
514 | 3.100000e-250 | 2.200000e-212 | 331 | 332 | SPAC821.06_990192_991889_1_spn2_I_protein_codi... | 0 | + | 331 | 331 | 0 | ... | 331 | SPAC821.06_spn2_I_mitotic | 0 | + | 331 | 332 | 0 | + | 1721 | 762.886988 |
515 | 0.000000e+00 | 0.000000e+00 | 508 | 509 | SPAC821.07c_991632_994230_-1_moc3_I_protein_co... | 0 | + | 508 | 508 | 0 | ... | 508 | SPAC821.07c_moc3_I_transcription | 0 | + | 508 | 509 | 0 | + | 2674 | 1183.513462 |
516 | 0.000000e+00 | 0.000000e+00 | 488 | 489 | SPAC821.08c_994941_997625_-1_slp1_I_protein_co... | 0 | + | 488 | 488 | 0 | ... | 488 | SPAC821.08c_slp1_I_substrate-specific | 0 | + | 488 | 489 | 0 | + | 2574 | 1139.376372 |
517 | 2.100000e-112 | 1.500000e-88 | 154 | 155 | SPAC821.10c_1002838_1003600_-1_sod1_I_protein_... | 0 | + | 154 | 154 | 0 | ... | 154 | SPAC821.10c_sod1_I_superoxide | 0 | + | 154 | 155 | 0 | + | 789 | 351.529302 |
518 | 0.000000e+00 | 1.600000e-282 | 451 | 452 | SPAC821.11_1006259_1008003_1_pro1_I_protein_co... | 0 | + | 451 | 451 | 0 | ... | 451 | SPAC821.11_pro1_I_gamma-glutamyl | 0 | + | 451 | 452 | 0 | + | 2249 | 995.930827 |
519 | 0.000000e+00 | 0.000000e+00 | 469 | 470 | SPAC821.12_1008215_1010318_1_orb6_I_protein_co... | 0 | + | 469 | 469 | 0 | ... | 469 | SPAC821.12_orb6_I_serine_threonine | 0 | + | 469 | 470 | 0 | + | 2482 | 1098.770248 |
520 | 0.000000e+00 | 0.000000e+00 | 1562 | 1563 | SPAC821.13c_1010343_1015415_-1_dnf1_I_protein_... | 0 | + | 1562 | 1562 | 0 | ... | 1562 | SPAC821.13c_dnf1_I_Trans-golgi | 0 | + | 1562 | 1563 | 0 | + | 8035 | 3549.702896 |
521 | 1.100000e-243 | 2.900000e-206 | 316 | 317 | SPAC977.01_29764_31069_1_SPAC977.01_I_protein_... | 0 | + | 316 | 316 | 0 | ... | 316 | SPAC977.01_SPAC977.01_I_S. | 0 | + | 316 | 317 | 0 | + | 1675 | 742.583926 |
522 | 7.400000e-108 | 2.000000e-84 | 146 | 147 | SPAC977.02_32034_33012_1_SPAC977.02_I_protein_... | 0 | + | 146 | 146 | 0 | ... | 146 | SPAC977.02_SPAC977.02_I_S. | 0 | + | 146 | 147 | 0 | + | 758 | 337.846804 |
523 | 8.900000e-108 | 2.700000e-84 | 145 | 146 | SPAC977.03_33835_34272_1_SPAC977.03_I_protein_... | 0 | + | 145 | 145 | 0 | ... | 145 | SPAC977.03_SPAC977.03_I_methyltransferase | 0 | + | 145 | 146 | 0 | + | 757 | 337.405433 |
524 | 9.500000e-126 | 1.700000e-100 | 169 | 173 | SPAC977.04_34298_34978_1_SPAC977.04_I_protein_... | 3 | + | 169 | 485 | 316 | ... | 485 | SPAC750.02c_SPAC750.02c_I_transmembrane | 316 | + | 169 | 173 | 3 | + | 879 | 391.252684 |
525 | 7.200000e-154 | 9.500000e-126 | 204 | 205 | SPAC977.05c_35768_36382_-1_SPAC977.05c_I_prote... | 0 | + | 204 | 204 | 0 | ... | 204 | SPAC977.05c_SPAC977.05c_I_conserved | 0 | + | 204 | 205 | 0 | + | 1069 | 475.113156 |
526 | 2.200000e-142 | 2.200000e-115 | 189 | 195 | SPAC977.06_39416_40072_1_SPAC977.06_I_protein_... | 5 | + | 189 | 189 | 0 | ... | 189 | SPAC977.06_SPAC977.06_I_S. | 0 | + | 189 | 195 | 5 | + | 991 | 440.686225 |
527 | 5.780568e-322 | 1.500000e-276 | 416 | 417 | SPAC977.07c_42057_43307_-1_pfl6_I_protein_codi... | 0 | + | 416 | 416 | 0 | ... | 416 | SPAC977.07c_pfl6_I_cell | 0 | + | 416 | 417 | 0 | + | 2204 | 976.069136 |
528 | 5.800000e-174 | 5.900000e-144 | 236 | 237 | SPAC977.08_44644_45468_1_SPAC977.08_I_protein_... | 0 | + | 236 | 236 | 0 | ... | 236 | SPAC977.08_SPAC977.08_I_short | 0 | + | 236 | 237 | 0 | + | 1206 | 535.580970 |
529 | 0.000000e+00 | 0.000000e+00 | 673 | 674 | SPAC977.09c_45875_48399_-1_SPAC977.09c_I_prote... | 0 | + | 673 | 673 | 0 | ... | 673 | SPAC977.09c_SPAC977.09c_I_phospholipase | 0 | + | 673 | 674 | 0 | + | 3581 | 1583.836875 |
530 | 0.000000e+00 | 0.000000e+00 | 468 | 544 | SPAC977.10_50946_53858_1_sod2_I_protein_coding... | 75 | + | 468 | 468 | 0 | ... | 468 | SPAC977.10_sod2_I_plasma | 0 | + | 468 | 544 | 75 | + | 2433 | 1077.143074 |
531 | 2.300000e-239 | 2.100000e-202 | 311 | 312 | SPAC977.11_55059_56308_1_SPAC977.11_I_protein_... | 0 | + | 311 | 311 | 0 | ... | 311 | SPAC977.11_SPAC977.11_I_CRCB | 0 | + | 311 | 312 | 0 | + | 1646 | 729.784169 |
532 | 7.400000e-262 | 3.900000e-223 | 356 | 357 | SPAC977.12_56373_57736_1_SPAC977.12_I_protein_... | 0 | + | 356 | 356 | 0 | ... | 356 | SPAC977.12_SPAC977.12_I_L-asparaginase | 0 | + | 356 | 357 | 0 | + | 1802 | 798.638031 |
533 | 3.100000e-266 | 1.000000e-226 | 351 | 352 | SPAC977.14c_59614_60907_-1_SPAC977.14c_I_prote... | 0 | + | 351 | 351 | 0 | ... | 351 | SPAC977.14c_SPAC977.14c_I_aldo_keto | 0 | + | 351 | 352 | 0 | + | 1829 | 810.555046 |
534 | 7.600000e-194 | 1.300000e-161 | 247 | 257 | SPAC977.15_62961_63862_1_SPAC977.15_I_protein_... | 9 | + | 247 | 247 | 0 | ... | 247 | SPAC977.15_SPAC977.15_I_dienelactone | 0 | + | 247 | 257 | 9 | + | 1339 | 594.283301 |
535 | 0.000000e+00 | 0.000000e+00 | 591 | 592 | SPAC977.16c_64559_66980_-1_dak2_I_protein_codi... | 0 | + | 591 | 591 | 0 | ... | 591 | SPAC977.16c_dak2_I_dihydroxyacetone | 0 | + | 591 | 592 | 0 | + | 3014 | 1333.579571 |
537 | 0.000000e+00 | 0.000000e+00 | 598 | 599 | SPAC977.17_66219_69821_1_SPAC977.17_I_protein_... | 0 | + | 598 | 598 | 0 | ... | 598 | SPAC977.17_SPAC977.17_I_MIP | 0 | + | 598 | 599 | 0 | + | 3180 | 1406.847141 |
538 | 8.700000e-98 | 2.200000e-75 | 133 | 134 | SPAC977.18_31140_32345_-1_SPAC977.18_I_protein... | 0 | + | 133 | 133 | 0 | ... | 133 | SPAC977.18_SPAC977.18_I_conserved | 0 | + | 133 | 134 | 0 | + | 690 | 307.833582 |
539 | 0.000000e+00 | 0.000000e+00 | 1687 | 1688 | SPAPB21F2.02_492335_497927_1_SPAPB21F2.02_I_pr... | 0 | + | 1687 | 1687 | 0 | ... | 1687 | SPAPB21F2.02_SPAPB21F2.02_I_Dopey | 0 | + | 1687 | 1688 | 0 | + | 8609 | 3803.049797 |
540 | 2.600000e-121 | 8.700000e-97 | 172 | 173 | SPAPB21F2.03_498111_499027_1_slx9_I_protein_co... | 0 | + | 172 | 172 | 0 | ... | 172 | SPAPB21F2.03_slx9_I_ribosome | 0 | + | 172 | 173 | 0 | + | 851 | 378.894298 |
541 | 2.100000e-86 | 3.700000e-65 | 117 | 118 | SPAPJ695.01c_77480_78066_-1_SPAPJ695.01c_I_pro... | 0 | + | 117 | 117 | 0 | ... | 117 | SPAPJ695.01c_SPAPJ695.01c_I_S. | 0 | + | 117 | 118 | 0 | + | 613 | 273.848022 |
542 | 0.000000e+00 | 0.000000e+00 | 549 | 550 | SPAPJ696.01c_719090_723684_-1_vps17_I_protein_... | 0 | + | 549 | 549 | 0 | ... | 549 | SPAPJ696.01c_vps17_I_retromer | 0 | + | 549 | 550 | 0 | + | 2795 | 1236.919342 |
543 | 4.900143e-320 | 2.300000e-275 | 430 | 431 | SPAPJ696.02_724145_725946_1_lsb4_I_protein_cod... | 0 | + | 430 | 430 | 0 | ... | 430 | SPAPJ696.02_lsb4_I_actin | 0 | + | 430 | 431 | 0 | + | 2195 | 972.096798 |
477 rows × 26 columns
# Print every (q_name, s_name) pair from rbh_df, each followed by a blank
# line. A single pre-formatted string is passed to print so the statement
# behaves the same under Python 2 and Python 3.
for q_name, s_name in zip(rbh_df['q_name'], rbh_df['s_name']):
    print('%s \t%s \n' % (q_name, s_name))
SPAC10F6.01c_1200916_1206090_-1_sir1_I_protein_coding_sulfite|m.826 SPAC10F6.01c_sir1_I_sulfite SPAC10F6.02c_1206812_1210630_-1_prp22_I_protein_coding_ATP-dependent|m.834 SPAC10F6.02c_prp22_I_ATP-dependent SPAC10F6.03c_1211195_1213553_-1_cts1_I_protein_coding_CTP|m.835 SPAC10F6.03c_cts1_I_CTP SPAC10F6.04_1213255_1216120_1_SPAC10F6.04_I_protein_coding_RCC|m.839 SPAC10F6.04_SPAC10F6.04_I_RCC SPAC10F6.05c_1214788_1217067_-1_ubc6_I_protein_coding_ubiquitin|m.841 SPAC10F6.05c_ubc6_I_ubiquitin SPAC10F6.06_1217077_1218228_1_vip1_I_protein_coding_RNA-binding|m.843 SPAC10F6.06_vip1_I_RNA-binding SPAC10F6.07c_1218321_1218887_-1_mug94_I_protein_coding_Schizosaccharomyces|m.844 SPAC10F6.07c_mug94_I_Schizosaccharomyces SPAC10F6.08c_1219667_1220847_-1_nht1_I_protein_coding_Ino80|m.846 SPAC10F6.08c_nht1_I_Ino80 SPAC10F6.09c_1220969_1224862_-1_psm3_I_protein_coding_mitotic|m.847 SPAC10F6.09c_psm3_I_mitotic SPAC10F6.10_1225464_1227365_1_rio1_I_protein_coding_protein|m.848 SPAC10F6.10_rio1_I_protein SPAC11D3.01c_108732_109195_-1_SPAC11D3.01c_I_protein_coding_conserved|m.52 SPAC11D3.01c_SPAC11D3.01c_I_conserved SPAC11D3.02c_109829_110455_-1_SPAC11D3.02c_I_protein_coding_ELLA|m.53 SPAC11D3.02c_SPAC11D3.02c_I_ELLA SPAC11D3.03c_110904_112499_-1_SPAC11D3.03c_I_protein_coding_conserved|m.54 SPAC11D3.03c_SPAC11D3.03c_I_conserved SPAC11D3.04c_112514_114445_-1_SPAC11D3.04c_I_protein_coding_polyketide|m.56 SPAC11D3.04c_SPAC11D3.04c_I_polyketide SPAC11D3.05_113950_115962_1_mfs2_I_protein_coding_MFS|m.58 SPAC11D3.05_mfs2_I_MFS SPAC11D3.06_116331_118189_1_SPAC11D3.06_I_protein_coding_MatE|m.65 SPAC11D3.06_SPAC11D3.06_I_MatE SPAC11D3.07c_116054_120309_-1_toe4_I_protein_coding_transcription|m.61 SPAC11D3.07c_toe4_I_transcription SPAC11D3.08c_120321_123785_-1_SPAC11D3.08c_I_protein_coding_amino|m.67 SPAC11D3.08c_SPAC11D3.08c_I_amino SPAC11D3.09_122187_124116_1_SPAC11D3.09_I_protein_coding_agmatinase|m.71 SPAC11D3.09_SPAC11D3.09_I_agmatinase 
SPAC11D3.10_124907_129053_1_SPAC11D3.10_I_protein_coding_nifs|m.74 SPAC11D3.10_SPAC11D3.10_I_nifs SPAC11D3.11c_126951_129316_-1_SPAC11D3.11c_I_protein_coding_zn(2)-C6|m.78 SPAC11D3.11c_SPAC11D3.11c_I_zn(2)-C6 SPAC11D3.13_130148_131268_1_hsp3104_I_protein_coding_ThiJ|m.80 SPAC11D3.13_hsp3104_I_ThiJ SPAC11D3.14c_131190_135736_-1_SPAC11D3.14c_I_protein_coding_5-oxoprolinase|m.81 SPAC11D3.14c_SPAC11D3.14c_I_5-oxoprolinase SPAC11D3.15_136139_140365_1_SPAC11D3.15_I_protein_coding_5-oxoprolinase|m.83 SPAC11D3.15_SPAC11D3.15_I_5-oxoprolinase SPAC11D3.16c_140381_141653_-1_SPAC11D3.16c_I_protein_coding_Schizosaccharomyces|m.86 SPAC11D3.16c_SPAC11D3.16c_I_Schizosaccharomyces SPAC11D3.17_141199_144768_1_SPAC11D3.17_I_protein_coding_transcription|m.87 SPAC11D3.17_SPAC11D3.17_I_transcription SPAC11D3.18c_144819_146935_-1_SPAC11D3.18c_I_protein_coding_plasma|m.89 SPAC11D3.18c_SPAC11D3.18c_I_plasma SPAC1296.01c_707948_710479_-1_SPAC1296.01c_I_protein_coding_phosphoacetylglucosamine|m.466 SPAC1296.01c_SPAC1296.01c_I_phosphoacetylglucosamine SPAC1296.02_711238_712354_1_cox4_I_protein_coding_cytochrome|m.468 SPAC1296.02_cox4_I_cytochrome SPAC1296.03c_712217_714070_-1_sxa2_I_protein_coding_serine|m.469 SPAC1296.03c_sxa2_I_serine SPAC1296.04_715377_716978_1_mug65_I_protein_coding_spore|m.470 SPAC1296.04_mug65_I_spore SPAC1296.05c_716874_718168_-1_lcp1_I_protein_coding_cyclin|m.472 SPAC1296.05c_lcp1_I_cyclin SPAC1296.06_719380_721549_1_tah18_I_protein_coding_NADPH-dependent|m.476 SPAC1296.06_tah18_I_NADPH-dependent SPAC12G12.01c_346795_350151_1_sea4_I_protein_coding_SEA|m.220 SPAC12G12.01c_sea4_I_SEA SPAC12G12.02_345234_347735_-1_efg1_I_protein_coding_rRNA|m.218 SPAC12G12.02_efg1_I_rRNA SPAC12G12.03_342090_345182_-1_cip2_I_protein_coding_RNA-binding|m.215 SPAC12G12.03_cip2_I_RNA-binding SPAC12G12.04_339766_342080_-1_mcp60_I_protein_coding_mitochondrial|m.213 SPAC12G12.04_mcp60_I_mitochondrial SPAC12G12.05c_338286_339763_1_taf9_I_protein_coding_SAGA|m.211 SPAC12G12.05c_taf9_I_SAGA 
SPAC12G12.06c_336308_338157_1_rcl1_I_protein_coding_rRNA|m.209 SPAC12G12.06c_rcl1_I_rRNA SPAC12G12.07c_334615_336131_1_SPAC12G12.07c_I_protein_coding_conserved|m.208 SPAC12G12.07c_SPAC12G12.07c_I_conserved SPAC12G12.08_333178_334621_-1_mrpl1602_I_protein_coding_mitochondrial|m.206 SPAC12G12.08_mrpl1602_I_mitochondrial SPAC12G12.09_329810_332816_-1_eti1_I_protein_coding_conserved|m.204 SPAC12G12.09_eti1_I_conserved SPAC12G12.10_328196_329545_-1_wdr21_I_protein_coding_WD|m.203 SPAC12G12.10_wdr21_I_WD SPAC12G12.11c_326440_328122_1_SPAC12G12.11c_I_protein_coding_DUF544|m.202 SPAC12G12.11c_SPAC12G12.11c_I_DUF544 SPAC12G12.12_324042_325517_-1_gms2_I_protein_coding_UDP-galactose|m.201 SPAC12G12.12_gms2_I_UDP-galactose SPAC12G12.13c_321764_324129_1_cid14_I_protein_coding_poly(A)|m.200 SPAC12G12.13c_cid14_I_poly(A) SPAC12G12.14c_319815_321825_1_pfs2_I_protein_coding_WD|m.198 SPAC12G12.14c_pfs2_I_WD SPAC12G12.15_316996_319185_-1_sif3_I_protein_coding_mitochondrial|m.196 SPAC12G12.15_sif3_I_mitochondrial SPAC12G12.16c_315394_317585_1_SPAC12G12.16c_I_protein_coding_Fen1|m.194 SPAC12G12.16c_SPAC12G12.16c_I_Fen1 SPAC139.02c_1019248_1020838_-1_oac1_I_protein_coding_mitochondrial|m.669 SPAC139.02c_oac1_I_mitochondrial SPAC139.03_1021695_1024135_1_toe2_I_protein_coding_transcription|m.671 SPAC139.03_toe2_I_transcription SPAC139.04c_1024002_1025903_-1_fap2_I_protein_coding_L-saccharopine|m.672 SPAC139.04c_fap2_I_L-saccharopine SPAC139.05_1027811_1029993_1_SPAC139.05_I_protein_coding_succinate-semialdehyde|m.673 SPAC139.05_SPAC139.05_I_succinate-semialdehyde SPAC139.06_1030125_1031941_1_hat1_I_protein_coding_histone|m.674 SPAC139.06_hat1_I_histone SPAC13A11.01c_570753_574417_-1_rga8_I_protein_coding_Rho-type|m.376 SPAC13A11.01c_rga8_I_Rho-type SPAC2F7.17_569550_571876_1_mrf1_I_protein_coding_mitochondrial|m.375 SPAC2F7.17_mrf1_I_mitochondrial SPAC13A11.02c_574652_577171_-1_erg11_I_protein_coding_sterol|m.378 SPAC13A11.02c_erg11_I_sterol 
SPAC13A11.03_578392_579948_1_mcp7_I_protein_coding_meiosis|m.380 SPAC13A11.03_mcp7_I_meiosis SPAC13A11.04c_579353_581553_-1_ubp8_I_protein_coding_SAGA|m.381 SPAC13A11.04c_ubp8_I_SAGA SPAC13A11.05_582273_584402_1_ysp2_I_protein_coding_peptidase|m.383 SPAC13A11.05_ysp2_I_peptidase SPAC13A11.06_585355_587495_1_SPAC13A11.06_I_protein_coding_pyruvate|m.385 SPAC13A11.06_SPAC13A11.06_I_pyruvate SPAC13C5.01c_423926_425256_-1_pre9_I_protein_coding_20S|m.283 SPAC13C5.01c_pre9_I_20S SPAC13C5.02_425631_427415_1_dre4_I_protein_coding_splicing|m.284 SPAC13C5.02_dre4_I_splicing SPAC13C5.03_427350_430121_1_tht1_I_protein_coding_nuclear|m.285 SPAC13C5.03_tht1_I_nuclear SPAC13C5.04_430056_431032_1_SPAC13C5.04_I_protein_coding_amidotransferase|m.286 SPAC13C5.04_SPAC13C5.04_I_amidotransferase SPAC13C5.05c_431367_433274_-1_SPAC13C5.05c_I_protein_coding_N-acetylglucosamine-phosphate|m.287 SPAC13C5.05c_SPAC13C5.05c_I_N-acetylglucosamine-phosphate SPAC13C5.06c_434102_435179_-1_mug121_I_protein_coding_Schizosaccharomyces|m.288 SPAC13C5.06c_mug121_I_Schizosaccharomyces SPAC13C5.07_435170_439980_1_mre11_I_protein_coding_Mre11|m.289 SPAC13C5.07_mre11_I_Mre11 SPAC13G6.01c_170489_174701_-1_rad8_I_protein_coding_ubiquitin-protein|m.110 SPAC13G6.01c_rad8_I_ubiquitin-protein SPAC13G6.02c_174865_176655_-1_rps101_I_protein_coding_40S|m.113 SPAC13G6.02c_rps101_I_40S SPAC13G6.03_175890_180028_1_gpi7_I_protein_coding_GPI|m.114 SPAC13G6.03_gpi7_I_GPI SPAC13G6.04_180272_181069_1_tim8_I_protein_coding_TIM22|m.115 SPAC13G6.04_tim8_I_TIM22 SPAC13G6.05c_180903_182254_-1_trs33_I_protein_coding_TRAPP|m.116 SPAC13G6.05c_trs33_I_TRAPP SPAC13G6.06c_182337_186358_-1_gcv2_I_protein_coding_glycine|m.117 SPAC13G6.06c_gcv2_I_glycine SPAC13G6.07c_186314_187683_-1_rps601_I_protein_coding_40S|m.118 SPAC13G6.07c_rps601_I_40S SPAC13G6.08_187701_190031_1_SPAC13G6.08_I_protein_coding_Cdc20_Fizzy|m.120 SPAC13G6.08_SPAC13G6.08_I_Cdc20_Fizzy SPAC13G6.09_190192_191947_1_SPAC13G6.09_I_protein_coding_SSU-rRNA|m.122 
SPAC13G6.09_SPAC13G6.09_I_SSU-rRNA SPAC13G6.10c_191928_194053_-1_asl1_I_protein_coding_cell|m.123 SPAC13G6.10c_asl1_I_cell SPAC13G6.11c_194099_195626_-1_erg12_I_protein_coding_mevalonate|m.124 SPAC13G6.11c_erg12_I_mevalonate SPAC13G6.12c_195940_199051_-1_chs1_I_protein_coding_chitin|m.125 SPAC13G6.12c_chs1_I_chitin SPAC13G6.13_198884_199231_1_SPAC13G6.13_I_protein_coding_Schizosaccharomyces|m.126 SPAC13G6.13_SPAC13G6.13_I_Schizosaccharomyces SPAC13G6.14_200121_201517_1_aps1_I_protein_coding_diadenosine|m.127 SPAC13G6.14_aps1_I_diadenosine SPAC13G6.15c_201729_203346_-1_SPAC13G6.15c_I_protein_coding_calcipressin|m.128 SPAC13G6.15c_SPAC13G6.15c_I_calcipressin SPAC1639.01c_251173_254600_-1_SPAC1639.01c_I_protein_coding_GNS1_SUR4|m.163 SPAC1639.01c_SPAC1639.01c_I_GNS1_SUR4 SPAC1639.02c_255881_259505_-1_trk2_I_protein_coding_potassium|m.165 SPAC1639.02c_trk2_I_potassium SPAC1687.01_903042_903861_1_rpc19_I_protein_coding_DNA-directed|m.587 SPAC1687.01_rpc19_I_DNA-directed SPAC1687.03c_905077_906465_-1_rfc4_I_protein_coding_DNA|m.591 SPAC1687.03c_rfc4_I_DNA SPAC1687.02_904026_906347_1_SPAC1687.02_I_protein_coding_CAAX|m.589 SPAC1687.02_SPAC1687.02_I_CAAX SPAC1687.04_906778_908799_1_mcb1_I_protein_coding_MCM|m.592 SPAC1687.04_mcb1_I_MCM SPAC1687.05_908736_911854_1_pli1_I_protein_coding_SUMO|m.593 SPAC1687.05_pli1_I_SUMO SPAC1687.05_908736_911854_1_pli1_I_protein_coding_SUMO|m.594 SPAC1687.06c_rpl44_I_60S SPAC1687.07_913657_914031_1_SPAC1687.07_I_protein_coding_conserved|m.598 SPAC1687.07_SPAC1687.07_I_conserved SPAC1687.08_914328_914618_1_SPAC1687.08_I_protein_coding_Schizosaccharomyces|m.599 SPAC1687.08_SPAC1687.08_I_Schizosaccharomyces SPAC1687.09_914940_919775_1_tax4_I_protein_coding_autophagy_CVT|m.600 SPAC1687.09_tax4_I_autophagy_CVT SPAC1687.10_919726_922098_1_mcp1_I_protein_coding_microtubule|m.602 SPAC1687.10_mcp1_I_microtubule SPAC1687.11_922271_925133_1_spb1_I_protein_coding_rRNA|m.603 SPAC1687.11_spb1_I_rRNA 
SPAC1687.12c_925111_926289_-1_coq4_I_protein_coding_ubiquinone|m.604 SPAC1687.12c_coq4_I_ubiquinone SPAC1687.13c_926394_927671_-1_csn5_I_protein_coding_COP9_signalosome|m.605 SPAC1687.13c_csn5_I_COP9_signalosome SPAC1687.15_929843_932197_1_gsk3_I_protein_coding_serine_threonine|m.607 SPAC1687.15_gsk3_I_serine_threonine SPAC1687.16c_932425_934021_-1_erg31_I_protein_coding_C-5|m.610 SPAC1687.16c_erg31_I_C-5 SPAC1687.17c_934941_936081_-1_SPAC1687.17c_I_protein_coding_Der1-like|m.612 SPAC1687.17c_SPAC1687.17c_I_Der1-like SPAC1687.18c_936188_938157_-1_ssl3_I_protein_coding_cohesin|m.613 SPAC1687.18c_ssl3_I_cohesin SPAC1687.19c_938311_939831_-1_qtr1_I_protein_coding_queuine|m.614 SPAC1687.19c_qtr1_I_queuine SPAC1687.20c_939770_941944_-1_mis6_I_protein_coding_inner|m.615 SPAC1687.20c_mis6_I_inner SPAC1687.21_941942_943335_1_SPAC1687.21_I_protein_coding_phosphoglycerate|m.616 SPAC1687.21_SPAC1687.21_I_phosphoglycerate SPAC1687.22c_943265_946909_-1_puf3_I_protein_coding_RNA-binding|m.617 SPAC1687.22c_puf3_I_RNA-binding SPAC1687.23c_929156_929654_-1_SPAC1687.23c_I_protein_coding_Schizosaccharomyces|m.606 SPAC1687.23c_SPAC1687.23c_I_Schizosaccharomyces SPAC16C9.01c_790245_792274_-1_SPAC16C9.01c_I_protein_coding_carbohydrate|m.519 SPAC16C9.01c_SPAC16C9.01c_I_carbohydrate SPAC16C9.02c_792521_793937_-1_SPAC16C9.02c_I_protein_coding_S-methyl-5-thioadenosine|m.520 SPAC16C9.02c_SPAC16C9.02c_I_S-methyl-5-thioadenosine SPAC16C9.03_794866_796821_1_nmd3_I_protein_coding_export|m.522 SPAC16C9.03_nmd3_I_export SPAC16C9.04c_796876_798833_-1_mot2_I_protein_coding_CCR4-Not|m.523 SPAC16C9.04c_mot2_I_CCR4-Not SPAC16C9.05_799341_800981_1_cph1_I_protein_coding_Clr6|m.525 SPAC16C9.05_cph1_I_Clr6 SPAC16C9.06c_801141_804123_-1_upf1_I_protein_coding_ATP-dependent|m.526 SPAC16C9.06c_upf1_I_ATP-dependent SPAC16C9.07_804574_807722_1_pom2_I_protein_coding_DYRK|m.527 SPAC16C9.07_pom2_I_DYRK SPAC1751.01c_377844_384751_-1_gti1_I_protein_coding_gluconate|m.245 SPAC1751.01c_gti1_I_gluconate 
SPAC1751.02c_384886_386195_-1_rsm19_I_protein_coding_mitochondrial|m.254 SPAC1751.02c_rsm19_I_mitochondrial SPAC1751.03_386266_387856_1_SPAC1751.03_I_protein_coding_translation|m.255 SPAC1751.03_SPAC1751.03_I_translation SPAC1751.04_383580_385433_1_loc1_I_protein_coding_ribosome|m.252 SPAC1751.04_loc1_I_ribosome SPAC18B11.02c_313974_315335_1_SPAC18B11.02c_I_protein_coding_tRNA|m.192 SPAC18B11.02c_SPAC18B11.02c_I_tRNA SPAC18B11.03c_311920_314040_1_SPAC18B11.03c_I_protein_coding_N-acetyltransferase|m.191 SPAC18B11.03c_SPAC18B11.03c_I_N-acetyltransferase SPAC18B11.04_310157_311712_-1_ncs1_I_protein_coding_neuronal|m.190 SPAC18B11.04_ncs1_I_neuronal SPAC18B11.06_306764_308031_-1_lcp5_I_protein_coding_U3|m.187 SPAC18B11.06_lcp5_I_U3 SPAC18B11.07c_305602_306762_1_rhp6_I_protein_coding_Rad6|m.185 SPAC18B11.07c_rhp6_I_Rad6 SPAC18B11.08c_304355_305168_1_SPAC18B11.08c_I_protein_coding_conserved|m.184 SPAC18B11.08c_SPAC18B11.08c_I_conserved SPAC18B11.09c_303004_304161_1_SPAC18B11.09c_I_protein_coding_serine|m.183 SPAC18B11.09c_SPAC18B11.09c_I_serine SPAC18B11.10_299278_301837_-1_tup11_I_protein_coding_transcriptional|m.182 SPAC18B11.10_tup11_I_transcriptional SPAC18B11.11_294591_299154_-1_SPAC18B11.11_I_protein_coding_GTPase|m.181 SPAC18B11.11_SPAC18B11.11_I_GTPase SPAC1A6.01c_1066192_1070006_-1_SPAC1A6.01c_I_protein_coding_human|m.708 SPAC1A6.01c_SPAC1A6.01c_I_human SPAC1A6.01c_1066192_1070006_-1_SPAC1A6.01c_I_protein_coding_human|m.709 SPAC1A6.02_SPAC1A6.02_I_WD SPAC23C4.19_1063729_1066954_1_spt5_I_protein_coding_DSIF|m.700 SPAC23C4.19_spt5_I_DSIF SPAC1A6.03c_1069923_1072343_-1_SPAC1A6.03c_I_protein_coding_phospholipase|m.714 SPAC1A6.03c_SPAC1A6.03c_I_phospholipase SPAC1A6.04c_1074331_1077514_-1_plb1_I_protein_coding_phospholipase|m.719 SPAC1A6.04c_plb1_I_phospholipase SPAC1A6.05c_1079635_1081713_-1_ptl3_I_protein_coding_triacylglycerol|m.725 SPAC1A6.05c_ptl3_I_triacylglycerol SPAC1A6.06c_1081916_1083616_-1_meu31_I_protein_coding_Schizosaccharomyces|m.726 
SPAC1A6.06c_meu31_I_Schizosaccharomyces SPAC1A6.07_1084068_1086426_1_sle1_I_protein_coding_eisosome|m.727 SPAC1A6.07_sle1_I_eisosome SPAC1A6.08c_1086242_1087505_-1_mug125_I_protein_coding_Schizosaccharomyces|m.729 SPAC1A6.08c_mug125_I_Schizosaccharomyces SPAC1A6.09c_1087443_1089673_-1_lag1_I_protein_coding_sphingosine|m.730 SPAC1A6.09c_lag1_I_sphingosine SPAC1A6.10_1090678_1092303_1_tcd1_I_protein_coding_tRNA|m.731 SPAC1A6.10_tcd1_I_tRNA SPAC1D4.01_639405_641280_1_tls1_I_protein_coding_splicing|m.416 SPAC1D4.01_tls1_I_splicing SPAC1D4.02c_639545_641680_-1_grh1_I_protein_coding_human|m.420 SPAC1D4.02c_grh1_I_human SPAC1D4.03c_641845_643775_-1_aut12_I_protein_coding_autophagy|m.423 SPAC1D4.03c_aut12_I_autophagy SPAC1D4.04_644667_646547_1_cct2_I_protein_coding_chaperonin-containing|m.427 SPAC1D4.04_cct2_I_chaperonin-containing SPAC1D4.05c_644623_648097_-1_SPAC1D4.05c_I_protein_coding_Erd1|m.426 SPAC1D4.05c_SPAC1D4.05c_I_Erd1 SPAC1D4.06c_648301_649393_-1_csk1_I_protein_coding_cyclin-dependent|m.428 SPAC1D4.06c_csk1_I_cyclin-dependent SPAC1D4.08_650465_652224_1_pis1_I_protein_coding_CDP-diacylglycerol--inositol|m.430 SPAC1D4.08_pis1_I_CDP-diacylglycerol--inositol SPAC1D4.09c_652225_653321_-1_rtf2_I_protein_coding_replication|m.431 SPAC1D4.09c_rtf2_I_replication SPAC1D4.10_653449_656657_1_trz1_I_protein_coding_nuclear|m.432 SPAC1D4.10_trz1_I_nuclear SPAC1D4.11c_656076_660381_-1_lkh1_I_protein_coding_dual|m.434 SPAC1D4.11c_lkh1_I_dual SPAC1D4.12_664310_667647_1_rad15_I_protein_coding_transcription|m.436 SPAC1D4.12_rad15_I_transcription SPAC1D4.13_667815_669742_1_byr1_I_protein_coding_MAP|m.438 SPAC1D4.13_byr1_I_MAP SPAC1D4.14_670203_675444_1_tho2_I_protein_coding_THO|m.439 SPAC1D4.14_tho2_I_THO SPAC1F3.01_610842_613338_1_rrp6_I_protein_coding_exosome|m.399 SPAC1F3.01_rrp6_I_exosome SPAC1F3.02c_613369_617324_-1_mkh1_I_protein_coding_MEK|m.400 SPAC1F3.02c_mkh1_I_MEK SPAC1F3.03_617816_622703_1_sro7_I_protein_coding_Lgl|m.402 SPAC1F3.03_sro7_I_Lgl 
SPAC1F3.04c_621054_622267_-1_tsr3_I_protein_coding_SSU-rRNA|m.404 SPAC1F3.04c_tsr3_I_SSU-rRNA SPAC1F3.05_623091_625407_1_gga21_I_protein_coding_Golgi|m.406 SPAC1F3.05_gga21_I_Golgi SPAC1F3.06c_625173_631401_-1_spo15_I_protein_coding_sporulation|m.407 SPAC1F3.06c_spo15_I_sporulation SPAC1F3.07c_631511_633102_-1_rsc58_I_protein_coding_RSC|m.410 SPAC1F3.07c_rsc58_I_RSC SPAC1F3.09_633652_636959_1_mug161_I_protein_coding_CwfJ|m.412 SPAC1F3.09_mug161_I_CwfJ SPAC1F3.10c_634898_639430_-1_oct1_I_protein_coding_mitochondrial|m.413 SPAC1F3.10c_oct1_I_mitochondrial SPAC1F5.02_291979_293771_-1_pdi1_I_protein_coding_protein|m.180 SPAC1F5.02_pdi1_I_protein SPAC1F5.03c_289790_291927_1_SPAC1F5.03c_I_protein_coding_FAD-dependent|m.179 SPAC1F5.03c_SPAC1F5.03c_I_FAD-dependent SPAC1F5.04c_283287_289200_1_cdc12_I_protein_coding_formin|m.176 SPAC1F5.04c_cdc12_I_formin SPAC1F5.05c_281774_282745_1_mso1_I_protein_coding_endocytic|m.175 SPAC1F5.05c_mso1_I_endocytic SPAC1F5.06_276657_281347_-1_lsh1_I_protein_coding_ER|m.172 SPAC1F5.06_lsh1_I_ER SPAC1F5.06_276657_281347_-1_lsh1_I_protein_coding_ER|m.173 SPAC1F5.07c_hem14_I_protoporphyrinogen SPAC1F5.08c_275089_276661_1_yam8_I_protein_coding_stretch-activated|m.171 SPAC1F5.08c_yam8_I_stretch-activated SPAC1F5.09c_273152_274921_1_shk2_I_protein_coding_PAK-related|m.169 SPAC1F5.09c_shk2_I_PAK-related SPAC1F5.10_270893_272610_-1_SPAC1F5.10_I_protein_coding_ATP-dependent|m.167 SPAC1F5.10_SPAC1F5.10_I_ATP-dependent SPAC1F5.11c_259603_271053_1_tra2_I_protein_coding_NuA4|m.166 SPAC1F5.11c_tra2_I_NuA4 SPAC1F8.01_82746_84786_1_ght3_I_protein_coding_hexose|m.34 SPAC1F8.01_ght3_I_hexose SPAC1F8.02c_85566_86324_-1_shu1_I_protein_coding_heme|m.35 SPAC1F8.02c_shu1_I_heme SPAC1F8.03c_88201_90300_-1_str3_I_protein_coding_siderophore-iron|m.37 SPAC1F8.03c_str3_I_siderophore-iron SPAC1F8.04c_92387_93931_-1_SPAC1F8.04c_I_protein_coding_hydrolase|m.38 SPAC1F8.04c_SPAC1F8.04c_I_hydrolase SPAC1F8.05_95961_96966_1_isp3_I_protein_coding_Schizosaccharomyces|m.42 
SPAC1F8.05_isp3_I_Schizosaccharomyces SPAC1F8.06_99871_101431_1_fta5_I_protein_coding_cell|m.45 SPAC1F8.06_fta5_I_cell SPAC1F8.07c_101715_103594_-1_SPAC1F8.07c_I_protein_coding_pyruvate|m.47 SPAC1F8.07c_SPAC1F8.07c_I_pyruvate SPAC1F8.08_103941_104953_1_SPAC1F8.08_I_protein_coding_Schizosaccharomyces|m.51 SPAC1F8.08_SPAC1F8.08_I_Schizosaccharomyces SPAC212.01c_28738_29657_1_SPAC212.01c_I_protein_coding_S.|m.10 SPAC212.01c_SPAC212.01c_I_S. SPAC212.02_27353_27763_-1_SPAC212.02_I_protein_coding_Schizosaccharomyces|m.9 SPAC212.02_SPAC212.02_I_Schizosaccharomyces SPAC212.03_23589_24054_-1_SPAC212.03_I_protein_coding_hypothetical|m.8 SPAC212.03_SPAC212.03_I_hypothetical SPAC212.04c_21381_23050_1_SPAC212.04c_I_protein_coding_S.|m.7 SPAC212.04c_SPAC212.04c_I_S. SPAC212.06c_18042_18974_1_SPAC212.06c_I_protein_coding_DNA|m.6 SPAC212.06c_SPAC212.06c_I_DNA SPAC212.08c_11784_12994_1_SPAC212.08c_I_protein_coding_S.|m.4 SPAC212.08c_SPAC212.08c_I_S. SPAC212.11_1_5662_-1_tlh1_I_protein_coding_RecQ|m.1 SPAC212.11_tlh1_I_RecQ SPAC212.12_15855_16226_1_SPAC212.12_I_protein_coding_S.|m.5 SPAC212.12_SPAC212.12_I_S. 
SPAC222.03c_947876_948800_-1_tim10_I_protein_coding_Tim9-Tim10|m.618 SPAC222.03c_tim10_I_Tim9-Tim10 SPAC222.04c_950120_950813_-1_ies6_I_protein_coding_Ino80|m.620 SPAC222.04c_ies6_I_Ino80 SPAC222.05c_950912_953006_-1_mss1_I_protein_coding_mitochondrial|m.621 SPAC222.05c_mss1_I_mitochondrial SPAC222.06_953095_954325_1_mak16_I_protein_coding_nuclear|m.624 SPAC222.06_mak16_I_nuclear SPAC222.07c_954279_956707_-1_hri2_I_protein_coding_eIF2|m.626 SPAC222.07c_hri2_I_eIF2 SPAC222.08c_957367_958774_-1_sno1_I_protein_coding_glutamine|m.627 SPAC222.08c_sno1_I_glutamine SPAC222.09_959867_962227_1_seb1_I_protein_coding_RNA-binding|m.629 SPAC222.09_seb1_I_RNA-binding SPAC222.10c_962314_964867_-1_byr4_I_protein_coding_two-component|m.632 SPAC222.10c_byr4_I_two-component SPAC222.11_966164_967591_1_hem13_I_protein_coding_coproporphyrinogen|m.637 SPAC222.11_hem13_I_coproporphyrinogen SPAC222.12c_968507_970412_-1_atp2_I_protein_coding_F1-ATPase|m.641 SPAC222.12c_atp2_I_F1-ATPase SPAC222.13c_970875_973548_-1_SPAC222.13c_I_protein_coding_6-phosphofructo-2-kinase|m.643 SPAC222.13c_SPAC222.13c_I_6-phosphofructo-2-kinase SPAC222.14c_973843_976782_-1_sey1_I_protein_coding_GTP|m.644 SPAC222.14c_sey1_I_GTP SPAC222.15_977709_978637_1_meu13_I_protein_coding_Tat|m.645 SPAC222.15_meu13_I_Tat SPAC222.16c_979482_981161_-1_csn3_I_protein_coding_COP9_signalosome|m.647 SPAC222.16c_csn3_I_COP9_signalosome SPAC222.17_967583_968302_-1_SPAC222.17_I_protein_coding_conserved|m.640 SPAC222.17_SPAC222.17_I_conserved SPAC222.18_978722_979643_1_SPAC222.18_I_protein_coding_Srp1|m.646 SPAC222.18_SPAC222.18_I_Srp1 SPAC222.19_949646_950047_1_tam1_I_protein_coding_Schizosaccharomyces|m.619 SPAC222.19_tam1_I_Schizosaccharomyces SPAC227.01c_498878_500674_-1_erd1_I_protein_coding_Erd1|m.323 SPAC227.01c_erd1_I_Erd1 SPAC227.02c_501751_502444_-1_rrp15_I_protein_coding_rRNA|m.325 SPAC227.02c_rrp15_I_rRNA SPAC227.03c_502577_504324_-1_yea6_I_protein_coding_mitochondrial|m.326 SPAC227.03c_yea6_I_mitochondrial 
SPAC227.04_504835_505775_1_atg10_I_protein_coding_Atg12|m.327 SPAC227.04_atg10_I_Atg12 SPAC227.05_505902_506355_1_gim3_I_protein_coding_prefoldin|m.328 SPAC227.05_gim3_I_prefoldin SPAC227.06_506520_507605_1_yip5_I_protein_coding_Rab|m.329 SPAC227.06_yip5_I_Rab SPAC227.07c_507522_509960_-1_pab1_I_protein_coding_protein|m.330 SPAC227.07c_pab1_I_protein SPAC227.08c_510410_511433_-1_yth1_I_protein_coding_mRNA|m.331 SPAC227.08c_yth1_I_mRNA SPAC227.09_511350_513382_1_fol3_I_protein_coding_folylpolyglutamate|m.332 SPAC227.09_fol3_I_folylpolyglutamate SPAC227.11c_513967_517252_-1_yos9_I_protein_coding_sensor|m.338 SPAC227.11c_yos9_I_sensor SPAC227.10_513820_514921_1_gim4_I_protein_coding_prefoldin|m.336 SPAC227.10_gim4_I_prefoldin SPAC227.12_515661_517504_1_rna4_I_protein_coding_U4_U6|m.341 SPAC227.12_rna4_I_U4_U6 SPAC227.13c_517416_519017_-1_isu1_I_protein_coding_mitochondrial|m.342 SPAC227.13c_isu1_I_mitochondrial SPAC227.14_520174_522766_1_yfh7_I_protein_coding_uridine|m.343 SPAC227.14_yfh7_I_uridine SPAC227.15_523097_526412_1_reg1_I_protein_coding_protein|m.345 SPAC227.15_reg1_I_protein SPAC227.16c_527782_528906_-1_psf3_I_protein_coding_GINS|m.349 SPAC227.16c_psf3_I_GINS SPAC227.17c_529167_530275_-1_SPAC227.17c_I_protein_coding_conserved|m.350 SPAC227.17c_SPAC227.17c_I_conserved SPAC227.18_530261_531981_1_lys3_I_protein_coding_saccharopine|m.351 SPAC227.18_lys3_I_saccharopine SPAC227.19c_501117_501485_-1_SPAC227.19c_I_protein_coding_conserved|m.324 SPAC227.19c_SPAC227.19c_I_conserved SPAC22A12.01c_1156487_1159594_-1_pso2_I_protein_coding_DNA|m.785 SPAC22A12.01c_pso2_I_DNA SPAC22A12.02c_1159626_1160000_-1_mug103_I_protein_coding_Schizosaccharomyces|m.786 SPAC22A12.02c_mug103_I_Schizosaccharomyces SPAC22A12.03c_1160118_1161595_-1_csn4_I_protein_coding_COP9_signalosome|m.787 SPAC22A12.03c_csn4_I_COP9_signalosome SPAC22A12.04c_1162203_1162901_-1_rps2201_I_protein_coding_40S|m.788 SPAC22A12.04c_rps2201_I_40S 
SPAC22A12.05_1163057_1163522_1_rpc11_I_protein_coding_DNA-directed|m.789 SPAC22A12.05_rpc11_I_DNA-directed SPAC22A12.06c_1163745_1165581_-1_SPAC22A12.06c_I_protein_coding_serine|m.791 SPAC22A12.06c_SPAC22A12.06c_I_serine SPAC22A12.07c_1166562_1169743_-1_ogm1_I_protein_coding_protein|m.794 SPAC22A12.07c_ogm1_I_protein SPAC22A12.08c_1170196_1172171_-1_SPAC22A12.08c_I_protein_coding_cardiolipin|m.796 SPAC22A12.08c_SPAC22A12.08c_I_cardiolipin SPAC22A12.09c_1172351_1174497_-1_sap114_I_protein_coding_U2|m.801 SPAC22A12.09c_sap114_I_U2 SPAC22A12.10_1172209_1176801_1_ept1_I_protein_coding_diacylglycerol|m.797 SPAC22A12.10_ept1_I_diacylglycerol SPAC22A12.11_1176703_1178897_1_dak1_I_protein_coding_dihydroxyacetone|m.802 SPAC22A12.11_dak1_I_dihydroxyacetone SPAC22A12.12c_1178856_1180072_-1_rrp40_I_protein_coding_exosome|m.805 SPAC22A12.12c_rrp40_I_exosome SPAC22A12.13_1180184_1181157_1_mug84_I_protein_coding_pig-P|m.806 SPAC22A12.13_mug84_I_pig-P SPAC22A12.14c_1180999_1182528_-1_SPAC22A12.14c_I_protein_coding_BSD|m.807 SPAC22A12.14c_SPAC22A12.14c_I_BSD SPAC22A12.15c_1182693_1185497_-1_bip1_I_protein_coding_ER|m.808 SPAC22A12.15c_bip1_I_ER SPAC22A12.16_1186205_1187928_1_SPAC22A12.16_I_protein_coding_ATP-citrate|m.815 SPAC22A12.16_SPAC22A12.16_I_ATP-citrate SPAC22A12.17c_1185837_1189506_-1_SPAC22A12.17c_I_protein_coding_short|m.810 SPAC22A12.17c_SPAC22A12.17c_I_short SPAC22F3.02_705042_708014_-1_atf31_I_protein_coding_transcription|m.462 SPAC22F3.02_atf31_I_transcription SPAC22F3.03c_703669_707990_1_rdh54_I_protein_coding_ATP-dependent|m.460 SPAC22F3.03c_rdh54_I_ATP-dependent SPAC22F3.04_697960_702755_-1_mug62_I_protein_coding_AMP|m.458 SPAC22F3.04_mug62_I_AMP SPAC22F3.05c_697191_703040_1_alp41_I_protein_coding_GTP-binding|m.457 SPAC22F3.05c_alp41_I_GTP-binding SPAC22F3.06c_693514_697130_1_lon1_I_protein_coding_Lon|m.454 SPAC22F3.06c_lon1_I_Lon SPAC22F3.07c_691472_692077_1_atp20_I_protein_coding_F0-ATPase|m.452 SPAC22F3.07c_atp20_I_F0-ATPase 
SPAC22F3.08c_689345_691122_1_rok1_I_protein_coding_ATP-dependent|m.450 SPAC22F3.08c_rok1_I_ATP-dependent SPAC22F3.09c_686543_689179_1_res2_I_protein_coding_MBF|m.448 SPAC22F3.09c_res2_I_MBF SPAC22F3.10c_683990_686347_1_gcs1_I_protein_coding_glutamate-cysteine|m.447 SPAC22F3.10c_gcs1_I_glutamate-cysteine SPAC22F3.11c_682835_683660_1_snu23_I_protein_coding_U4_U6|m.446 SPAC22F3.11c_snu23_I_U4_U6 SPAC22F3.12c_679062_681890_1_rgs1_I_protein_coding_regulator|m.445 SPAC22F3.12c_rgs1_I_regulator SPAC22F3.13_673984_678307_-1_tsc1_I_protein_coding_hamartin|m.441 SPAC22F3.13_tsc1_I_hamartin SPAC22F3.15_692567_693061_1_SPAC22F3.15_I_protein_coding_GatB_YqeY|m.453 SPAC22F3.15_SPAC22F3.15_I_GatB_YqeY SPAC22G7.01c_725865_728242_-1_fra1_I_protein_coding_iron|m.479 SPAC22G7.01c_fra1_I_iron SPAC22G7.02_728335_731867_1_kap111_I_protein_coding_karyopherin|m.482 SPAC22G7.02_kap111_I_karyopherin SPAC22G7.03_731933_732759_1_SPAC22G7.03_I_protein_coding_Schizosaccharomyces|m.483 SPAC22G7.03_SPAC22G7.03_I_Schizosaccharomyces SPAC22G7.04_732826_736603_1_pan2_I_protein_coding_ubiquitin|m.484 SPAC22G7.04_pan2_I_ubiquitin SPAC22G7.05_736722_738782_1_kri1_I_protein_coding_ribosome|m.485 SPAC22G7.05_kri1_I_ribosome SPAC22G7.06c_739167_746117_-1_ura1_I_protein_coding_carbamoyl-phosphate|m.486 SPAC22G7.06c_ura1_I_carbamoyl-phosphate SPAC22G7.07c_746537_748971_-1_ime4_I_protein_coding_mRNA|m.489 SPAC22G7.07c_ime4_I_mRNA SPAC22G7.08_749523_751846_1_ppk8_I_protein_coding_serine_threonine|m.490 SPAC22G7.08_ppk8_I_serine_threonine SPAC22G7.09c_751647_753492_-1_nup45_I_protein_coding_nucleoporin|m.491 SPAC22G7.09c_nup45_I_nucleoporin SPAC22G7.10_753624_755676_1_iss1_I_protein_coding_mRNA|m.492 SPAC22G7.10_iss1_I_mRNA SPAC22G7.10_753624_755676_1_iss1_I_protein_coding_mRNA|m.493 SPAC22G7.11c_cum1_I_conserved SPAC22H12.01c_893278_894532_-1_mug35_I_protein_coding_Schizosaccharomyces|m.578 SPAC22H12.01c_mug35_I_Schizosaccharomyces SPAC22H12.02_893996_896547_1_tfg3_I_protein_coding_transcription|m.579 
SPAC22H12.02_tfg3_I_transcription SPAC22H12.03_896668_897900_1_SPAC22H12.03_I_protein_coding_mitochondrial|m.581 SPAC22H12.03_SPAC22H12.03_I_mitochondrial SPAC22H12.04c_898045_898994_-1_rps102_I_protein_coding_40S|m.582 SPAC22H12.04c_rps102_I_40S SPAC22H12.05c_899283_902080_-1_fsc1_I_protein_coding_fasciclin|m.585 SPAC22H12.05c_fsc1_I_fasciclin SPAC23C4.02_1032085_1034167_1_crn1_I_protein_coding_actin|m.675 SPAC23C4.02_crn1_I_actin SPAC23C4.03_1034296_1035992_1_hrk1_I_protein_coding_haspin|m.677 SPAC23C4.03_hrk1_I_haspin SPAC23C4.04c_1036033_1036508_1_SPAC23C4.04c_I_protein_coding_Schizosaccharomyces|m.678 SPAC23C4.04c_SPAC23C4.04c_I_Schizosaccharomyces SPAC23C4.05c_1036639_1038267_-1_SPAC23C4.05c_I_protein_coding_LEA|m.679 SPAC23C4.05c_SPAC23C4.05c_I_LEA SPAC23C4.08_1041414_1043083_1_rho3_I_protein_coding_Rho|m.685 SPAC23C4.08_rho3_I_Rho SPAC23C4.09c_1041980_1044240_-1_SPAC23C4.09c_I_protein_coding_DNA-binding|m.687 SPAC23C4.09c_SPAC23C4.09c_I_DNA-binding SPAC23C4.10_1044844_1046788_1_sec2_I_protein_coding_guanyl-nucleotide|m.688 SPAC23C4.10_sec2_I_guanyl-nucleotide SPAC23C4.12_1048957_1051136_1_hhp2_I_protein_coding_serine_threonine|m.689 SPAC23C4.12_hhp2_I_serine_threonine SPAC23C4.13_1051665_1052724_1_bet1_I_protein_coding_SNARE|m.690 SPAC23C4.13_bet1_I_SNARE SPAC23C4.14_1052875_1054468_1_alg1_I_protein_coding_mannosyltransferase|m.691 SPAC23C4.14_alg1_I_mannosyltransferase SPAC23C4.15_1054665_1055906_1_rpb5_I_protein_coding_DNA-directed|m.692 SPAC23C4.15_rpb5_I_DNA-directed SPAC23C4.16c_1055849_1057578_-1_atg15_I_protein_coding_autophagy|m.693 SPAC23C4.16c_atg15_I_autophagy SPAC23C4.17_1057701_1061166_1_trm402_I_protein_coding_tRNA|m.694 SPAC23C4.17_trm402_I_tRNA SPAC23C4.18c_1058646_1063306_-1_rad4_I_protein_coding_BRCT|m.696 SPAC23C4.18c_rad4_I_BRCT SPAC23E2.01_442201_445721_1_fep1_I_protein_coding_iron-sensing|m.291 SPAC23E2.01_fep1_I_iron-sensing SPAC23E2.02_446491_450726_1_lsd2_I_protein_coding_histone|m.292 SPAC23E2.02_lsd2_I_histone 
SPAC23E2.03c_450860_453603_-1_ste7_I_protein_coding_arrestin|m.293 SPAC23E2.03c_ste7_I_arrestin SPAC23G3.01_850591_854385_1_rpb2_I_protein_coding_RNA|m.556 SPAC23G3.01_rpb2_I_RNA SPAC23G3.02c_854453_869704_-1_sib1_I_protein_coding_ferrichrome|m.559 SPAC23G3.02c_sib1_I_ferrichrome SPAC23G3.03_870740_872773_1_sib2_I_protein_coding_ornithine|m.560 SPAC23G3.03_sib2_I_ornithine SPAC23G3.04_872883_874248_1_ies4_I_protein_coding_Ino80|m.562 SPAC23G3.04_ies4_I_Ino80 SPAC23G3.05c_874160_875763_-1_SPAC23G3.05c_I_protein_coding_regulator|m.564 SPAC23G3.05c_SPAC23G3.05c_I_regulator SPAC23G3.06_876862_878930_1_nop58_I_protein_coding_U3|m.565 SPAC23G3.06_nop58_I_U3 SPAC23G3.07c_879147_880546_-1_snf30_I_protein_coding_SWI_SNF|m.567 SPAC23G3.07c_snf30_I_SWI_SNF SPAC23G3.08c_880660_884231_-1_ubp7_I_protein_coding_ubiquitin|m.568 SPAC23G3.08c_ubp7_I_ubiquitin SPAC23G3.09_884365_885989_1_taf4_I_protein_coding_transcription|m.570 SPAC23G3.09_taf4_I_transcription SPAC23G3.10c_884513_887531_-1_ssr3_I_protein_coding_SWI_SNF|m.571 SPAC23G3.10c_ssr3_I_SWI_SNF SPAC23G3.11_885944_889096_1_rpn6_I_protein_coding_19S|m.573 SPAC23G3.11_rpn6_I_19S SPAC23G3.12c_889058_892211_-1_SPAC23G3.12c_I_protein_coding_serine|m.575 SPAC23G3.12c_SPAC23G3.12c_I_serine SPAC24B11.05_204386_206081_1_SPAC24B11.05_I_protein_coding_pyrimidine|m.129 SPAC24B11.05_SPAC24B11.05_I_pyrimidine SPAC24B11.06c_206476_208044_-1_sty1_I_protein_coding_MAP|m.130 SPAC24B11.06c_sty1_I_MAP SPAC24B11.07c_208839_211275_-1_SPAC24B11.07c_I_protein_coding_oxidoreductase|m.131 SPAC24B11.07c_SPAC24B11.07c_I_oxidoreductase SPAC24B11.08c_211714_213591_-1_SPAC24B11.08c_I_protein_coding_COPII-coated|m.133 SPAC24B11.08c_SPAC24B11.08c_I_COPII-coated SPAC24B11.09_214093_216962_1_mpc2_I_protein_coding_mitochondrial|m.136 SPAC24B11.09_mpc2_I_mitochondrial SPAC24B11.10c_218260_221562_-1_cfh1_I_protein_coding_chitin|m.138 SPAC24B11.10c_cfh1_I_chitin SPAC24B11.11c_221694_223991_-1_sid2_I_protein_coding_NDR|m.139 SPAC24B11.11c_sid2_I_NDR 
SPAC24B11.12c_224080_229307_-1_SPAC24B11.12c_I_protein_coding_P-type|m.142 SPAC24B11.12c_SPAC24B11.12c_I_P-type SPAC24B11.13_231311_233488_1_hem3_I_protein_coding_hydroxymethylbilane|m.148 SPAC24B11.13_hem3_I_hydroxymethylbilane SPAC806.02c_233032_235164_-1_SPAC806.02c_I_protein_coding_Par|m.152 SPAC806.02c_SPAC806.02c_I_Par SPAC24B11.14_230545_231136_1_SPAC24B11.14_I_protein_coding_dubious|m.147 SPAC24B11.14_SPAC24B11.14_I_dubious SPAC24H6.01c_489871_492181_1_SPAC24H6.01c_I_protein_coding_membrane|m.318 SPAC24H6.01c_SPAC24H6.01c_I_membrane SPAC24H6.02c_488339_489482_1_tim15_I_protein_coding_TIM23|m.317 SPAC24H6.02c_tim15_I_TIM23 SPAC24H6.03_485723_488811_-1_cul3_I_protein_coding_cullin|m.316 SPAC24H6.03_cul3_I_cullin SPAC24H6.04_482607_485408_-1_hxk1_I_protein_coding_hexokinase|m.315 SPAC24H6.04_hxk1_I_hexokinase SPAC24H6.05_479228_482556_-1_cdc25_I_protein_coding_M|m.311 SPAC24H6.05_cdc25_I_M SPAC24H6.06_476474_478803_-1_sld3_I_protein_coding_DNA|m.309 SPAC24H6.06_sld3_I_DNA SPAC24H6.07_475354_476128_-1_rps901_I_protein_coding_40S|m.307 SPAC24H6.07_rps901_I_40S SPAC24H6.08_473792_475041_-1_SPAC24H6.08_I_protein_coding_Schizosaccharomyces|m.306 SPAC24H6.08_SPAC24H6.08_I_Schizosaccharomyces SPAC24H6.09_469981_472993_-1_gef1_I_protein_coding_Cdc42|m.304 SPAC24H6.09_gef1_I_Cdc42 SPAC24H6.10c_468664_469890_1_SPAC24H6.10c_I_protein_coding_phospho-2-dehydro-3-deoxyheptonate|m.303 SPAC24H6.10c_SPAC24H6.10c_I_phospho-2-dehydro-3-deoxyheptonate SPAC24H6.11c_464120_468581_1_SPAC24H6.11c_I_protein_coding_sulfate|m.301 SPAC24H6.11c_SPAC24H6.11c_I_sulfate SPAC24H6.12c_461686_463599_1_uba3_I_protein_coding_NEDD8|m.299 SPAC24H6.12c_uba3_I_NEDD8 SPAC24H6.13_456931_460811_-1_SPAC24H6.13_I_protein_coding_DUF221|m.296 SPAC24H6.13_SPAC24H6.13_I_DUF221 SPAC2F7.02c_531794_533731_-1_psr1_I_protein_coding_NLI|m.352 SPAC2F7.02c_psr1_I_NLI SPAC2F7.03c_534120_537869_-1_pom1_I_protein_coding_DYRK|m.353 SPAC2F7.03c_pom1_I_DYRK SPAC2F7.04_537888_540012_1_pmc2_I_protein_coding_mediator|m.356 
SPAC2F7.04_pmc2_I_mediator SPAC2F7.05c_539919_541640_-1_tif5_I_protein_coding_translation|m.357 SPAC2F7.05c_tif5_I_translation SPAC2F7.06c_541576_543735_-1_pol4_I_protein_coding_DNA|m.359 SPAC2F7.06c_pol4_I_DNA SPAC2F7.07c_544127_546240_-1_cph2_I_protein_coding_Clr6|m.361 SPAC2F7.07c_cph2_I_Clr6 SPAC2F7.08c_546664_548562_-1_snf5_I_protein_coding_SWI_SNF|m.363 SPAC2F7.08c_snf5_I_SWI_SNF SPAC2F7.09c_548768_550726_-1_gep3_I_protein_coding_mitochondrial|m.364 SPAC2F7.09c_gep3_I_mitochondrial SPAC2F7.10_550630_553595_1_akr1_I_protein_coding_palmitoyltransferase|m.365 SPAC2F7.10_akr1_I_palmitoyltransferase SPAC2F7.11_555277_559051_1_nrd1_I_protein_coding_RNA-binding|m.366 SPAC2F7.11_nrd1_I_RNA-binding SPAC2F7.13c_558909_560549_-1_wrs1_I_protein_coding_cytoplasmic|m.369 SPAC2F7.13c_wrs1_I_cytoplasmic SPAC2F7.14c_560824_562179_-1_rrp4_I_protein_coding_exosome|m.370 SPAC2F7.14c_rrp4_I_exosome SPAC2F7.15_563698_565073_1_rsm24_I_protein_coding_mitochondrial|m.371 SPAC2F7.15_rsm24_I_mitochondrial SPAC2F7.16c_565035_569485_-1_pld1_I_protein_coding_phospholipase|m.372 SPAC2F7.16c_pld1_I_phospholipase SPAC2G11.02_807894_812194_1_urb2_I_protein_coding_ribosome|m.528 SPAC2G11.02_urb2_I_ribosome SPAC2G11.03c_811443_814228_-1_vps45_I_protein_coding_vacuolar|m.530 SPAC2G11.03c_vps45_I_vacuolar SPAC2G11.04_814218_815490_1_SPAC2G11.04_I_protein_coding_RNA-binding|m.533 SPAC2G11.04_SPAC2G11.04_I_RNA-binding SPAC2G11.05c_815388_817984_-1_rim20_I_protein_coding_BRO1|m.534 SPAC2G11.05c_rim20_I_BRO1 SPAC2G11.06_817996_819739_1_vps4_I_protein_coding_AAA|m.535 SPAC2G11.06_vps4_I_AAA SPAC2G11.07c_819768_821920_-1_ptc3_I_protein_coding_protein|m.536 SPAC2G11.07c_ptc3_I_protein SPAC2G11.08c_822092_823278_-1_smn1_I_protein_coding_SMN|m.538 SPAC2G11.08c_smn1_I_SMN SPAC2G11.09_823493_826399_1_SPAC2G11.09_I_protein_coding_calcium|m.539 SPAC2G11.09_SPAC2G11.09_I_calcium SPAC2G11.10c_826313_828123_-1_uba42_I_protein_coding_thiosulfate|m.540 SPAC2G11.10c_uba42_I_thiosulfate 
SPAC2G11.11c_828321_831629_-1_prh1_I_protein_coding_ATP-dependent|m.541 SPAC2G11.11c_prh1_I_ATP-dependent SPAC2G11.12_831918_836094_1_rqh1_I_protein_coding_RecQ|m.542 SPAC2G11.12_rqh1_I_RecQ SPAC2G11.13_836206_838256_1_atg22_I_protein_coding_vacuolar|m.544 SPAC2G11.13_atg22_I_vacuolar SPAC2G11.14_838228_841562_1_taf111_I_protein_coding_transcription|m.545 SPAC2G11.14_taf111_I_transcription SPAC2G11.15c_841471_842624_-1_tgs1_I_protein_coding_rRNA|m.547 SPAC2G11.15c_tgs1_I_rRNA SPAC30D11.01c_1119880_1123773_1_gto2_I_protein_coding_alpha-glucosidase|m.752 SPAC30D11.01c_gto2_I_alpha-glucosidase SPAC30D11.02c_1118926_1119763_1_SPAC30D11.02c_I_protein_coding_Schizosaccharomyces|m.751 SPAC30D11.02c_SPAC30D11.02c_I_Schizosaccharomyces SPAC30D11.03_1115899_1118412_-1_ddx27_I_protein_coding_ATP-dependent|m.749 SPAC30D11.03_ddx27_I_ATP-dependent SPAC30D11.04c_1112170_1115868_1_nup124_I_protein_coding_nucleoporin|m.743 SPAC30D11.04c_nup124_I_nucleoporin SPAC30D11.06c_1108485_1110686_1_hfl1_I_protein_coding_Lazarus1|m.740 SPAC30D11.06c_hfl1_I_Lazarus1 SPAC30D11.05_1109349_1111221_-1_aps3_I_protein_coding_AP-3|m.742 SPAC30D11.05_aps3_I_AP-3 SPAC30D11.07_1106430_1107885_-1_nth1_I_protein_coding_DNA|m.739 SPAC30D11.07_nth1_I_DNA SPAC30D11.08c_1104753_1106608_1_phf2_I_protein_coding_Lsd1_2|m.738 SPAC30D11.08c_phf2_I_Lsd1_2 SPAC30D11.09_1101685_1103890_-1_cwf19_I_protein_coding_complexed|m.737 SPAC30D11.09_cwf19_I_complexed SPAC30D11.10_1099489_1101583_-1_rad52_I_protein_coding_DNA|m.736 SPAC30D11.10_rad52_I_DNA SPAC30D11.11_1097449_1099554_-1_SPAC30D11.11_I_protein_coding_Haemolysin-III|m.735 SPAC30D11.11_SPAC30D11.11_I_Haemolysin-III SPAC30D11.13_1094262_1095547_-1_hus5_I_protein_coding_SUMO|m.734 SPAC30D11.13_hus5_I_SUMO SPAC30D11.14c_1092387_1094379_1_SPAC30D11.14c_I_protein_coding_RNA-binding|m.732 SPAC30D11.14c_SPAC30D11.14c_I_RNA-binding SPAC31A2.02_388233_389229_1_trm112_I_protein_coding_protein|m.256 SPAC31A2.02_trm112_I_protein 
SPAC31A2.03_389391_390520_1_mrp11_I_protein_coding_mitochondrial|m.257 SPAC31A2.03_mrp11_I_mitochondrial SPAC31A2.04c_390407_391260_-1_pre1_I_protein_coding_20S|m.258 SPAC31A2.04c_pre1_I_20S SPAC31A2.07c_399462_402266_-1_dbp10_I_protein_coding_ATP-dependent|m.267 SPAC31A2.07c_dbp10_I_ATP-dependent SPAC31A2.06_397426_402487_1_atp25_I_protein_coding_mitochondrial|m.263 SPAC31A2.06_atp25_I_mitochondrial SPAC31A2.08_402841_403862_1_mrp20_I_protein_coding_mitochondrial|m.270 SPAC31A2.08_mrp20_I_mitochondrial SPAC31A2.09c_402719_405389_-1_apm4_I_protein_coding_AP-2|m.268 SPAC31A2.09c_apm4_I_AP-2 SPAC31A2.10_405582_407710_1_SPAC31A2.10_I_protein_coding_Ran|m.271 SPAC31A2.10_SPAC31A2.10_I_Ran SPAC31A2.11c_407714_409872_-1_cuf1_I_protein_coding_nutritional|m.272 SPAC31A2.11c_cuf1_I_nutritional SPAC31A2.12_411651_414448_1_rod1_I_protein_coding_arrestin_PY|m.274 SPAC31A2.12_rod1_I_arrestin_PY SPAC31A2.13c_414245_414930_-1_sft1_I_protein_coding_SNARE|m.276 SPAC31A2.13c_sft1_I_SNARE SPAC31A2.14_414942_418504_1_bun107_I_protein_coding_WD|m.277 SPAC31A2.14_bun107_I_WD SPAC31A2.15c_417823_419996_-1_dcc1_I_protein_coding_Ctf18|m.279 SPAC31A2.15c_dcc1_I_Ctf18 SPAC31A2.16_419958_423991_1_gef2_I_protein_coding_RhoGEF|m.282 SPAC31A2.16_gef2_I_RhoGEF SPAC3H8.02_588543_590751_1_csr102_I_protein_coding_sec14|m.387 SPAC3H8.02_csr102_I_sec14 SPAC3H8.03_590691_592152_1_img2_I_protein_coding_mitochondrial|m.388 SPAC3H8.03_img2_I_mitochondrial SPAC3H8.04_592226_593906_1_SPAC3H8.04_I_protein_coding_possible|m.389 SPAC3H8.04_SPAC3H8.04_I_possible SPAC3H8.05c_593901_597586_-1_mms1_I_protein_coding_E3|m.390 SPAC3H8.05c_mms1_I_E3 SPAC3H8.06_598473_600805_1_aur1_I_protein_coding_inositol|m.391 SPAC3H8.06_aur1_I_inositol SPAC3H8.07c_600826_601749_-1_pac10_I_protein_coding_prefoldin|m.394 SPAC3H8.07c_pac10_I_prefoldin SPAC3H8.08c_601848_603993_-1_SPAC3H8.08c_I_protein_coding_transcription|m.395 SPAC3H8.08c_SPAC3H8.08c_I_transcription SPAC3H8.09c_604312_607742_-1_nab3_I_protein_coding_poly(A)|m.397 
SPAC3H8.09c_nab3_I_poly(A) SPAC3H8.10_608893_610703_1_spo20_I_protein_coding_sec14|m.398 SPAC3H8.10_spo20_I_sec14 SPAC4C5.01_1192210_1193756_1_SPAC4C5.01_I_protein_coding_pseudouridine-5'-phosphatase|m.818 SPAC4C5.01_SPAC4C5.01_I_pseudouridine-5'-phosphatase SPAC4C5.02c_1192702_1195167_-1_ryh1_I_protein_coding_GTPase|m.821 SPAC4C5.02c_ryh1_I_GTPase SPAC4C5.03_1196723_1198284_1_SPAC4C5.03_I_protein_coding_CTNS|m.824 SPAC4C5.03_SPAC4C5.03_I_CTNS SPAC4C5.04_1198224_1199733_1_rad31_I_protein_coding_SUMO|m.825 SPAC4C5.04_rad31_I_SUMO SPAC4G8.03c_757915_762714_-1_SPAC4G8.03c_I_protein_coding_RNA-binding|m.497 SPAC4G8.03c_SPAC4G8.03c_I_RNA-binding SPAC4G8.04_767446_770246_1_SPAC4G8.04_I_protein_coding_GTPase|m.499 SPAC4G8.04_SPAC4G8.04_I_GTPase SPAC4G8.05_770502_772666_1_ppk14_I_protein_coding_serine_threonine|m.500 SPAC4G8.05_ppk14_I_serine_threonine SPAC4G8.06c_772650_774027_-1_trm12_I_protein_coding_tRNA|m.502 SPAC4G8.06c_trm12_I_tRNA SPAC4G8.07c_774000_776062_-1_trm2_I_protein_coding_tRNA|m.503 SPAC4G8.07c_trm2_I_tRNA SPAC4G8.08_777177_778498_1_SPAC4G8.08_I_protein_coding_mitochondrial|m.505 SPAC4G8.08_SPAC4G8.08_I_mitochondrial SPAC4G8.09_778431_781324_1_SPAC4G8.09_I_protein_coding_mitochondrial|m.506 SPAC4G8.09_SPAC4G8.09_I_mitochondrial SPAC4G8.10_781348_783419_1_gos1_I_protein_coding_SNARE|m.511 SPAC4G8.10_gos1_I_SNARE SPAC4G8.11c_781347_783634_-1_atp10_I_protein_coding_mitochondrial|m.509 SPAC4G8.11c_atp10_I_mitochondrial SPAC4G8.13c_786778_790219_-1_prz1_I_protein_coding_calcineurin|m.517 SPAC4G8.13c_prz1_I_calcineurin SPAC521.02_843197_844165_1_SPAC521.02_I_protein_coding_WLM|m.548 SPAC521.02_SPAC521.02_I_WLM SPAC521.03_844948_846142_1_SPAC521.03_I_protein_coding_short|m.549 SPAC521.03_SPAC521.03_I_short SPAC521.04c_846022_849480_-1_sst1_I_protein_coding_calcium|m.552 SPAC521.04c_sst1_I_calcium SPAC521.05_849421_850259_1_rps802_I_protein_coding_40S|m.553 SPAC521.05_rps802_I_40S SPAC56F8.02_1124058_1129104_1_SPAC56F8.02_I_protein_coding_AMP|m.753 
SPAC56F8.02_SPAC56F8.02_I_AMP SPAC56F8.03_1129519_1133089_1_SPAC56F8.03_I_protein_coding_translation|m.756 SPAC56F8.03_SPAC56F8.03_I_translation SPAC56F8.04c_1133226_1134356_-1_ppt1_I_protein_coding_para-hydroxybenzoate--polyprenyltransferase|m.759 SPAC56F8.04c_ppt1_I_para-hydroxybenzoate--polyprenyltransferase SPAC56F8.05c_1134418_1136038_-1_mug64_I_protein_coding_BAR|m.760 SPAC56F8.05c_mug64_I_BAR SPAC56F8.06c_1136196_1138046_-1_alg10_I_protein_coding_dolichyl-phosphate-glucose-glycolipid|m.761 SPAC56F8.06c_alg10_I_dolichyl-phosphate-glucose-glycolipid SPAC56F8.07_1138566_1139117_1_SPAC56F8.07_I_protein_coding_conserved|m.763 SPAC56F8.07_SPAC56F8.07_I_conserved SPAC56F8.08_1139130_1140325_1_mud1_I_protein_coding_UBA|m.764 SPAC56F8.08_mud1_I_UBA SPAC56F8.09_1140580_1142002_1_rrp8_I_protein_coding_rRNA|m.765 SPAC56F8.09_rrp8_I_rRNA SPAC56F8.10_1143063_1145256_1_met9_I_protein_coding_methylenetetrahydrofolate|m.766 SPAC56F8.10_met9_I_methylenetetrahydrofolate SPAC56F8.11_1145305_1146800_1_spc3_I_protein_coding_signal|m.769 SPAC56F8.11_spc3_I_signal SPAC56F8.12_1146833_1148085_1_SPAC56F8.12_I_protein_coding_conserved|m.770 SPAC56F8.12_SPAC56F8.12_I_conserved SPAC56F8.13_1149078_1150659_1_SPAC56F8.13_I_protein_coding_dubious|m.778 SPAC56F8.13_SPAC56F8.13_I_dubious SPAC56F8.14c_1148131_1152178_-1_mug115_I_protein_coding_Schizosaccharomyces|m.773 SPAC56F8.14c_mug115_I_Schizosaccharomyces SPAC56F8.15_1151431_1153638_1_SPAC56F8.15_I_protein_coding_Schizosaccharomyces|m.781 SPAC56F8.15_SPAC56F8.15_I_Schizosaccharomyces SPAC56F8.16_1153572_1156804_1_esc1_I_protein_coding_transcription|m.783 SPAC56F8.16_esc1_I_transcription SPAC5H10.01_146974_148055_1_SPAC5H10.01_I_protein_coding_DUF1445|m.90 SPAC5H10.01_SPAC5H10.01_I_DUF1445 SPAC5H10.02c_148038_150331_-1_hsp3102_I_protein_coding_glyoxylase|m.91 SPAC5H10.02c_hsp3102_I_glyoxylase SPAC5H10.03_149446_152909_1_SPAC5H10.03_I_protein_coding_phosphoglycerate|m.94 SPAC5H10.03_SPAC5H10.03_I_phosphoglycerate 
SPAC5H10.04_152851_155515_1_SPAC5H10.04_I_protein_coding_NADPH|m.95 SPAC5H10.04_SPAC5H10.04_I_NADPH SPAC5H10.04_152851_155515_1_SPAC5H10.04_I_protein_coding_NADPH|m.96 SPAC5H10.05c_SPAC5H10.05c_I_FAD SPAC5H10.06c_156430_158307_-1_adh4_I_protein_coding_alcohol|m.99 SPAC5H10.06c_adh4_I_alcohol SPAC5H10.08c_159880_160945_-1_pan6_I_protein_coding_pantoate-beta-alanine|m.103 SPAC5H10.08c_pan6_I_pantoate-beta-alanine SPAC5H10.09c_160977_161822_-1_ecm31_I_protein_coding_3-methyl-2-oxobutanoatehydroxymethyltransferase|m.104 SPAC5H10.09c_ecm31_I_3-methyl-2-oxobutanoatehydroxymethyltransferase SPAC5H10.10_162756_164635_1_SPAC5H10.10_I_protein_coding_NADPH|m.106 SPAC5H10.10_SPAC5H10.10_I_NADPH SPAC5H10.12c_165814_167826_-1_SPAC5H10.12c_I_protein_coding_acetylglucosaminyltransferase|m.108 SPAC5H10.12c_SPAC5H10.12c_I_acetylglucosaminyltransferase SPAC630.03_350406_352296_1_arp3_I_protein_coding_Arp2_3|m.225 SPAC630.03_arp3_I_Arp2_3 SPAC630.04c_350239_353340_-1_SPAC630.04c_I_protein_coding_Schizosaccharomyces|m.223 SPAC630.04c_SPAC630.04c_I_Schizosaccharomyces SPAC630.05_353783_356580_1_gyp7_I_protein_coding_GTPase|m.229 SPAC630.05_gyp7_I_GTPase SPAC630.06c_353705_357205_-1_SPAC630.06c_I_protein_coding_conserved|m.227 SPAC630.06c_SPAC630.06c_I_conserved SPAC630.07c_357325_359228_-1_SPAC630.07c_I_protein_coding_Schizosaccharomyces|m.231 SPAC630.07c_SPAC630.07c_I_Schizosaccharomyces SPAC630.08c_359638_361266_-1_erg25_I_protein_coding_C-4|m.233 SPAC630.08c_erg25_I_C-4 SPAC630.09c_362248_363714_-1_mug58_I_protein_coding_GLYK|m.238 SPAC630.09c_mug58_I_GLYK SPAC630.10_365204_366442_1_bmt2_I_protein_coding_rRNA|m.239 SPAC630.10_bmt2_I_rRNA SPAC630.11_366634_367890_1_vps55_I_protein_coding_vacuolar|m.240 SPAC630.11_vps55_I_vacuolar SPAC630.12_368040_369950_1_SPAC630.12_I_protein_coding_ER|m.242 SPAC630.12_SPAC630.12_I_ER SPAC630.13c_369791_374217_-1_tsc2_I_protein_coding_tuberin|m.243 SPAC630.13c_tsc2_I_tuberin SPAC630.14c_374316_377908_-1_tup12_I_protein_coding_transcriptional|m.244 
SPAC630.14c_tup12_I_transcriptional SPAC806.03c_235533_236104_-1_rps2601_I_protein_coding_40S|m.154 SPAC806.03c_rps2601_I_40S SPAC806.04c_241008_243122_-1_SPAC806.04c_I_protein_coding_protein-glutamate|m.156 SPAC806.04c_SPAC806.04c_I_protein-glutamate SPAC806.05_244214_247574_1_SPAC806.05_I_protein_coding_mitochondrial|m.159 SPAC806.06c_SPAC806.06c_I_nicotinamide SPAC806.05_244214_247574_1_SPAC806.05_I_protein_coding_mitochondrial|m.160 SPAC806.05_SPAC806.05_I_mitochondrial SPAC806.07_247821_248560_1_ndk1_I_protein_coding_nucleoside|m.161 SPAC806.07_ndk1_I_nucleoside SPAC806.08c_248579_250983_-1_mod21_I_protein_coding_gamma|m.162 SPAC806.08c_mod21_I_gamma SPAC821.03c_981473_983481_-1_slf1_I_protein_coding_cell|m.648 SPAC821.03c_slf1_I_cell SPAC821.04c_983567_987084_-1_cid13_I_protein_coding_poly(A)|m.649 SPAC821.04c_cid13_I_poly(A) SPAC821.05_988076_989866_1_tif38_I_protein_coding_translation|m.651 SPAC821.05_tif38_I_translation SPAC821.06_990192_991889_1_spn2_I_protein_coding_mitotic|m.652 SPAC821.06_spn2_I_mitotic SPAC821.07c_991632_994230_-1_moc3_I_protein_coding_transcription|m.654 SPAC821.07c_moc3_I_transcription SPAC821.08c_994941_997625_-1_slp1_I_protein_coding_substrate-specific|m.655 SPAC821.08c_slp1_I_substrate-specific SPAC821.10c_1002838_1003600_-1_sod1_I_protein_coding_superoxide|m.660 SPAC821.10c_sod1_I_superoxide SPAC821.11_1006259_1008003_1_pro1_I_protein_coding_gamma-glutamyl|m.662 SPAC821.11_pro1_I_gamma-glutamyl SPAC821.12_1008215_1010318_1_orb6_I_protein_coding_serine_threonine|m.664 SPAC821.12_orb6_I_serine_threonine SPAC821.13c_1010343_1015415_-1_dnf1_I_protein_coding_Trans-golgi|m.665 SPAC821.13c_dnf1_I_Trans-golgi SPAC977.01_29764_31069_1_SPAC977.01_I_protein_coding_S.|m.11 SPAC977.01_SPAC977.01_I_S. SPAC977.02_32034_33012_1_SPAC977.02_I_protein_coding_S.|m.13 SPAC977.02_SPAC977.02_I_S. 
SPAC977.03_33835_34272_1_SPAC977.03_I_protein_coding_methyltransferase|m.14 SPAC977.03_SPAC977.03_I_methyltransferase SPAC977.04_34298_34978_1_SPAC977.04_I_protein_coding_truncated|m.15 SPAC750.02c_SPAC750.02c_I_transmembrane SPAC977.05c_35768_36382_-1_SPAC977.05c_I_protein_coding_conserved|m.16 SPAC977.05c_SPAC977.05c_I_conserved SPAC977.06_39416_40072_1_SPAC977.06_I_protein_coding_S.|m.17 SPAC977.06_SPAC977.06_I_S. SPAC977.07c_42057_43307_-1_pfl6_I_protein_coding_cell|m.18 SPAC977.07c_pfl6_I_cell SPAC977.08_44644_45468_1_SPAC977.08_I_protein_coding_short|m.19 SPAC977.08_SPAC977.08_I_short SPAC977.09c_45875_48399_-1_SPAC977.09c_I_protein_coding_phospholipase|m.20 SPAC977.09c_SPAC977.09c_I_phospholipase SPAC977.10_50946_53858_1_sod2_I_protein_coding_plasma|m.22 SPAC977.10_sod2_I_plasma SPAC977.11_55059_56308_1_SPAC977.11_I_protein_coding_CRCB|m.23 SPAC977.11_SPAC977.11_I_CRCB SPAC977.12_56373_57736_1_SPAC977.12_I_protein_coding_L-asparaginase|m.24 SPAC977.12_SPAC977.12_I_L-asparaginase SPAC977.14c_59614_60907_-1_SPAC977.14c_I_protein_coding_aldo_keto|m.25 SPAC977.14c_SPAC977.14c_I_aldo_keto SPAC977.15_62961_63862_1_SPAC977.15_I_protein_coding_dienelactone|m.26 SPAC977.15_SPAC977.15_I_dienelactone SPAC977.16c_64559_66980_-1_dak2_I_protein_coding_dihydroxyacetone|m.27 SPAC977.16c_dak2_I_dihydroxyacetone SPAC977.17_66219_69821_1_SPAC977.17_I_protein_coding_MIP|m.30 SPAC977.17_SPAC977.17_I_MIP SPAC977.18_31140_32345_-1_SPAC977.18_I_protein_coding_conserved|m.12 SPAC977.18_SPAC977.18_I_conserved SPAPB21F2.02_492335_497927_1_SPAPB21F2.02_I_protein_coding_Dopey|m.319 SPAPB21F2.02_SPAPB21F2.02_I_Dopey SPAPB21F2.03_498111_499027_1_slx9_I_protein_coding_ribosome|m.321 SPAPB21F2.03_slx9_I_ribosome SPAPJ695.01c_77480_78066_-1_SPAPJ695.01c_I_protein_coding_S.|m.33 SPAPJ695.01c_SPAPJ695.01c_I_S. SPAPJ696.01c_719090_723684_-1_vps17_I_protein_coding_retromer|m.473 SPAPJ696.01c_vps17_I_retromer SPAPJ696.02_724145_725946_1_lsb4_I_protein_coding_actin|m.477 SPAPJ696.02_lsb4_I_actin
# Show the entry labelled 0 in the s_name column of db_x_pep_df.
db_x_pep_df['s_name'][0]
'SPAC212.11_1_5662_-1_tlh1_I_protein_coding_RecQ|m.1'
# Number of rows in bh_df whose RBH column is True.
len(bh_df.query('RBH == True').index)
478
# Fit a StandardScaler on the E and q_len columns, using only the rows of
# bh_df where RBH is True. The fit call is left as the final bare expression
# so the notebook still echoes the fitted estimator.
scaler = preprocessing.StandardScaler()
scaler.fit(bh_df.query('RBH == True').loc[:, ['E', 'q_len']])
StandardScaler(copy=True, with_mean=True, with_std=True)
# Overwrite E and q_len in both frames with their scaler-transformed values
# (rbh_df first, then bh_df), then show how many rows bh_df has.
# NOTE(review): the columns are replaced in place, so re-running this cell
# transforms values that were already transformed.
for _frame in (rbh_df, bh_df):
    _frame[['E', 'q_len']] = scaler.transform(_frame[['E', 'q_len']])
len(bh_df.index)
500
# Call CRBL.best_hits on bh_df; its return value is not kept.
# NOTE(review): presumably this updates the RBH column of bh_df in place --
# confirm against dammit.model.CRBL.
CRBL.best_hits(bh_df)
# Recount the rows whose RBH column is True.
len(bh_df.query('RBH == True').index)
81
# Draw distribution plots of the E and q_len columns of rbh_df, labelled
# 'E' and 'Length' respectively. The second call stays a bare expression so
# the notebook echoes the returned axes object.
sns.distplot(rbh_df.E, label='E')
sns.distplot(rbh_df.q_len, label='Length')
<matplotlib.axes._subplots.AxesSubplot at 0x111f78250>
# Scatter plot of every row of bh_df in (q_len, E) space, coloured by the
# RBH column, written to sigh.svg.
figsize(12, 8)
scatter(bh_df.q_len, bh_df.E, c=bh_df.RBH, cmap=plt.cm.Paired, alpha=0.8)
xlabel('Query Length (scaled)')
# Raw string: '\l' is not a valid Python escape, so the backslash only
# survived through the invalid-escape fallback. The runtime text is unchanged.
# NOTE(review): scale_evalue earlier in this file returns -log10(E); if the
# E column went through it, this label is missing the minus sign -- confirm.
ylabel(r'$\log10 Evalue$ (scaled)')
title('LAST hits, RBH and regular', fontsize=14)
savefig('sigh.svg')

# Same columns as a seaborn lmplot with an order-2 fit per RBH value,
# y-axis limited to [-2, 2], written to sigh2.svg.
g = sns.lmplot('q_len', 'E', bh_df, size=10,
               hue='RBH', order=2, palette=sns.color_palette('Set1'))
# Raw string for the mathtext label, matching the title call below.
g = g.set_axis_labels("Query Length (scaled)", r"$\log10 Evalue$ (scaled)")
title(r'$S. pombe$ LAST hits, RBH and regular', fontsize=14)
axis(ymax=2, ymin=-2)
savefig('sigh2.svg')
<bound method FacetGrid.despine of <seaborn.axisgrid.FacetGrid object at 0x10f622390>>
# 500 evenly spaced values from the minimum to the maximum of bh_df.q_len.
np.linspace(bh_df['q_len'].min(), bh_df['q_len'].max(), num=500)
array([ -1.50237213e+00, -1.47722045e+00, -1.45206877e+00, -1.42691709e+00, -1.40176541e+00, -1.37661374e+00, -1.35146206e+00, -1.32631038e+00, -1.30115870e+00, -1.27600702e+00, -1.25085534e+00, -1.22570366e+00, -1.20055198e+00, -1.17540030e+00, -1.15024862e+00, -1.12509694e+00, -1.09994526e+00, -1.07479358e+00, -1.04964191e+00, -1.02449023e+00, -9.99338547e-01, -9.74186867e-01, -9.49035188e-01, -9.23883509e-01, -8.98731830e-01, -8.73580151e-01, -8.48428471e-01, -8.23276792e-01, -7.98125113e-01, -7.72973434e-01, -7.47821754e-01, -7.22670075e-01, -6.97518396e-01, -6.72366717e-01, -6.47215037e-01, -6.22063358e-01, -5.96911679e-01, -5.71760000e-01, -5.46608320e-01, -5.21456641e-01, -4.96304962e-01, -4.71153283e-01, -4.46001604e-01, -4.20849924e-01, -3.95698245e-01, -3.70546566e-01, -3.45394887e-01, -3.20243207e-01, -2.95091528e-01, -2.69939849e-01, -2.44788170e-01, -2.19636490e-01, -1.94484811e-01, -1.69333132e-01, -1.44181453e-01, -1.19029774e-01, -9.38780943e-02, -6.87264151e-02, -4.35747358e-02, -1.84230566e-02, 6.72862265e-03, 3.18803019e-02, 5.70319811e-02, 8.21836603e-02, 1.07335340e-01, 1.32487019e-01, 1.57638698e-01, 1.82790377e-01, 2.07942057e-01, 2.33093736e-01, 2.58245415e-01, 2.83397094e-01, 3.08548773e-01, 3.33700453e-01, 3.58852132e-01, 3.84003811e-01, 4.09155490e-01, 4.34307170e-01, 4.59458849e-01, 4.84610528e-01, 5.09762207e-01, 5.34913887e-01, 5.60065566e-01, 5.85217245e-01, 6.10368924e-01, 6.35520603e-01, 6.60672283e-01, 6.85823962e-01, 7.10975641e-01, 7.36127320e-01, 7.61279000e-01, 7.86430679e-01, 8.11582358e-01, 8.36734037e-01, 8.61885717e-01, 8.87037396e-01, 9.12189075e-01, 9.37340754e-01, 9.62492434e-01, 9.87644113e-01, 1.01279579e+00, 1.03794747e+00, 1.06309915e+00, 1.08825083e+00, 1.11340251e+00, 1.13855419e+00, 1.16370587e+00, 1.18885755e+00, 1.21400923e+00, 1.23916091e+00, 1.26431258e+00, 1.28946426e+00, 1.31461594e+00, 1.33976762e+00, 1.36491930e+00, 1.39007098e+00, 1.41522266e+00, 1.44037434e+00, 1.46552602e+00, 1.49067770e+00, 
1.51582938e+00, 1.54098106e+00, 1.56613274e+00, 1.59128441e+00, 1.61643609e+00, 1.64158777e+00, 1.66673945e+00, 1.69189113e+00, 1.71704281e+00, 1.74219449e+00, 1.76734617e+00, 1.79249785e+00, 1.81764953e+00, 1.84280121e+00, 1.86795289e+00, 1.89310457e+00, 1.91825624e+00, 1.94340792e+00, 1.96855960e+00, 1.99371128e+00, 2.01886296e+00, 2.04401464e+00, 2.06916632e+00, 2.09431800e+00, 2.11946968e+00, 2.14462136e+00, 2.16977304e+00, 2.19492472e+00, 2.22007640e+00, 2.24522807e+00, 2.27037975e+00, 2.29553143e+00, 2.32068311e+00, 2.34583479e+00, 2.37098647e+00, 2.39613815e+00, 2.42128983e+00, 2.44644151e+00, 2.47159319e+00, 2.49674487e+00, 2.52189655e+00, 2.54704823e+00, 2.57219990e+00, 2.59735158e+00, 2.62250326e+00, 2.64765494e+00, 2.67280662e+00, 2.69795830e+00, 2.72310998e+00, 2.74826166e+00, 2.77341334e+00, 2.79856502e+00, 2.82371670e+00, 2.84886838e+00, 2.87402006e+00, 2.89917173e+00, 2.92432341e+00, 2.94947509e+00, 2.97462677e+00, 2.99977845e+00, 3.02493013e+00, 3.05008181e+00, 3.07523349e+00, 3.10038517e+00, 3.12553685e+00, 3.15068853e+00, 3.17584021e+00, 3.20099189e+00, 3.22614356e+00, 3.25129524e+00, 3.27644692e+00, 3.30159860e+00, 3.32675028e+00, 3.35190196e+00, 3.37705364e+00, 3.40220532e+00, 3.42735700e+00, 3.45250868e+00, 3.47766036e+00, 3.50281204e+00, 3.52796372e+00, 3.55311539e+00, 3.57826707e+00, 3.60341875e+00, 3.62857043e+00, 3.65372211e+00, 3.67887379e+00, 3.70402547e+00, 3.72917715e+00, 3.75432883e+00, 3.77948051e+00, 3.80463219e+00, 3.82978387e+00, 3.85493555e+00, 3.88008722e+00, 3.90523890e+00, 3.93039058e+00, 3.95554226e+00, 3.98069394e+00, 4.00584562e+00, 4.03099730e+00, 4.05614898e+00, 4.08130066e+00, 4.10645234e+00, 4.13160402e+00, 4.15675570e+00, 4.18190738e+00, 4.20705905e+00, 4.23221073e+00, 4.25736241e+00, 4.28251409e+00, 4.30766577e+00, 4.33281745e+00, 4.35796913e+00, 4.38312081e+00, 4.40827249e+00, 4.43342417e+00, 4.45857585e+00, 4.48372753e+00, 4.50887921e+00, 4.53403088e+00, 4.55918256e+00, 4.58433424e+00, 4.60948592e+00, 4.63463760e+00, 
4.65978928e+00, 4.68494096e+00, 4.71009264e+00, 4.73524432e+00, 4.76039600e+00, 4.78554768e+00, 4.81069936e+00, 4.83585104e+00, 4.86100271e+00, 4.88615439e+00, 4.91130607e+00, 4.93645775e+00, 4.96160943e+00, 4.98676111e+00, 5.01191279e+00, 5.03706447e+00, 5.06221615e+00, 5.08736783e+00, 5.11251951e+00, 5.13767119e+00, 5.16282287e+00, 5.18797454e+00, 5.21312622e+00, 5.23827790e+00, 5.26342958e+00, 5.28858126e+00, 5.31373294e+00, 5.33888462e+00, 5.36403630e+00, 5.38918798e+00, 5.41433966e+00, 5.43949134e+00, 5.46464302e+00, 5.48979470e+00, 5.51494637e+00, 5.54009805e+00, 5.56524973e+00, 5.59040141e+00, 5.61555309e+00, 5.64070477e+00, 5.66585645e+00, 5.69100813e+00, 5.71615981e+00, 5.74131149e+00, 5.76646317e+00, 5.79161485e+00, 5.81676653e+00, 5.84191820e+00, 5.86706988e+00, 5.89222156e+00, 5.91737324e+00, 5.94252492e+00, 5.96767660e+00, 5.99282828e+00, 6.01797996e+00, 6.04313164e+00, 6.06828332e+00, 6.09343500e+00, 6.11858668e+00, 6.14373836e+00, 6.16889003e+00, 6.19404171e+00, 6.21919339e+00, 6.24434507e+00, 6.26949675e+00, 6.29464843e+00, 6.31980011e+00, 6.34495179e+00, 6.37010347e+00, 6.39525515e+00, 6.42040683e+00, 6.44555851e+00, 6.47071019e+00, 6.49586186e+00, 6.52101354e+00, 6.54616522e+00, 6.57131690e+00, 6.59646858e+00, 6.62162026e+00, 6.64677194e+00, 6.67192362e+00, 6.69707530e+00, 6.72222698e+00, 6.74737866e+00, 6.77253034e+00, 6.79768202e+00, 6.82283369e+00, 6.84798537e+00, 6.87313705e+00, 6.89828873e+00, 6.92344041e+00, 6.94859209e+00, 6.97374377e+00, 6.99889545e+00, 7.02404713e+00, 7.04919881e+00, 7.07435049e+00, 7.09950217e+00, 7.12465385e+00, 7.14980552e+00, 7.17495720e+00, 7.20010888e+00, 7.22526056e+00, 7.25041224e+00, 7.27556392e+00, 7.30071560e+00, 7.32586728e+00, 7.35101896e+00, 7.37617064e+00, 7.40132232e+00, 7.42647400e+00, 7.45162568e+00, 7.47677735e+00, 7.50192903e+00, 7.52708071e+00, 7.55223239e+00, 7.57738407e+00, 7.60253575e+00, 7.62768743e+00, 7.65283911e+00, 7.67799079e+00, 7.70314247e+00, 7.72829415e+00, 7.75344583e+00, 7.77859751e+00, 
7.80374919e+00, 7.82890086e+00, 7.85405254e+00, 7.87920422e+00, 7.90435590e+00, 7.92950758e+00, 7.95465926e+00, 7.97981094e+00, 8.00496262e+00, 8.03011430e+00, 8.05526598e+00, 8.08041766e+00, 8.10556934e+00, 8.13072102e+00, 8.15587269e+00, 8.18102437e+00, 8.20617605e+00, 8.23132773e+00, 8.25647941e+00, 8.28163109e+00, 8.30678277e+00, 8.33193445e+00, 8.35708613e+00, 8.38223781e+00, 8.40738949e+00, 8.43254117e+00, 8.45769285e+00, 8.48284452e+00, 8.50799620e+00, 8.53314788e+00, 8.55829956e+00, 8.58345124e+00, 8.60860292e+00, 8.63375460e+00, 8.65890628e+00, 8.68405796e+00, 8.70920964e+00, 8.73436132e+00, 8.75951300e+00, 8.78466468e+00, 8.80981635e+00, 8.83496803e+00, 8.86011971e+00, 8.88527139e+00, 8.91042307e+00, 8.93557475e+00, 8.96072643e+00, 8.98587811e+00, 9.01102979e+00, 9.03618147e+00, 9.06133315e+00, 9.08648483e+00, 9.11163651e+00, 9.13678818e+00, 9.16193986e+00, 9.18709154e+00, 9.21224322e+00, 9.23739490e+00, 9.26254658e+00, 9.28769826e+00, 9.31284994e+00, 9.33800162e+00, 9.36315330e+00, 9.38830498e+00, 9.41345666e+00, 9.43860834e+00, 9.46376001e+00, 9.48891169e+00, 9.51406337e+00, 9.53921505e+00, 9.56436673e+00, 9.58951841e+00, 9.61467009e+00, 9.63982177e+00, 9.66497345e+00, 9.69012513e+00, 9.71527681e+00, 9.74042849e+00, 9.76558017e+00, 9.79073184e+00, 9.81588352e+00, 9.84103520e+00, 9.86618688e+00, 9.89133856e+00, 9.91649024e+00, 9.94164192e+00, 9.96679360e+00, 9.99194528e+00, 1.00170970e+01, 1.00422486e+01, 1.00674003e+01, 1.00925520e+01, 1.01177037e+01, 1.01428554e+01, 1.01680070e+01, 1.01931587e+01, 1.02183104e+01, 1.02434621e+01, 1.02686137e+01, 1.02937654e+01, 1.03189171e+01, 1.03440688e+01, 1.03692205e+01, 1.03943721e+01, 1.04195238e+01, 1.04446755e+01, 1.04698272e+01, 1.04949789e+01, 1.05201305e+01, 1.05452822e+01, 1.05704339e+01, 1.05955856e+01, 1.06207373e+01, 1.06458889e+01, 1.06710406e+01, 1.06961923e+01, 1.07213440e+01, 1.07464957e+01, 1.07716473e+01, 1.07967990e+01, 1.08219507e+01, 1.08471024e+01, 1.08722541e+01, 1.08974057e+01, 1.09225574e+01, 
1.09477091e+01, 1.09728608e+01, 1.09980124e+01, 1.10231641e+01, 1.10483158e+01])
# 10-row moving average of E with q_len as the index. set_index does not
# sort, so the window runs over bh_df's existing row order.
# NOTE(review): pd.rolling_mean is the legacy top-level API; newer pandas
# spells this Series.rolling(10).mean() -- confirm the pinned pandas version
# before porting.
pd.rolling_mean(bh_df.set_index('q_len').E, window=10)
q_len 3.094732 NaN 3.094732 NaN -0.687470 NaN -0.959387 NaN -0.959387 NaN -0.959387 NaN 3.094732 NaN -1.400403 NaN -1.400403 NaN -1.400403 0.638555 -0.687470 0.462870 -0.687470 0.287185 3.094732 0.033922 -0.959387 -0.091736 3.094732 -0.215210 3.094732 -0.343245 3.094732 -0.456894 3.094732 -0.568641 3.094732 -0.680564 3.094732 -0.789175 -0.606744 -0.570201 -0.606744 -0.351228 -0.606744 -0.059487 -0.606744 0.243277 -0.344174 0.504460 -0.984030 0.777044 -0.984030 1.048110 -0.984030 1.318149 -0.984030 1.571854 -0.984030 1.826568 ... 1.483621 -0.199843 0.101091 0.059302 1.483621 0.341218 1.483621 0.618060 1.483621 0.889124 1.483621 1.103656 1.483621 1.110536 1.483621 1.143865 1.483621 0.938542 1.483621 0.976199 1.483621 0.751432 0.681465 0.813889 -0.802185 0.857221 -0.737604 0.806812 0.115536 0.736152 -1.234703 0.698586 0.115536 0.545425 0.115536 0.480660 0.115536 0.427871 0.115536 0.380178 0.115536 0.339398 0.681465 0.195950 0.681465 -0.089015 0.681465 -0.322149 0.681465 -0.528582 1.555849 -0.444556 -0.259200 -0.191169 1.555849 -0.164765 1.555849 -0.148840 1.555849 -0.140356 Name: E, dtype: float64
# Build both classifiers with default settings. Only the SVC is trained in
# this cell: features are the q_len and E columns of bh_df, the target is
# the RBH column cast to int. The fit call stays a bare expression so the
# notebook echoes the fitted estimator.
gnb = GaussianNB()
svc_clf = svm.SVC()
svc_clf.fit(bh_df.loc[:, ['q_len', 'E']], bh_df['RBH'].astype(int))
SVC(C=1.0, cache_size=200, class_weight=None, coef0=0.0, decision_function_shape=None, degree=3, gamma='auto', kernel='rbf', max_iter=-1, probability=False, random_state=None, shrinking=True, tol=0.001, verbose=False)
# Display bh_df; the notebook renders the frame as the table that follows.
bh_df
E | EG2 | q_aln_len | q_len | q_name | q_start | q_strand | s_aln_len | s_len | s_name | s_start | s_strand | score | bitscore | RBH | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 1.164817 | 0.000000e+00 | 5661 | 12.714760 | SPAC212.11_1_5662_-1_tlh1_I_protein_coding_RecQ | 0 | + | 1887 | 1887 | SPAC212.11_tlh1_I_RecQ | 0 | + | 10676 | 5628.211770 | True |
1 | 1.164817 | 0.000000e+00 | 5661 | 12.714760 | SPAC212.11_1_5662_-1_tlh1_I_protein_coding_RecQ | 0 | + | 1887 | 1919 | SPBCPT2R1.08c_tlh2_II_RecQ | 0 | + | 10676 | 5628.211770 | True |
2 | 1.209665 | 1.300000e-237 | 834 | 1.858059 | SPAC212.08c_11784_12994_1_SPAC212.08c_I_protei... | 374 | + | 278 | 278 | SPAC212.08c_SPAC212.08c_I_S. | 0 | + | 1602 | 846.731705 | True |
3 | -0.095597 | 1.400000e-116 | 441 | 1.077528 | SPAC212.06c_18042_18974_1_SPAC212.06c_I_protei... | 30 | + | 147 | 147 | SPAC212.06c_SPAC212.06c_I_DNA | 0 | + | 839 | 444.674256 | True |
4 | -0.153000 | 2.400000e-111 | 462 | 1.077528 | SPAC212.06c_18042_18974_1_SPAC212.06c_I_protei... | 0 | + | 168 | 1887 | SPAC212.11_tlh1_I_RecQ | 1477 | + | 806 | 427.285140 | True |
5 | -0.153000 | 2.400000e-111 | 462 | 1.077528 | SPAC212.06c_18042_18974_1_SPAC212.06c_I_protei... | 0 | + | 168 | 1919 | SPBCPT2R1.08c_tlh2_II_RecQ | 1477 | + | 806 | 427.285140 | True |
6 | -0.272948 | 4.700000e-104 | 474 | 12.714760 | SPAC212.11_1_5662_-1_tlh1_I_protein_coding_RecQ | 4461 | + | 144 | 147 | SPAC212.06c_SPAC212.06c_I_DNA | 0 | + | 760 | 403.045765 | True |
7 | -0.296894 | 8.900000e-90 | 369 | -0.188396 | SPAC212.12_15855_16226_1_SPAC212.12_I_protein_... | 0 | + | 123 | 123 | SPAC212.12_SPAC212.12_I_S. | 0 | + | 670 | 355.620902 | True |
8 | -0.296894 | 8.900000e-90 | 369 | -0.188396 | SPAC212.12_15855_16226_1_SPAC212.12_I_protein_... | 0 | + | 123 | 123 | SPAC750.07c_SPAC750.07c_I_S. | 0 | + | 670 | 355.620902 | True |
9 | -0.337173 | 2.700000e-86 | 371 | -0.188396 | SPAC212.12_15855_16226_1_SPAC212.12_I_protein_... | 0 | + | 127 | 278 | SPAC212.08c_SPAC212.08c_I_S. | 0 | + | 648 | 344.028158 | True |
10 | -0.473007 | 1.200000e-82 | 379 | 1.858059 | SPAC212.08c_11784_12994_1_SPAC212.08c_I_protei... | 374 | + | 123 | 123 | SPAC212.12_SPAC212.12_I_S. | 0 | + | 625 | 331.908471 | True |
11 | -0.473007 | 1.200000e-82 | 379 | 1.858059 | SPAC212.08c_11784_12994_1_SPAC212.08c_I_protei... | 374 | + | 123 | 123 | SPAC750.07c_SPAC750.07c_I_S. | 0 | + | 625 | 331.908471 | True |
12 | -1.151384 | 1.500000e-15 | 942 | 12.714760 | SPAC212.11_1_5662_-1_tlh1_I_protein_coding_RecQ | 3633 | + | 308 | 1328 | SPAC2G11.12_rqh1_I_RecQ | 539 | + | 202 | 109.011615 | True |
13 | -1.267042 | 5.200000e-03 | 135 | 1.077528 | SPAC212.06c_18042_18974_1_SPAC212.06c_I_protei... | 9 | + | 45 | 1328 | SPAC2G11.12_rqh1_I_RecQ | 802 | + | 123 | 67.383125 | True |
14 | -1.304087 | 3.700000e+00 | 336 | 12.714760 | SPAC212.11_1_5662_-1_tlh1_I_protein_coding_RecQ | 4248 | + | 115 | 1063 | SPAC23A1.19c_hrq1_I_RecQ | 552 | + | 105 | 57.898152 | True |
15 | -1.346600 | 7.100000e+04 | 66 | 12.714760 | SPAC212.11_1_5662_-1_tlh1_I_protein_coding_RecQ | 1575 | + | 22 | 867 | SPBC3B8.04c_SPBC3B8.04c_II_sodium | 205 | + | 78 | 43.670693 | True |
16 | -1.332446 | 2.700000e+03 | 252 | 12.714760 | SPAC212.11_1_5662_-1_tlh1_I_protein_coding_RecQ | 4523 | - | 77 | 534 | SPBC215.13_SPBC215.13_II_serine-rich | 301 | + | 87 | 48.413179 | True |
17 | -1.338651 | 1.100000e+04 | 270 | 12.714760 | SPAC212.11_1_5662_-1_tlh1_I_protein_coding_RecQ | 4523 | - | 87 | 534 | SPBC215.13_SPBC215.13_II_serine-rich | 284 | + | 83 | 46.305408 | True |
18 | -1.340301 | 1.700000e+04 | 484 | 12.714760 | SPAC212.11_1_5662_-1_tlh1_I_protein_coding_RecQ | 4291 | - | 157 | 534 | SPBC215.13_SPBC215.13_II_serine-rich | 243 | + | 82 | 45.778465 | True |
19 | -1.349697 | 1.500000e+05 | 45 | 12.714760 | SPAC212.11_1_5662_-1_tlh1_I_protein_coding_RecQ | 441 | - | 15 | 420 | SPBC17D11.01_nep1_II_NEDD8 | 295 | + | 76 | 42.616807 | True |
20 | 1.568373 | 6.300000e-271 | 948 | 2.089779 | SPAC977.01_29764_31069_1_SPAC977.01_I_protein_... | 2 | + | 316 | 316 | SPAC977.01_SPAC977.01_I_S. | 0 | + | 1812 | 957.389718 | True |
21 | 1.568373 | 6.300000e-271 | 948 | 2.089779 | SPAC977.01_29764_31069_1_SPAC977.01_I_protein_... | 2 | + | 316 | 344 | SPBC1348.02_SPBC1348.02_II_S. | 28 | + | 1812 | 957.389718 | True |
22 | 1.568373 | 6.300000e-271 | 948 | 2.089779 | SPAC977.01_29764_31069_1_SPAC977.01_I_protein_... | 2 | + | 316 | 344 | SPBPB2B2.19c_SPBPB2B2.19c_II_S. | 28 | + | 1812 | 957.389718 | True |
23 | 1.555473 | 1.200000e-269 | 948 | 2.089779 | SPAC977.01_29764_31069_1_SPAC977.01_I_protein_... | 2 | + | 316 | 344 | SPAC750.05c_SPAC750.05c_I_S. | 28 | + | 1804 | 953.174175 | True |
24 | 1.130793 | 5.500000e-237 | 864 | 2.843480 | SPAC212.04c_21381_23050_1_SPAC212.04c_I_protei... | 206 | + | 288 | 288 | SPAC212.04c_SPAC212.04c_I_S. | 0 | + | 1598 | 844.623933 | True |
25 | 1.194564 | 3.300000e-229 | 840 | 1.006792 | SPAC212.01c_28738_29657_1_SPAC212.01c_I_protei... | 0 | + | 280 | 280 | SPAC212.01c_SPAC212.01c_I_S. | 0 | + | 1549 | 818.803730 | True |
26 | 1.194564 | 3.300000e-229 | 840 | 1.006792 | SPAC212.01c_28738_29657_1_SPAC212.01c_I_protei... | 0 | + | 280 | 280 | SPBCPT2R1.04c_SPBCPT2R1.04c_II_S. | 0 | + | 1549 | 818.803730 | True |
27 | 1.178788 | 4.200000e-228 | 840 | 1.006792 | SPAC212.01c_28738_29657_1_SPAC212.01c_I_protei... | 0 | + | 280 | 280 | SPAC750.06c_SPAC750.06c_I_S. | 0 | + | 1542 | 815.115129 | True |
28 | 1.024869 | 1.300000e-214 | 840 | 1.006792 | SPAC212.01c_28738_29657_1_SPAC212.01c_I_protei... | 0 | + | 269 | 269 | SPBC1348.01_SPBC1348.01_II_S. | 0 | + | 1457 | 770.324981 | True |
29 | 1.024869 | 1.300000e-214 | 840 | 1.006792 | SPAC212.01c_28738_29657_1_SPAC212.01c_I_protei... | 0 | + | 269 | 269 | SPBCPT2R1.01c_SPBCPT2R1.01c_II_S. | 0 | + | 1457 | 770.324981 | True |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
2274 | 1.164817 | 0.000000e+00 | 4419 | 11.526889 | SPAC10F6.01c_1200916_1206090_-1_sir1_I_protein... | 592 | + | 1473 | 1473 | SPAC10F6.01c_sir1_I_sulfite | 0 | + | 8228 | 4338.255499 | False |
2275 | -1.163565 | 2.800000e-14 | 426 | 11.526889 | SPAC10F6.01c_1200916_1206090_-1_sir1_I_protein... | 2779 | + | 138 | 584 | SPAC1296.06_tah18_I_NADPH-dependent | 7 | + | 194 | 104.796072 | False |
2276 | 1.164817 | 0.000000e+00 | 3504 | 8.090113 | SPAC10F6.02c_1206812_1210630_-1_prp22_I_protei... | 146 | + | 1168 | 1168 | SPAC10F6.02c_prp22_I_ATP-dependent | 0 | + | 6562 | 3460.368593 | False |
2277 | 1.164817 | 0.000000e+00 | 1800 | 4.121599 | SPAC10F6.03c_1211195_1213553_-1_cts1_I_protein... | 85 | + | 600 | 600 | SPAC10F6.03c_cts1_I_CTP | 0 | + | 3373 | 1779.947618 | False |
2278 | 1.377100 | 8.100000e-270 | 1929 | 8.090113 | SPAC10F6.02c_1206812_1210630_-1_prp22_I_protei... | 1649 | + | 645 | 1055 | SPBC19C2.01_cdc28_II_ATP-dependent | 409 | + | 1805 | 953.701118 | False |
2279 | 1.329796 | 4.600000e-265 | 2232 | 8.090113 | SPAC10F6.02c_1206812_1210630_-1_prp22_I_protei... | 1298 | + | 731 | 1173 | SPBC1711.17_prp16_II_ATP-dependent | 377 | + | 1775 | 937.892830 | False |
2280 | 1.260204 | 4.400000e-258 | 1872 | 8.090113 | SPAC10F6.02c_1206812_1210630_-1_prp22_I_protei... | 1658 | + | 635 | 735 | SPBC16H5.10c_prp43_II_ATP-dependent | 69 | + | 1731 | 914.707341 | False |
2281 | 0.731690 | 6.100000e-205 | 1869 | 8.090113 | SPAC10F6.02c_1206812_1210630_-1_prp22_I_protei... | 1658 | + | 623 | 719 | SPAC2G11.11c_prh1_I_ATP-dependent | 90 | + | 1396 | 738.181463 | False |
2282 | 0.230463 | 1.700000e-154 | 1845 | 8.090113 | SPAC10F6.02c_1206812_1210630_-1_prp22_I_protei... | 1661 | + | 619 | 647 | SPAC20H4.09_SPAC20H4.09_I_ATP-dependent | 20 | + | 1078 | 570.613614 | False |
2283 | -0.615596 | 2.600000e-69 | 1362 | 8.090113 | SPAC10F6.02c_1206812_1210630_-1_prp22_I_protei... | 1661 | + | 486 | 1327 | SPCC895.09c_ucp12_III_ATP-dependent | 572 | + | 541 | 287.645266 | False |
2284 | -0.749309 | 7.800000e-56 | 720 | 8.090113 | SPAC10F6.02c_1206812_1210630_-1_prp22_I_protei... | 1652 | + | 257 | 1183 | SPAPB1A10.06c_SPAPB1A10.06c_I_ATP-dependent | 390 | + | 456 | 242.855117 | False |
2285 | -0.812507 | 1.700000e-49 | 843 | 8.090113 | SPAC10F6.02c_1206812_1210630_-1_prp22_I_protei... | 2408 | + | 314 | 1183 | SPAPB1A10.06c_SPAPB1A10.06c_I_ATP-dependent | 703 | + | 416 | 221.777400 | False |
2286 | -0.930575 | 1.400000e-37 | 834 | 8.090113 | SPAC10F6.02c_1206812_1210630_-1_prp22_I_protei... | 2309 | + | 280 | 1428 | SPBC15C4.05_dhx29_II_ATP-dependent | 905 | + | 341 | 182.256681 | False |
2287 | 1.747075 | 6.900000e-305 | 1053 | 5.787546 | SPAC10F6.04_1213255_1216120_1_SPAC10F6.04_I_pr... | 427 | + | 351 | 351 | SPAC10F6.04_SPAC10F6.04_I_RCC | 0 | + | 2026 | 1070.155503 | False |
2288 | 1.781061 | 4.800000e-285 | 1023 | 1.528772 | SPAC10F6.08c_1219667_1220847_-1_nht1_I_protein... | 50 | + | 341 | 341 | SPAC10F6.08c_nht1_I_Ino80 | 0 | + | 1901 | 1004.287638 | False |
2289 | 0.859854 | 9.800000e-206 | 771 | 1.714148 | SPAC10F6.06_1217077_1218228_1_vip1_I_protein_c... | 94 | + | 257 | 257 | SPAC10F6.06_vip1_I_RNA-binding | 0 | + | 1401 | 740.816178 | False |
2290 | 0.601482 | 8.000000e-191 | 681 | 4.163065 | SPAC10F6.05c_1214788_1217067_-1_ubc6_I_protein... | 1139 | + | 227 | 227 | SPAC10F6.05c_ubc6_I_ubiquitin | 0 | + | 1307 | 691.283543 | False |
2291 | 0.381483 | 9.400000e-153 | 564 | 0.287240 | SPAC10F6.07c_1218321_1218887_-1_mug94_I_protei... | 0 | + | 188 | 188 | SPAC10F6.07c_mug94_I_Schizosaccharomyces | 0 | + | 1067 | 564.817242 | False |
2292 | -1.197387 | 1.800000e-10 | 333 | 4.163065 | SPAC10F6.05c_1214788_1217067_-1_ubc6_I_protein... | 1154 | + | 110 | 147 | SPBC119.02_ubc4_II_ubiquitin | 1 | + | 170 | 92.149442 | False |
2293 | -1.219367 | 3.000000e-08 | 216 | 4.163065 | SPAC10F6.05c_1214788_1217067_-1_ubc6_I_protein... | 1139 | + | 73 | 166 | SPBP16F5.04_ubc7_II_ubiquitin | 0 | + | 156 | 84.772241 | False |
2294 | -1.241428 | 5.000000e-06 | 324 | 4.163065 | SPAC10F6.05c_1214788_1217067_-1_ubc6_I_protein... | 1160 | + | 107 | 148 | SPAC11E3.04c_ubc13_I_ubiquitin | 4 | + | 142 | 77.395040 | False |
2295 | -1.257127 | 1.900000e-04 | 327 | 4.163065 | SPAC10F6.05c_1214788_1217067_-1_ubc6_I_protein... | 1160 | + | 111 | 160 | SPBC1198.09_ubc16_II_ubiquitin | 5 | + | 132 | 72.125611 | False |
2296 | -1.310745 | 4.800000e+01 | 336 | 4.163065 | SPAC10F6.05c_1214788_1217067_-1_ubc6_I_protein... | 1160 | + | 112 | 217 | SPBC2D10.20_ubc1_II_ubiquitin | 6 | + | 98 | 54.209552 | False |
2297 | 0.409781 | 2.900000e-172 | 738 | 5.787546 | SPAC10F6.04_1213255_1216120_1_SPAC10F6.04_I_pr... | 259 | - | 218 | 227 | SPAC10F6.05c_ubc6_I_ubiquitin | 9 | + | 1190 | 629.631221 | False |
2298 | -0.875529 | 5.500000e-43 | 213 | 5.787546 | SPAC10F6.04_1213255_1216120_1_SPAC10F6.04_I_pr... | 2608 | - | 71 | 600 | SPAC10F6.03c_cts1_I_CTP | 0 | + | 375 | 200.172741 | False |
2299 | -1.313539 | 6.900000e+01 | 399 | 5.787546 | SPAC10F6.04_1213255_1216120_1_SPAC10F6.04_I_pr... | 265 | - | 104 | 147 | SPBC119.02_ubc4_II_ubiquitin | 7 | + | 97 | 53.682609 | False |
2300 | -1.322990 | 6.200000e+02 | 135 | 5.787546 | SPAC10F6.04_1213255_1216120_1_SPAC10F6.04_I_pr... | 259 | - | 47 | 160 | SPBC1198.09_ubc16_II_ubiquitin | 7 | + | 91 | 50.520951 | False |
2301 | 1.164817 | 0.000000e+00 | 2724 | 5.611926 | SPAC10F6.09c_1220969_1224862_-1_psm3_I_protein... | 26 | + | 908 | 1194 | SPAC10F6.09c_psm3_I_mitotic | 0 | + | 4965 | 2618.840748 | False |
2302 | -0.971476 | 2.600000e-33 | 2184 | 5.611926 | SPAC10F6.09c_1220969_1224862_-1_psm3_I_protein... | 5 | + | 743 | 1324 | SPBC146.03c_cut3_II_condensin | 116 | + | 314 | 168.029222 | False |
2303 | -1.091300 | 3.000000e-21 | 642 | 5.611926 | SPAC10F6.09c_1220969_1224862_-1_psm3_I_protein... | 26 | + | 221 | 1172 | SPBP4H10.06c_cut14_II_condensin | 0 | + | 238 | 127.981560 | False |
2304 rows × 15 columns
# Fit `gnb` on the two features (q_len, E), using the RBH flag cast to int as
# the class label, then predict on the very same rows it was trained on.
# NOTE(review): `gnb` is presumably a GaussianNB instance created in an
# earlier cell -- confirm. `pred` is not read by any statement below.
pred = gnb.fit(bh_df[['q_len', 'E']], bh_df.RBH.astype(int)).predict(bh_df[['q_len', 'E']])
# Build a square evaluation grid spanning [-5, 15] on both axes; get_grid
# returns the mesh coordinates plus the classifier's prediction at each point.
# NOTE(review): the grid is computed with `svc_clf`, not the `gnb` model fitted
# just above -- confirm which classifier's decision regions this figure is
# meant to show.
xx, yy, zz = get_grid(-5, 15, svc_clf)
# NOTE(review): `figsize` is presumably the helper injected by `%pylab inline`
# that sets the default figure size -- confirm.
figsize(12,8)
# Filled contour of the per-grid-point predictions (the predicted-class regions).
plt.contourf(xx, yy, zz, cmap=plt.cm.Paired, alpha=0.8)
# Overlay the observations: q_len on x, E on y, coloured by the RBH label
# (cast to int) with the same colormap as the contour.
plt.scatter(bh_df['q_len'], bh_df['E'], c=bh_df.RBH.astype(int), cmap=plt.cm.Paired)
# Clamp both axes to the extent of the evaluation grid.
plt.xlim(xx.min(), xx.max())
plt.ylim(yy.min(), yy.max())
(-5.0, 15.0)