Compare_energy_results.py 3.28 KB
from math import sqrt, ceil
import numpy as np
import matplotlib.pyplot as plt
import re
import seaborn as sns
import pandas as pd
import matplotlib.pylab as plt

# Retrieve for each rna the best value for MEA and compare this energy value with the one obtains with
# RNAeval and RNAfold from the ViennaRNA Package 2.0 (Ronny Lorentz et al., 2011)
# After getting those values, it will creates a figure.
def get_result_MEA(filename):
    ext = "json_pmE"
    file2 = open( "/mnt/c/Users/natha/Documents/IBISC/biorseo2/biorseo/results/" + filename + ext, "r")

    name = file2.readline()
    rna = file2.readline()
    twod = file2.readline()
    pred = re.findall(r'\S+', twod)

    score = '-' + pred[len(pred)-1]
    min = float(score)
    contacts = file2.readline()
    while twod:
        twod = file2.readline()
        pred = re.findall(r'\S+', twod)
        if len(pred) > 0:
            score = '-' + pred[len(pred) - 1]
            if float(score) < min:
                min = float(score)
        contacts = file2.readline()
    file2.close()
    return min

fileMFE = open( "/mnt/c/Users/natha/Documents/IBISC/biorseo2/biorseo/RNAfold_bm.log", "r")
lineRna = fileMFE.readline()
lineStruct = fileMFE.readline()

fileEval = open( "/mnt/c/Users/natha/Documents/IBISC/biorseo2/biorseo/RNAeval_bm.log", "r")
lineRna2 = fileEval.readline()
lineStruct2 = fileEval.readline()

file = open("/mnt/c/Users/natha/Documents/IBISC/biorseo2/biorseo/data/modules/ISAURE/Motifs_version_initiale/benchmark.dbn", "r")
name = file.readline().strip()
rna = file.readline()
twod = file.readline()
contacts = file.readline()
list_name = []
list_score = []
list_type = []
print(np)
while name:
    #print(name)
    if lineRna != rna:
        while lineRna != rna:
            lineRna = fileMFE.readline()
            lineStruct = fileMFE.readline()
    MFE = float(lineStruct[len(lineStruct)-8:len(lineStruct)-2])
    list_name.append(name[5:len(name)-1])
    list_score.append(MFE)
    list_type.append('MFE')
    #print("MFE:" + str(MFE))
    lineRna = fileMFE.readline()
    lineStruct = fileMFE.readline()

    if lineRna2 != rna:
        while lineRna2 != rna:
            lineRna2 = fileEval.readline()
            lineStruct2 = fileEval.readline()
    eval = float(lineStruct2[len(lineStruct2)-8:len(lineStruct2)-2])
    list_name.append(name[5:len(name) - 1])
    list_score.append(eval)
    list_type.append('eval')
    #print("Eval:" + str(eval))
    lineRna2 = fileEval.readline()
    lineStruct2 = fileEval.readline()

    best_mea = get_result_MEA(name)
    #print("MEA: " + str(best_mea) + "\n")
    list_name.append(name[5:len(name) - 1])
    list_score.append(best_mea)
    list_type.append('MEA')
    name = file.readline().strip()
    rna = file.readline()
    twod = file.readline()
    contacts = file.readline()

file.close()
fileMFE.close()
fileEval.close()

'''print(list_MFE)
print(list_MEA)
print(list_eval)'''

#np = [["rna", "type_score", "score"]]
d = {'rna':list_name,'score':list_score, 'type_score':list_type}
df = pd.DataFrame(d, columns=['rna','type_score','score'])

sns.stripplot(x="rna",y="score",data=df,jitter=True,hue='type_score',palette='Set1')
plt.xticks(rotation=90)
plt.savefig("compare_BiORSEOMEA_RNAeval_RNAfold.png")