From 32d10c9a1a51a69f613802c5aa19b8db9ce39932 Mon Sep 17 00:00:00 2001 From: Schneider Leo <leo.schneider@etu.ec-lyon.fr> Date: Thu, 3 Oct 2024 15:01:03 +0200 Subject: [PATCH] main change --- data_exploration.py | 11 +++++++++++ data_viz.py | 12 ++++++------ 2 files changed, 17 insertions(+), 6 deletions(-) diff --git a/data_exploration.py b/data_exploration.py index f74f487..0999118 100644 --- a/data_exploration.py +++ b/data_exploration.py @@ -1,6 +1,7 @@ import numpy as np import matplotlib.pyplot as plt import matplotlib +import pandas as pd matplotlib.use('agg') length = 30 @@ -284,3 +285,13 @@ def RT_distrib(Y, f_name): # RT_distrib(Y_validation,'fig/histo_RT_validation.png' ) # # +#ISA DATA + +df = pd.read_pickle('database/data_ISA_aligned_prosit.pkl') +seq = df['Sequence'].unique() +# rt = df['Retention time'] +df_mean = df.groupby(['Sequence'])['Retention time'].mean() +# feq_aa(seq, plot=False, save=True, f_name='fig/histo_aa_ISA_unique.png') +# dist_long(seq, plot=False, save=True, f_name='fig/histo_length_ISA_unique.png') + +RT_distrib(df_mean, 'fig/histo_RT_ISA_unique.png') diff --git a/data_viz.py b/data_viz.py index b655f79..ff1665f 100644 --- a/data_viz.py +++ b/data_viz.py @@ -254,7 +254,7 @@ def add_length(dataframe): dataframe['length']=dataframe['seq'].map(fonc) -df = pd.read_csv('output/out_common_ISA_ISA_eval_2.csv') +# df = pd.read_csv('output/out_common_ISA_ISA_eval_2.csv') # add_length(df) # df['abs_error'] = np.abs(df['rt pred']-df['true rt']) # histo_abs_error(df, display=False, save=True, path='fig/custom model res/histo_ISA_ISA_eval.png') @@ -275,11 +275,11 @@ df = pd.read_csv('output/out_common_ISA_ISA_eval_2.csv') # scatter_rt(df, display=False, save=True, path='fig/custom model res/RT_pred_prosit_ISA_eval.png', color=True) # histo_length_by_error(df, bins=10, display=False, save=True, path='fig/custom model res/histo_length_prosit_ISA_eval.png') -# df = pd.read_csv('output/out_common_ISA_ISA_eval_3.csv') +# df = pd.read_csv('output/out_common_ISA_prosit_eval.csv') # add_length(df) # df['abs_error'] = np.abs(df['rt pred']-df['true rt']) -# histo_abs_error(df, display=False, save=True, path='fig/custom model res/histo_ISA_ISA_eval_3.png') -# scatter_rt(df, display=False, save=True, path='fig/custom model res/RT_pred_ISA_ISA_eval_3_file.png', color=True, col = 'file') -# histo_length_by_error(df, bins=10, display=False, save=True, path='fig/custom model res/histo_length_ISA_ISA_eval_3.png') - +# histo_abs_error(df, display=False, save=True, path='fig/custom model res/histo_ISA_prosit_eval.png') +# scatter_rt(df, display=False, save=True, path='fig/custom model res/RT_pred_ISA_prosit_eval.png', color=True, col = 'seq') +# histo_length_by_error(df, bins=10, display=False, save=True, path='fig/custom model res/histo_length_ISA_prosit_eval.png') +# -- GitLab