Skip to content
Snippets Groups Projects
Commit bea45844 authored by Schneider Leo
Browse files

datasets

parent 46c06035
No related branches found
No related tags found
No related merge requests found
...@@ -165,17 +165,18 @@ def load_data(path_train, path_val, path_test, batch_size, length, pad=False, co ...@@ -165,17 +165,18 @@ def load_data(path_train, path_val, path_test, batch_size, length, pad=False, co
return train_loader, val_loader, test_loader return train_loader, val_loader, test_loader
if __name__ =='__main__' : if __name__ =='__main__' :
irt_train = np.load('data/intensity/irt_train.npy') pass
seq_train = np.load('data/intensity/sequence_train.npy') # irt_train = np.load('data/intensity/irt_train.npy')
charge_train = np.load('data/intensity/precursor_charge_train.npy') # seq_train = np.load('data/intensity/sequence_train.npy')
spectra_train = np.load('data/intensity/intensity_train.npy') # charge_train = np.load('data/intensity/precursor_charge_train.npy')
# spectra_train = np.load('data/intensity/intensity_train.npy')
# #
# irt_holdout = np.load('data/intensity/irt_holdout.npy') # irt_holdout = np.load('data/intensity/irt_holdout.npy')
# seq_holdout = np.load('data/intensity/sequence_holdout.npy') # seq_holdout = np.load('data/intensity/sequence_holdout.npy')
# charge_holdout = np.load('data/intensity/precursor_charge_holdout.npy') # charge_holdout = np.load('data/intensity/precursor_charge_holdout.npy')
# spectra_holdout = np.load('data/intensity/intensity_holdout.npy') # spectra_holdout = np.load('data/intensity/intensity_holdout.npy')
# #
dataset_train = pd.DataFrame({'Sequence':list(seq_train), 'Retention time':list(irt_train), 'Charge':list(charge_train), 'Spectra' : list(spectra_train)},index=list(range(6787933))) # dataset_train = pd.DataFrame({'Sequence':list(seq_train), 'Retention time':list(irt_train), 'Charge':list(charge_train), 'Spectra' : list(spectra_train)},index=list(range(6787933)))
dataset_train.to_pickle('database/data_prosit_merged_train.pkl') # dataset_train.to_pickle('database/data_prosit_merged_train.pkl')
# dataset_test = pd.DataFrame({'Sequence':list(seq_holdout), 'Retention time':list(irt_holdout), 'Charge':list(charge_holdout), 'Spectra' : list(spectra_holdout)},index=list(range(754215))) # dataset_test = pd.DataFrame({'Sequence':list(seq_holdout), 'Retention time':list(irt_holdout), 'Charge':list(charge_holdout), 'Spectra' : list(spectra_holdout)},index=list(range(754215)))
# dataset_test.to_pickle('database/data_prosit_merged_holdout.pkl') # dataset_test.to_pickle('database/data_prosit_merged_holdout.pkl')
\ No newline at end of file
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment