Create the output directory before pickling the processed dataset, and
default use_evolutionary to False in train.py and transfer_learning_train.py
(per the inline comment, True requires hhblits and a sequence database).

NOTE(review): this patch was recovered from a whitespace-collapsed copy, so
line breaks follow the hunk line counts but the indentation of context lines
is reconstructed -- confirm against the target files, or apply with
`git apply --ignore-whitespace`.
NOTE(review): the pipelines.py hunk was amended in review (makedirs fallback
plus a comment line), so the post-image blob id on its index line is stale.

diff --git a/preprocessing/pipelines.py b/preprocessing/pipelines.py
index cdbf61b..9d35af9 100644
--- a/preprocessing/pipelines.py
+++ b/preprocessing/pipelines.py
@@ -199,6 +199,8 @@ class Pipeline():
         print('Saving processed dataset...')
         t = time.time()
         env = {'inputs': inputs, 'outputs': outputs,'failed_samples':failed_samples}
+        # os.path.dirname() returns '' for a bare filename and os.makedirs('') raises; fall back to '.'.
+        os.makedirs(os.path.dirname(location_processed_dataset) or '.', exist_ok=True)
         io_utils.save_pickle(
             env, location_processed_dataset)
         print('Processed dataset saved (t=%.f s)' % (time.time() - t))
diff --git a/train.py b/train.py
index d40c6a6..c32467b 100644
--- a/train.py
+++ b/train.py
@@ -77,7 +77,7 @@ if __name__ == '__main__':
     '''
     check = False # Check = True to verify installation, =False for full training.
     train = True # True to retrain, False to evaluate the model shown in paper.
-    use_evolutionary = True # True to use evolutionary information (requires hhblits and a sequence database), False otherwise.
+    use_evolutionary = False # True to use evolutionary information (requires hhblits and a sequence database), False otherwise.
     Lmax_aa = 256 if check else 1024
     '''
     Maximum length of the protein sequences.
diff --git a/transfer_learning_train.py b/transfer_learning_train.py
index 90b42a5..6676522 100644
--- a/transfer_learning_train.py
+++ b/transfer_learning_train.py
@@ -21,7 +21,7 @@ if __name__ == '__main__':
     train = True # True to retrain, False to evaluate the model shown in paper.
     transfer = True # If False, retrain from scratch.
     freeze = False # If True, evaluate the binding site network without fine tuning.
-    use_evolutionary = True # True to use evolutionary information (requires hhblits and a sequence database), False otherwise.
+    use_evolutionary = False # True to use evolutionary information (requires hhblits and a sequence database), False otherwise.
     Lmax_aa = 256 if check else 2120
     '''
     Lmax_aa is the maximum length of the protein sequences.