# nn-training/train_all_classification_task.py

import os
import random
import argparse
import time

import pandas
import pickle

import sys
sys.path.append('../code')
# sys.path.append('./code')
from nn_models import ConvModel, RecurrentModel, ConvModel_new, RecurrentModel_new
from nn_train_utils import *
from path_utils import PATH_TO_DATA, PATH_TO_OLD

def load_df(model_type, arch_type):
    """Load the table of networks to train for one model family and architecture.

    The pickle that is read is
    ``PATH_TO_OLD + '/classification/ALL_' + arch_type + <suffix>``, where the
    suffix depends on ``model_type``:

    - ``'conv'``     -> ``'_seed.p'``
    - ``'conv_new'`` -> ``'_newhyp_seed.p'``
    - ``'rec'``      -> ``'_new_seed_mod1.p'``
    - ``'rec_new'``  -> ``'_newhyp_seed.p'``

    Inputs:
    - model_type: one of 'conv', 'conv_new', 'rec', 'rec_new'
    - arch_type: architecture name; used both in the file name and to filter
      the rows (column 'arch_type' for convolutional models, column
      'rec_blocktype' for recurrent ones)

    Outputs:
    - best_models_arch: rows of the loaded dataframe matching ``arch_type``
    - key_trained: name of the column to set when training is finished

    Raises:
    - ValueError: if ``model_type`` is not one of the supported values
    """
    suffix_by_type = {
        'conv_new': '_newhyp_seed.p',
        'conv': '_seed.p',
        'rec': '_new_seed_mod1.p',
        'rec_new': '_newhyp_seed.p',
    }
    try:
        suffix = suffix_by_type[model_type]
    except KeyError:
        # Fail with a clear message instead of an UnboundLocalError further down.
        raise ValueError(
            f'Unknown model type {model_type!r}; expected one of {sorted(suffix_by_type)}'
        ) from None

    table_path = PATH_TO_OLD + '/classification/ALL_' + arch_type + suffix

    # NOTE: unpickling can execute arbitrary code; only load tables produced
    # by this project.
    # The context manager closes the file handle once the table is loaded.
    with open(table_path, 'rb') as handle:
        all_models = pickle.load(handle)

    if model_type in ('conv_new', 'conv'):
        arch_column = 'arch_type'
        key_trained = 'is_trained'
    else:
        arch_column = 'rec_blocktype'
        # NOTE(review): recurrent tables use 'is_training' while convolutional
        # ones use 'is_trained' -- confirm this naming difference is intended.
        key_trained = 'is_training'

    best_models_arch = all_models[all_models[arch_column] == arch_type]
    return best_models_arch, key_trained

def save_df(best_models_arch, model_type, arch_type):
    """Pickle the updated dataframe back to the file it was loaded from.

    The destination is
    ``PATH_TO_OLD + '/classification/ALL_' + arch_type + <suffix>``, where the
    suffix depends on ``model_type``:

    - ``'conv'``     -> ``'_seed.p'``
    - ``'conv_new'`` -> ``'_newhyp_seed.p'``
    - ``'rec'``      -> ``'_new_seed_mod1.p'``
    - ``'rec_new'``  -> ``'_newhyp_seed.p'``

    Inputs:
    - best_models_arch: dataframe to write (its ``to_pickle`` method is used)
    - model_type: one of 'conv', 'conv_new', 'rec', 'rec_new'
    - arch_type: architecture name used in the file name

    Raises:
    - ValueError: if ``model_type`` is not one of the supported values.
      Previously an unknown type silently skipped the save.
    """
    suffix_by_type = {
        'conv_new': '_newhyp_seed.p',
        'conv': '_seed.p',
        'rec': '_new_seed_mod1.p',
        'rec_new': '_newhyp_seed.p',
    }
    try:
        suffix = suffix_by_type[model_type]
    except KeyError:
        raise ValueError(
            f'Unknown model type {model_type!r}; expected one of {sorted(suffix_by_type)}'
        ) from None

    best_models_arch.to_pickle(PATH_TO_OLD + '/classification/ALL_' + arch_type + suffix)
    return

def _build_model(model_type, arch_type, exp_id, latents):
    """Instantiate the network described by one row of the hyperparameter table.

    Inputs:
    - model_type: one of 'conv', 'conv_new', 'rec', 'rec_new'
    - arch_type: passed as ``arch_type`` (conv models) or ``rec_blocktype``
      (recurrent models)
    - exp_id: experiment id forwarded as ``experiment_id``
    - latents: one dataframe row holding the hyperparameters read below

    Raises:
    - ValueError: if ``model_type`` is not one of the supported values
    """
    if model_type in ('conv', 'conv_new'):
        # Both convolutional variants take the same keyword arguments.
        conv_cls = ConvModel if model_type == 'conv' else ConvModel_new
        return conv_cls(
            experiment_id=exp_id,
            nclasses=20,
            arch_type=arch_type,
            nlayers=latents['nlayers'],
            n_skernels=latents['n_skernels'],
            n_tkernels=latents['n_tkernels'],
            s_kernelsize=latents['s_kernelsize'],
            t_kernelsize=latents['t_kernelsize'],
            s_stride=latents['s_stride'],
            t_stride=latents['t_stride'])

    if model_type == 'rec':
        return RecurrentModel(
            experiment_id=exp_id,
            nclasses=20,
            rec_blocktype=arch_type,
            n_recunits=latents['n_recunits'],
            npplayers=latents['npplayers'],
            nppfilters=latents['nppfilters'],
            s_kernelsize=latents['s_kernelsize'],
            s_stride=latents['s_stride'],
            seed=latents['seed'])

    if model_type == 'rec_new':
        return RecurrentModel_new(
            experiment_id=exp_id,
            nclasses=20,
            rec_blocktype=arch_type,
            n_reclayers=latents['n_reclayers'],
            n_recunits=latents['n_recunits'],
            npplayers=latents['npplayers'],
            nppfilters=latents['nppfilters'],
            s_kernelsize=latents['s_kernelsize'],
            s_stride=latents['s_stride'],
            seed=latents['seed'])

    raise ValueError(
        f"Unknown model type {model_type!r}; expected 'conv', 'conv_new', 'rec' or 'rec_new'")


def main(args):
    """Train the networks at positions [start_id, end_id) of the model table.

    Inputs:
    - args: parsed command-line arguments providing ``exp_id``, ``start_id``,
      ``end_id``, ``type`` (model type) and ``arch_type``

    For every selected row a model is built from the row's hyperparameters,
    trained, and then flagged as trained in the table, which is written back
    to disk after each model.
    """
    # Load dataset
    exp_id = args.exp_id

    train_data_path = os.path.join(PATH_TO_DATA, 'dataset_train_snap_scaled_fin1_10all.hdf5')
    val_data_path = os.path.join(PATH_TO_DATA, 'dataset_val_snap_scaled_fin1_10all.hdf5')
    train_data = Dataset(train_data_path, val_data_path, 'train', key='spindle_info')

    test_data_path = os.path.join(PATH_TO_DATA, 'dataset_test_snap_scaled_fin1_10all.hdf5')
    test_data = Dataset(test_data_path, dataset_type='test', key='spindle_info')

    start_id = args.start_id
    end_id = args.end_id
    model_type = args.type
    arch_type = args.arch_type

    best_models_arch, key_trained = load_df(model_type, arch_type)

    for i in range(start_id, end_id):
        print('---------------------------------')
        print('Training model: ', i)
        print('---------------------------------')

        # TODO: uncomment to skip models that are already flagged as trained.
        # if not best_models_arch.iloc[i][key_trained]:
        latents = best_models_arch.iloc[i]

        mymodel = _build_model(model_type, arch_type, exp_id, latents)

        print(mymodel.__dict__)

        intime = time.time()
        # Create trainer and train!
        mytrainer = Trainer(mymodel, train_data, test_data)
        if model_type == 'rec':
            mytrainer.train(num_epochs=70, learning_rate=1e-3, batch_size=512,
                            early_stopping_epochs=1, verbose=True, save_rand=True)
        else:
            mytrainer.train(num_epochs=50, batch_size=512, verbose=True, save_rand=True)
        outt = time.time()
        # Report progress relative to this run's range, not the absolute row position.
        print(f'Successfully trained model {i - start_id + 1} / {end_id - start_id} in {(outt-intime)/60} minutes.')

        # Re-read the table from disk before updating it.
        # NOTE(review): presumably so that changes written by other runs during
        # training are not overwritten -- confirm.
        best_models_arch, key_trained = load_df(model_type, arch_type)

        # The model was selected by position (iloc), so translate the position
        # into its index label before the label-based .at write; using `i`
        # directly as a label can flag the wrong row or append a new one when
        # the filtered table's index is not 0..n-1.
        row_label = best_models_arch.index[i]
        best_models_arch.at[row_label, key_trained] = True
        save_df(best_models_arch, model_type, arch_type)

    
if __name__ == '__main__':
    # Command-line entry point: declare the options, parse them, run training.
    cli = argparse.ArgumentParser(description='Training Convolutional Nets for PCR.')

    # (flag, value type, help text, default value)
    option_specs = (
        ('--type', str, 'Type of model', 'conv'),
        ('--arch_type', str, 'Architecture of specific model', 'spatial_temporal'),
        ('--exp_id', int, 'Experiment ID', 7003),
        ('--start_id', int, 'Id of net to start', 0),
        ('--end_id', int, 'Id of net to end', 5),
    )
    for flag, value_type, help_text, fallback in option_specs:
        cli.add_argument(flag, type=value_type, help=help_text, default=fallback)

    main(cli.parse_args())