state.py

from collections import OrderedDict

def prototype_state():
    state = {} 
     
    # Random seed
    state['seed'] = 1234
    
    # Logging level
    state['level'] = 'DEBUG'

    state['oov'] = '<unk>'
    state['len_sample'] = 40
    
    # These are end-of-sequence marks
    state['start_sym_sentence'] = '<s>'
    state['end_sym_sentence'] = '</s>'
    state['end_sym_triple'] = '</t>'
    
    state['unk_sym'] = 0
    state['eot_sym'] = 3
    state['eos_sym'] = 2
    state['sos_sym'] = 1
    
    state['maxout_out'] = False
    state['deep_out'] = True

    # ----- ACTIV ---- 
    state['sent_rec_activation'] = 'lambda x: T.tanh(x)'
    state['triple_rec_activation'] = 'lambda x: T.tanh(x)'
    
    state['decoder_bias_type'] = 'all' # first, or selective 

    state['sent_step_type'] = 'gated'
    state['triple_step_type'] = 'gated' 
    
    # ----- SIZES ----
    # Dimensionality of hidden layers
    state['qdim'] = 512
    # Dimensionality of triple hidden layer 
    state['sdim'] = 1000
    # Dimensionality of low-rank approximation
    state['rankdim'] = 256

    # Threshold to clip the gradient
    state['cutoff'] = 1.
    state['lr'] = 0.0001

    # Early stopping configuration
    state['patience'] = 5
    state['cost_threshold'] = 1.003
     
    # ----- TRAINING METHOD -----
    # Choose optimization algorithm
    state['updater'] = 'adam'  
    # Maximum sequence length / trim batches
    state['seqlen'] = 80
    # Batch size
    state['bs'] = 80
    # Sort by length groups of  
    state['sort_k_batches'] = 20
   
    # Maximum number of iterations
    state['max_iters'] = 10
    # Modify this in the prototype
    state['save_dir'] = './'
    
    # ----- TRAINING PROCESS -----
    # Frequency of training error reports (in number of batches)
    state['train_freq'] = 10
    # Validation frequency
    state['valid_freq'] = 5000
    # Number of batches to process
    state['loop_iters'] = 3000000
    # Maximum number of minutes to run
    state['time_stop'] = 24*60*31
    # Error level to stop at
    state['minerr'] = -1

    # ----- EVALUATION PROCESS -----
    state['track_extrema_validation_samples'] = True # If set to true will print the extrema (lowest and highest log-likelihood scoring) validation samples
    state['track_extrema_samples_count'] = 100 # Set of extrema samples to track
    state['print_extrema_samples_count'] = 5 # Number of extrema samples to print (chosen at random from the extrema sets)

    state['compute_mutual_information'] = True # If true, the empirical mutural information will be calculcated on the validation set


    return state

def prototype_test():
    state = prototype_state()
    
    # Fill your paths here! 
    state['train_triples'] = "./tests/data/ttrain.triples.pkl"
    state['test_triples'] = "./tests/data/ttest.triples.pkl"
    state['valid_triples'] = "./tests/data/tvalid.triples.pkl"
    state['dictionary'] = "./tests/data/ttrain.dict.pkl"
    state['save_dir'] = "./tests/models/"
    
    # Handle bleu evaluation
    state['bleu_evaluation'] = "./tests/bleu/bleu_evaluation"
    state['bleu_context_length'] = 2


    # Validation frequency
    state['valid_freq'] = 50
    
    # Varia
    state['prefix'] = "testmodel_" 
    state['updater'] = 'adam'
    
    state['maxout_out'] = False
    state['deep_out'] = True
     
    # If out of memory, modify this!
    state['bs'] = 80
    state['use_nce'] = True
    state['decoder_bias_type'] = 'all' #'selective' 
    
    state['qdim'] = 50 
    # Dimensionality of triple hidden layer 
    state['sdim'] = 100
    # Dimensionality of low-rank approximation
    state['rankdim'] = 25
    return state

def prototype_moviedic():
    state = prototype_state()
    
    # Fill your paths here! 
    state['train_triples'] = "Data/Training.triples.pkl"
    state['test_triples'] = "Data/Test.triples.pkl"
    state['valid_triples'] = "Data/Validation.triples.pkl"
    state['dictionary'] = "Data/Training.dict.pkl" 
    state['save_dir'] = "Output" 
    
    # Handle bleu evaluation
    state['bleu_evaluation'] = "Data/Validation_Shuffled_Dataset.txt"
    state['bleu_context_length'] = 2
    
    # Validation frequency
    state['valid_freq'] = 5000
    
    # Varia
    state['prefix'] = "MovieScriptModel_" 
    state['updater'] = 'adam'
    
    state['maxout_out'] = True
    state['deep_out'] = True
     
    # If out of memory, modify this!
    state['bs'] = 80
    state['use_nce'] = False
    state['decoder_bias_type'] = 'all' # Choose between 'first', 'all' and 'selective' 

    # Increase sequence length to fit movie dialogues better
    state['seqlen'] = 160

    state['qdim'] = 600
    # Dimensionality of triple hidden layer 
    state['sdim'] = 300
    # Dimensionality of low-rank approximation
    state['rankdim'] = 300
    return state