wn18_run.py

#import scipy.io

import efe
from efe.exp_generators import *
import efe.tools as tools

if __name__ =="__main__":

	#Load data, ensure that data is at path: 'path'/'name'/[train|valid|test].txt
	wn18exp = build_data(name = 'wn18',path = tools.cur_path + '/datasets/')


	#SGD hyper-parameters:
	params = Parameters(learning_rate = 0.5, 
						max_iter = 1000, 
						batch_size = int(len(wn18exp.train.values) / 100),  #Make 100 batches
						neg_ratio = 1, 
						valid_scores_every = 50,
						learning_rate_policy = 'adagrad',
						contiguous_sampling = False )

	#Here each model is identified by its name, i.e. the string of its class name in models.py
	#Parameters given here are the best ones for each model, validated from the grid-search described in the paper
	all_params = { "Complex_Logistic_Model" : params } ; emb_size = 150; lmbda =0.03;
	#all_params = { "DistMult_Logistic_Model" : params } ; emb_size = 200; lmbda =0.003; params.learning_rate = 1.0
	#all_params = { "CP_Logistic_Model" : params } ; emb_size = 100; lmbda =0.1; 
	#all_params = { "Rescal_Logistic_Model" : params } ; emb_size = 50; lmbda =0.1
	#all_params = { "TransE_L2_Model" : params } ; emb_size = 200; lmbda = 0.5 ; params.learning_rate=0.01


	tools.logger.info( "Learning rate: " + str(params.learning_rate))
	tools.logger.info( "Max iter: " + str(params.max_iter))
	tools.logger.info( "Generated negatives ratio: " + str(params.neg_ratio))
	tools.logger.info( "Batch size: " + str(params.batch_size))


	#Then call a local grid search, here only with one value of rank and regularization
	wn18exp.grid_search_on_all_models(all_params, embedding_size_grid = [emb_size], lmbda_grid = [lmbda], nb_runs = 1)

	#Print best averaged metrics:
	wn18exp.print_best_MRR_and_hits()

	#Print best averaged metrics per relation:
	wn18exp.print_best_MRR_and_hits_per_rel()


	#Save ComplEx embeddings (last trained model, not best on grid search if multiple embedding sizes and lambdas)
	#e1 = wn18exp.models["Complex_Logistic_Model"][0].e1.get_value(borrow=True)
	#e2 = wn18exp.models["Complex_Logistic_Model"][0].e2.get_value(borrow=True)
	#r1 = wn18exp.models["Complex_Logistic_Model"][0].r1.get_value(borrow=True)
	#r2 = wn18exp.models["Complex_Logistic_Model"][0].r2.get_value(borrow=True)
	#scipy.io.savemat('complex_embeddings.mat', \
	#		{'entities_real' : e1, 'relations_real' : r1, 'entities_imag' : e2, 'relations_imag' : r2  })