auxiliary.py

import sys
import json
import numpy as np
import pickle,os,torch
import data_loader as dl
from utils import prepare_transfer_learning as ptl
from utils import embeddings_interface as ei

ei.__check_prepared__()

#Should be shifted to some other locations
def load_inverse_relation(COMMON_DATA_DIR):
    """
        Function used once to load the relations dictionary
        (which keeps the log of IDified relations, their uri and other things.)

    :param relation_file: str
    :return: dict
    """

    if sys.version_info[0] == 3:
        relations = pickle.load(open(os.path.join(COMMON_DATA_DIR, 'relations.pickle'), 'rb'), encoding='latin1')
    else:
        relations = pickle.load(open(os.path.join(COMMON_DATA_DIR, 'relations.pickle'),'rb'))
    inverse_relations = {}
    for key in relations:
        value = relations[key]
        new_key = value[0]
        value[0] = key
        inverse_relations[new_key] = value

    return inverse_relations


#Loads word list from given COMMON_DATA_DIR. To be used by FlatEncoder.
def load_word_list(COMMON_DATA_DIR):
    print("NOT IMPLEMENTED FUNCTIONALITY NOT IMPLEMENTED FUNCTIONALITY !!!")
    return {}
    # if sys.version_info[0] == 3:
    #     word_list = pickle.load(open(COMMON_DATA_DIR + '/glove.300d.words','rb'), encoding='bytes')
    # else:
    #     word_list = pickle.load(open(COMMON_DATA_DIR + '/glove.300d.words','rb'))
    # word_to_id = {}
    # for index, word in enumerate(word_list):
    #     word_to_id[word] = index
    # return word_to_id


def save_location(problem, model_name, dataset):
    '''
            Location - data/models/problem/model_name/dataset/0X
            problem - core_chain
                    -intent
                    -rdf
                    -type_existence
            model_name - cnn_dense_dense ; pointwise_cnn_dense_dense ....

            dataset -
            return a dir data/models/problem/model_name/dataset/0X
    '''
    # Check if the path exists or not. If not create one.
    assert (problem in ['core_chain', 'intent', 'rdf_class', 'rdf_type'])
    assert (dataset in ['qald', 'lcquad', 'transfer-a', 'transfer-b', 'transfer-c', 'qg', 'transfer-d', 'qg_customcopy'
                        , 'qg_copy'])

    path = 'data/models/' + str(problem) + '/' + str(model_name) + '/' + str(dataset)
    if not os.path.exists(path):
        os.makedirs(path)
    dir_name = [int(name) for name in os.listdir(path + '/')]
    if not dir_name:
        new_path_dir = path + '/' + str(0)
        os.mkdir(new_path_dir)
        new_model = 0
    else:
        dir_name = max(dir_name)
        new_model = dir_name + 1
        new_path_dir = path + '/' + str(new_model)
        os.mkdir(new_path_dir)
    return new_path_dir


# Function to save the model
def save_model(loc, modeler, model_name='model.torch', epochs=0, optimizer=None, accuracy=0,aux_save_information={}):
    """
        Input:
            loc: str of the folder where the models are to be saved - data/models/core_chain/cnn_dense_dense/lcquad/5'
            models: dict of 'model_name': model_object
            epochs, optimizers are int, torch.optims (discarded right now).
    """

    state = {
        'epoch': epochs,
        'optimizer': optimizer.state_dict(),
        # 'state_dict': model.state_dict(),
        'accuracy': accuracy
    }
    for tup in modeler.prepare_save():
        state[tup[0]] = tup[1].state_dict()
    aux_save = loc + '/model_info.pickle'
    loc = loc + '/' + model_name
    print("model with accuracy ", accuracy, "stored at", loc)
    torch.save(state, loc)

    _aux_save_information = aux_save_information.copy()
    try:
        _aux_save_information['parameter_dict'].pop('vectors')
    except KeyError:
        print("in model save, no vectors were found.")
        pass
    pickle.dump(_aux_save_information,open(aux_save, 'wb+'))


# def validation_accuracy(valid_questions, valid_pos_paths, valid_neg_paths, valid_pos_paths_rel1, valid_pos_paths_rel2, valid_neg_paths_rel1, valid_neg_paths_rel2, modeler, device):
#     precision = []
#     with torch.no_grad():
#         for i in range(len(valid_questions)):
#             question = np.repeat(valid_questions[i].reshape(1, -1), len(valid_neg_paths[i]) + 1,
#                                  axis=0)  # +1 for positive path
#             # paths = np.vstack((valid_pos_paths[i].reshape(1, -1), valid_neg_paths[i]))
#             paths = np.vstack((valid_neg_paths[i],valid_pos_paths[i].reshape(1, -1)))
#             paths_rel1 = np.vstack((valid_neg_paths_rel1[i],valid_pos_paths_rel1[i].reshape(1, -1)))
#             paths_rel2 = np.vstack((valid_neg_paths_rel2[i],valid_pos_paths_rel2[i].reshape(1, -1)))
#             question = torch.tensor(question, dtype=torch.long, device=device)
#             paths = torch.tensor(paths, dtype=torch.long, device=device)
#             paths_rel1 = torch.tensor(paths_rel1, dtype = torch.long, device=device)
#             paths_rel2 = torch.tensor(paths_rel2, dtype = torch.long, device=device)
#             score = modeler.predict(question, paths, paths_rel1, paths_rel2, device)
#             arg_max = torch.argmax(score)
#             if arg_max.item() == len(paths)-1:  # 0 is the positive path index
#                 precision.append(1)
#             else:
#                 precision.append(0)
#     return sum(precision) * 1.0 / len(precision)


def validation_accuracy_old(valid_questions, valid_pos_paths, valid_neg_paths,  modeler, device, *path_rel):

    if path_rel:
        if len(path_rel) == 4:
            valid_pos_paths_rel1, valid_pos_paths_rel2, valid_neg_paths_rel1, valid_neg_paths_rel2 = path_rel[0],path_rel[1],path_rel[2],path_rel[3]
        else:
            valid_pos_paths_rel1, valid_pos_paths_rel2, \
            valid_pos_paths_rel1_randomvec, valid_pos_paths_rel2_randomvec, \
            valid_neg_paths_rel1, valid_neg_paths_rel2, \
            valid_neg_paths_rel1_randomvec, valid_neg_paths_rel2_randomvec    = path_rel[0], \
                                                                                                     path_rel[1], \
                                                                                                     path_rel[2], \
                                                                                                     path_rel[3], \
                                                                                path_rel[4], path_rel[5], path_rel[6], \
                                                                                path_rel[7]
    precision = []
    with torch.no_grad():
        print(len(valid_questions))
        for i in range(len(valid_questions)):

            vnp,valid_index = np.unique(valid_neg_paths[i],axis=0,return_index=True)
            if path_rel:
                vnr1 = [valid_neg_paths_rel1[i][ind] for ind in valid_index ]
                vnr2 = [valid_neg_paths_rel2[i][ind] for ind in valid_index ]
                if len(path_rel) > 4:
                    vnr1_randomvec = [valid_neg_paths_rel1_randomvec[i][ind] for ind in valid_index]
                    vnr2_randomvec = [valid_neg_paths_rel2_randomvec[i][ind] for ind in valid_index]
            # paths = np.vstack((valid_pos_paths[i].reshape(1, -1), valid_neg_paths[i]))
            paths = np.vstack((vnp,valid_pos_paths[i].reshape(1, -1)))
            question = np.repeat(valid_questions[i].reshape(1, -1), len(vnp) + 1,
                                 axis=0)  # +1 for positive path

            if path_rel:
                paths_rel1 = np.vstack((vnr1,valid_pos_paths_rel1[i].reshape(1, -1)))
                paths_rel2 = np.vstack((vnr2,valid_pos_paths_rel2[i].reshape(1, -1)))

                if len(path_rel) > 4:
                    paths_rel1_randomvec = np.vstack((vnr1_randomvec, valid_pos_paths_rel1[i].reshape(1, -1)))
                    paths_rel2_randomvec = np.vstack((vnr2_randomvec, valid_pos_paths_rel2[i].reshape(1, -1)))


            #introducing delay here. Code repeat
            # doing it for constructing tensors as late as possible

            if True:
                print(f"question.shape {question.shape}, paths shape is {paths.shape}, "
                      f"paths_rel1 shape is {paths_rel1.shape},"
                      f" paths_rel2_randomvec shape is {paths_rel2_randomvec.shape} ")

            if path_rel:
                paths_rel1 = torch.tensor(paths_rel1, dtype=torch.long, device=device)
                paths_rel2 = torch.tensor(paths_rel2, dtype=torch.long, device=device)
                if len(path_rel) > 4:
                    paths_rel1_randomvec = torch.tensor(paths_rel1_randomvec, dtype=torch.long, device=device)
                    paths_rel2_randomvec = torch.tensor(paths_rel2_randomvec, dtype=torch.long, device=device)


            question = torch.tensor(question, dtype=torch.long, device=device)
            paths = torch.tensor(paths, dtype=torch.long, device=device)


            '''
                To write a distributed version
            '''
            if path_rel:
                if len(path_rel) == 4:
                    score = modeler.predict(question, paths, paths_rel1, paths_rel2, device)
                else:
                    score = modeler.predict(question,paths,paths_rel1,paths_rel1_randomvec,
                                            paths_rel2,paths_rel2_randomvec,device)
            else:
                score = modeler.predict(question, paths, device)
            arg_max = torch.argmax(score)
            if arg_max.item() == len(paths)-1:  # 0 is the positive path index
                precision.append(1)
            else:
                precision.append(0)
        print(precision)
    return sum(precision) * 1.0 / len(precision)


def tensorized_score(question, paths, modeler, device, path_rel=[]):
    '''
        Converts the np matrices to tensor, calculates the score and returns bool.

    :return:
    '''
    # print(1, len(paths), len(question))
    with torch.no_grad():
        if path_rel:
            if len(path_rel) == 4:
                paths_rel1, paths_rel2,paths_rel1_randomvec,paths_rel2_randomvec = path_rel
            else:
                paths_rel1, paths_rel2 = path_rel

        if path_rel:
            paths_rel1 = torch.tensor(paths_rel1, dtype=torch.long, device=device)
            paths_rel2 = torch.tensor(paths_rel2, dtype=torch.long, device=device)
            if len(path_rel) == 4:
                paths_rel1_randomvec = torch.tensor(paths_rel1_randomvec, dtype=torch.long, device=device)
                paths_rel2_randomvec = torch.tensor(paths_rel2_randomvec, dtype=torch.long, device=device)

        question = torch.tensor(question, dtype=torch.long, device=device)
        paths = torch.tensor(paths, dtype=torch.long, device=device)

        '''
            To write a distributed version
        '''
        if path_rel:
            if len(path_rel) == 2:
                score = modeler.predict(question, paths, paths_rel1, paths_rel2, device)
                del paths_rel1
                del paths_rel2
            else:
                score = modeler.predict(question, paths, paths_rel1, paths_rel1_randomvec,
                                        paths_rel2, paths_rel2_randomvec, device)
                del paths_rel1
                del paths_rel2
                del paths_rel1_randomvec
                del paths_rel2_randomvec
        else:
            score = modeler.predict(question, paths, device)


        arg_max = torch.argmax(score)
        if arg_max.item() == len(paths) - 1:  # 0 is the positive path index
            del question
            del paths
            return True
        else:
            del question
            del paths
            return False


def validation_accuracy(valid_questions, valid_pos_paths, valid_neg_paths,  modeler, device, *path_rel):

    if path_rel:
        if len(path_rel) == 4:
            valid_pos_paths_rel1, valid_pos_paths_rel2, valid_neg_paths_rel1, valid_neg_paths_rel2 = path_rel[0],path_rel[1],path_rel[2],path_rel[3]
        else:
            valid_pos_paths_rel1, valid_pos_paths_rel2, \
            valid_pos_paths_rel1_randomvec, valid_pos_paths_rel2_randomvec, \
            valid_neg_paths_rel1, valid_neg_paths_rel2, \
            valid_neg_paths_rel1_randomvec, valid_neg_paths_rel2_randomvec    = path_rel[0], \
                                                                                                     path_rel[1], \
                                                                                                     path_rel[2], \
                                                                                                     path_rel[3], \
                                                                                path_rel[4], path_rel[5], path_rel[6], \
                                                                                path_rel[7]
    precision = []
    with torch.no_grad():
        # print(len(valid_questions))
        c = 0
        for i in range(len(valid_questions)):
            # i = i + 304
            # c = c + 1
            # print(i)
            vnp,valid_index = np.unique(valid_neg_paths[i],axis=0,return_index=True)
            # print(c,len(valid_index))
            if path_rel:
                vnr1 = [valid_neg_paths_rel1[i][ind] for ind in valid_index ]
                vnr2 = [valid_neg_paths_rel2[i][ind] for ind in valid_index ]
                if len(path_rel) > 4:
                    vnr1_randomvec = [valid_neg_paths_rel1_randomvec[i][ind] for ind in valid_index]
                    vnr2_randomvec = [valid_neg_paths_rel2_randomvec[i][ind] for ind in valid_index]
            # paths = np.vstack((valid_pos_paths[i].reshape(1, -1), valid_neg_paths[i]))
            # print(valid_pos_paths[i].reshape(1, -1))
            paths = np.vstack((vnp,valid_pos_paths[i].reshape(1, -1)))
            question = np.repeat(valid_questions[i].reshape(1, -1), len(vnp) + 1,
                                 axis=0)  # +1 for positive path

            if path_rel:
                paths_rel1 = np.vstack((vnr1,valid_pos_paths_rel1[i].reshape(1, -1)))
                paths_rel2 = np.vstack((vnr2,valid_pos_paths_rel2[i].reshape(1, -1)))

                if len(path_rel) > 4:
                    paths_rel1_randomvec = np.vstack((vnr1_randomvec, valid_pos_paths_rel1[i].reshape(1, -1)))
                    paths_rel2_randomvec = np.vstack((vnr2_randomvec, valid_pos_paths_rel2[i].reshape(1, -1)))


            #introducing delay here. Code repeat
            # doing it for constructing tensors as late as possible
            distributed = True
            if distributed:
                #split it into K clusters and then pass it through tesnorized_score function
                def distribute_it(np_array,k):
                    # print(len(np_array))
                    _temp = np.array_split(np_array[:-1],k,axis=0)
                    # if True:
                    #     print(np_array[-1])
                    #     print(np.vstack([_temp[0],np_array[-1]]).shape )
                    #     print(np.vstack([_temp[0], np_array[-1]])[-1])
                    return [np.vstack([p,np_array[-1]]) for p in _temp]

                k = 20
                paths_split = distribute_it(paths,k=k)
                # raise IOError
                question_split = distribute_it(question,k=k)
                if path_rel:
                    paths_rel1_split = distribute_it(paths_rel1,k)
                    paths_rel2_split = distribute_it(paths_rel2,k)

                    if len(path_rel) > 4:
                        paths_rel1_randomvec_split = distribute_it(paths_rel1_randomvec,k)
                        paths_rel2_randomvec_split = distribute_it(paths_rel2_randomvec,k)
                        score = [tensorized_score(question=x[0], paths=x[1], modeler=modeler,
                                                  device=device,path_rel = [x[2],x[3],x[4],x[5]] ) for x in zip(
                            question_split,paths_split,paths_rel1_split,paths_rel2_split,
                            paths_rel1_randomvec_split,paths_rel2_randomvec_split)]
                    else:
                        score = [tensorized_score(question=x[0], paths=x[1], modeler=modeler,
                                                  device=device, path_rel=[x[2], x[3]]) for x in zip(
                            question_split, paths_split, paths_rel1_split, paths_rel2_split)]
                else:
                    score = [tensorized_score(question=x[0], paths=x[1], modeler=modeler,
                                              device=device) for x in zip(
                        question_split, paths_split)]


                # print(score)
                if False in score:
                    precision.append(0)
                else:
                    precision.append(1)

            else:

                # if True:
                #     print(f"question.shape {question.shape}, paths shape is {paths.shape}, "
                #           f"paths_rel1 shape is {paths_rel1.shape},"
                #           f" paths_rel2_randomvec shape is {paths_rel2_randomvec.shape} ")

                if path_rel:
                    paths_rel1 = torch.tensor(paths_rel1, dtype=torch.long, device=device)
                    paths_rel2 = torch.tensor(paths_rel2, dtype=torch.long, device=device)
                    if len(path_rel) > 4:
                        paths_rel1_randomvec = torch.tensor(paths_rel1_randomvec, dtype=torch.long, device=device)
                        paths_rel2_randomvec = torch.tensor(paths_rel2_randomvec, dtype=torch.long, device=device)


                question = torch.tensor(question, dtype=torch.long, device=device)
                paths = torch.tensor(paths, dtype=torch.long, device=device)


                '''
                    To write a distributed version
                '''
                if path_rel:
                    if len(path_rel) == 4:
                        score = modeler.predict(question, paths, paths_rel1, paths_rel2, device)
                    else:
                        score = modeler.predict(question,paths,paths_rel1,paths_rel1_randomvec,
                                                paths_rel2,paths_rel2_randomvec,device)
                else:
                    score = modeler.predict(question, paths, device)
                arg_max = torch.argmax(score)
                if arg_max.item() == len(paths)-1:  # -1 is the positive path index
                    precision.append(1)
                else:
                    precision.append(0)
            # print(precision)
        print(sum(precision) * 1.0 / len(precision))
    return sum(precision) * 1.0 / len(precision)


def validation_accuracy_alter(valid_questions, valid_pos_paths, valid_neg_paths, modeler, device, qa):
    precision = []

    print(valid_pos_paths.shape)
    print(valid_neg_paths.shape)
    print(valid_questions.shape)


    for i in range(len(valid_questions)):

        question = valid_questions[i]
        paths = np.vstack((valid_pos_paths[i].reshape(1, -1), valid_neg_paths[i]))

        score = qa._predict_corechain(question, paths)
        arg_max = np.argmax(score)
        if arg_max.item() == 0:  # 0 is the positive path index
            precision.append(1)
        else:
            precision.append(0)

    return sum(precision) * 1.0 / len(precision)


def id_to_word(path, gloveid_to_word, remove_pad = True):
    '''


    :param path: embedding id arrray list
    :param gloveid_to_word:
    :param embeddingid_to_gloveid:
    :param remove_pad:
    :return:
    '''
    sent = []
    for q in path:
        try:
            w = gloveid_to_word[q]
            if w != '<MASK>' and remove_pad:
                sent.append(w)
        except:
            sent.append('<unk>')
    return " ".join(sent)


def load_embeddingid_gloveid(embedding='ulmfit'):
    '''
        Loads required dictionary files for id_to_word functionality
    '''

    word_to_gloveid = ei.vocab
    # location_gl = './resources/vocab_gl.pickle'
    # location_um = './resources/vocab_ul.pickle'
    # if embedding == 'ulmfit':
    #     location = location_um
    # elif embedding == 'glove':
    #     location = location_gl
    #
    # if sys.version_info[0] == 3:
    #
    #     word_to_gloveid = pickle.load(open(location,'rb'),encoding='latin1')
    # else:
    #     word_to_gloveid = pickle.load(open(location, 'rb'))

    gloveid_to_word = {}
    for keys in word_to_gloveid:
        gloveid_to_word[word_to_gloveid[keys]] = keys
    return word_to_gloveid, gloveid_to_word


def load_embeddingid_gloveid_legacy():
    '''
        Loads required dictionary files for id_to_word functionality
    '''
    if sys.version_info[0] == 3:
        gloveid_to_embeddingid = pickle.load(open('data/data/common/vocab.pickle','rb'),encoding='bytes')
    else:
        gloveid_to_embeddingid = pickle.load(open('data/data/common/vocab.pickle','rb'))
    # reverse vocab it
    embeddingid_to_gloveid = {}
    for keys in gloveid_to_embeddingid:
        embeddingid_to_gloveid[gloveid_to_embeddingid[keys]] = keys

    if sys.version_info[0] == 3:
        word_to_gloveid = pickle.load(open('./resources/glove_vocab.pickle','rb'),encoding='latin1')
    else:
        word_to_gloveid = pickle.load(open('./resources/glove_vocab.pickle', 'rb'))

    gloveid_to_word = {}
    for keys in word_to_gloveid:
        gloveid_to_word[word_to_gloveid[keys]] = keys
    return gloveid_to_embeddingid , embeddingid_to_gloveid, word_to_gloveid, gloveid_to_word

def to_bool(value):
    if str(value) == 'true' or str(value) == 'True':
        return True
    else:
        return False


def load_data(_dataset, _train_over_validation, _parameter_dict, _relations, _pointwise,_device,k=-1):

    ###### This is where we can add the question generation to have lcquad as test case.
    '''


    :param _dataset:
    :param _train_over_validation:
    :param _parameter_dict:
    :param _relations:
    :param _pointwise:
    :param _device:
    :param k:
    :return:

    '''
    TEMP = data_loading_parameters(_dataset, _parameter_dict)

    _dataset_specific_data_dir,_model_specific_data_dir,_file,\
               _max_sequence_length,_neg_paths_per_epoch_train,_neg_paths_per_epoch_validation,_training_split,_validation_split,_index= TEMP

    _a = dl.load_data(_dataset, _dataset_specific_data_dir, _model_specific_data_dir, _file, _max_sequence_length,
                      _neg_paths_per_epoch_train,
                      _neg_paths_per_epoch_validation, _relations,
                      _index, _training_split, _validation_split, _model='core_chain_pairwise', _pairwise=not _pointwise, _debug=True, _rdf=False,k=k)

    data = {}

#   if _dataset == 'lcquad':
#        train_questions, train_pos_paths, train_neg_paths, dummy_y_train,\
#        valid_questions, valid_pos_paths, valid_neg_paths, dummy_y_valid, test_questions, test_pos_paths, test_neg_paths,vectors = _a

    dataset = ['lcquad','qg','qg_copy','qg_customcopy', 'transfer-d']
    if _dataset not in dataset:
        print("warning: Test accuracy would not be calculated as the data has not been prepared.")

#        train_questions, train_pos_paths, train_neg_paths, dummy_y_train, valid_questions, valid_pos_paths, valid_neg_paths, dummy_y_valid, vectors = _a
#        test_questions,test_neg_paths,test_pos_paths = None,None,None

        data['test_pos_paths'] = None
        data['test_pos_paths_rel1_sp'] = None
        data['test_pos_paths_rel2_sp'] = None
        data['test_pos_paths_rel1_rd'] = None
        data['test_pos_paths_rel2_rd'] = None

        data['test_neg_paths'] = None
        data['test_neg_paths_rel1_sp'] = None
        data['test_neg_paths_rel2_sp'] = None
        data['test_neg_paths_rel1_rd'] = None
        data['test_neg_paths_rel2_rd'] = None

        data['test_questions'] = None
        # data['test_entity'] = None

    else:
        data['test_pos_paths'] = _a['test_pos_paths']
        data['test_pos_paths_rel1_sp'] = _a['test_pos_paths_rel1_sp']
        data['test_pos_paths_rel2_sp'] = _a['test_pos_paths_rel2_sp']
        data['test_pos_paths_rel1_rd'] = _a['test_pos_paths_rel1_rd']
        data['test_pos_paths_rel2_rd'] = _a['test_pos_paths_rel2_rd']


        data['test_neg_paths'] = _a['test_neg_paths']
        data['test_neg_paths_rel1_sp'] = _a['test_neg_paths_rel1_sp']
        data['test_neg_paths_rel2_sp'] = _a['test_neg_paths_rel2_sp']
        data['test_neg_paths_rel1_rd'] = _a['test_neg_paths_rel1_rd']
        data['test_neg_paths_rel2_rd'] = _a['test_neg_paths_rel2_rd']


        data['test_questions'] = _a['test_questions']
        # data['test_entity'] = _a['test_entity']
    #

    if _train_over_validation:
        data['train_questions'] = np.vstack((_a['train_questions'], _a['valid_questions']))
        # data['train_entity'] = np.vstack((_a['train_entity'], _a['valid_entity']))

        data['train_pos_paths'] = np.vstack((_a['train_pos_paths'], _a['valid_pos_paths']))
        data['train_pos_paths_rel1_sp'] = np.vstack((_a['train_pos_paths_rel1_sp'],_a['valid_pos_paths_rel1_sp']))
        data['train_pos_paths_rel2_sp'] = np.vstack((_a['train_pos_paths_rel2_sp'],_a['valid_pos_paths_rel2_sp']))
        data['train_pos_paths_rel1_rd'] = np.vstack((_a['train_pos_paths_rel1_rd'],_a['valid_pos_paths_rel1_rd']))
        data['train_pos_paths_rel2_rd'] = np.vstack((_a['train_pos_paths_rel2_rd'],_a['valid_pos_paths_rel2_rd']))


        data['train_neg_paths'] = np.vstack((_a['train_neg_paths'], _a['valid_neg_paths']))
        data['train_neg_paths_rel1_sp'] = np.vstack((_a['train_neg_paths_rel1_sp'],_a['valid_neg_paths_rel1_sp']))
        data['train_neg_paths_rel2_sp'] = np.vstack((_a['train_neg_paths_rel2_sp'], _a['valid_neg_paths_rel2_sp']))
        data['train_neg_paths_rel1_rd'] = np.vstack((_a['train_neg_paths_rel1_rd'], _a['valid_neg_paths_rel1_rd']))
        data['train_neg_paths_rel2_rd'] = np.vstack((_a['train_neg_paths_rel2_rd'], _a['valid_neg_paths_rel1_rd']))

    else:
        data['train_questions'] = _a['train_questions']
        # data['train_entity'] = _a['train_entity']

        data['train_pos_paths'] = _a['train_pos_paths']
        data['train_pos_paths_rel1_sp'] = _a['train_pos_paths_rel1_sp']
        data['train_pos_paths_rel2_sp'] = _a['train_pos_paths_rel2_sp']
        data['train_pos_paths_rel1_rd'] = _a['train_pos_paths_rel1_rd']
        data['train_pos_paths_rel2_rd'] = _a['train_pos_paths_rel2_rd']


        data['train_neg_paths'] = _a['train_neg_paths']
        data['train_neg_paths_rel1_sp'] = _a['train_neg_paths_rel1_sp']
        data['train_neg_paths_rel2_sp'] = _a['train_neg_paths_rel2_sp']
        data['train_neg_paths_rel1_rd'] = _a['train_neg_paths_rel1_rd']
        data['train_neg_paths_rel2_rd'] = _a['train_neg_paths_rel2_rd']


    data['valid_questions'] = _a['valid_questions']
    # data['valid_entity'] = _a['valid_entity']

    data['valid_pos_paths'] = _a['valid_pos_paths']
    data['valid_pos_paths_rel1_sp'] = _a['valid_pos_paths_rel1_sp']
    data['valid_pos_paths_rel2_sp'] = _a['valid_pos_paths_rel2_sp']
    data['valid_pos_paths_rel1_rd'] = _a['valid_pos_paths_rel1_rd']
    data['valid_pos_paths_rel2_rd'] = _a['valid_pos_paths_rel2_rd']

    data['valid_neg_paths'] = _a['valid_neg_paths']
    data['valid_neg_paths_rel1_sp'] = _a['valid_neg_paths_rel1_sp']
    data['valid_neg_paths_rel2_sp'] = _a['valid_neg_paths_rel2_sp']
    data['valid_neg_paths_rel1_rd'] = _a['valid_neg_paths_rel1_rd']
    data['valid_neg_paths_rel2_rd'] = _a['valid_neg_paths_rel2_rd']

    data['vectors'] = _a['vectors']
    data['dummy_y'] = torch.ones(_parameter_dict['batch_size'], device=_device)

    return data


def data_loading_parameters(dataset,parameter_dict,runtime=False):

    if dataset == 'lcquad':
        _dataset_specific_data_dir = 'data/data/lcquad/'
        _model_specific_data_dir = 'data/data/core_chain_pairwise/lcquad/'
        _file = 'id_big_data.json'
        _max_sequence_length = parameter_dict['max_length']
        _neg_paths_per_epoch_train = parameter_dict['_neg_paths_per_epoch_train']
        _neg_paths_per_epoch_validation = parameter_dict['_neg_paths_per_epoch_validation']
        _training_split = .7
        _validation_split = .8
        _index = None

    elif dataset == 'qg':
        _dataset_specific_data_dir = 'data/data/qg/'
        _model_specific_data_dir = 'data/data/core_chain_pairwise/qg/'
        _file = 'id_big_data.json'
        _max_sequence_length = parameter_dict['max_length']
        _neg_paths_per_epoch_train = parameter_dict['_neg_paths_per_epoch_train']
        _neg_paths_per_epoch_validation = parameter_dict['_neg_paths_per_epoch_validation']
        _training_split = .7
        _validation_split = .8
        _index = None

    elif dataset == 'qg_copy':
        _dataset_specific_data_dir = 'data/data/qg_copy/'
        _model_specific_data_dir = 'data/data/core_chain_pairwise/qg_copy/'
        _file = 'id_big_data.json'
        _max_sequence_length = parameter_dict['max_length']
        _neg_paths_per_epoch_train = parameter_dict['_neg_paths_per_epoch_train']
        _neg_paths_per_epoch_validation = parameter_dict['_neg_paths_per_epoch_validation']
        _training_split = .7
        _validation_split = .8
        _index = None

    elif dataset == 'qg_customcopy':
        _dataset_specific_data_dir = 'data/data/qg_customcopy/'
        _model_specific_data_dir = 'data/data/core_chain_pairwise/qg_customcopy/'
        _file = 'id_big_data.json'
        _max_sequence_length = parameter_dict['max_length']
        _neg_paths_per_epoch_train = parameter_dict['_neg_paths_per_epoch_train']
        _neg_paths_per_epoch_validation = parameter_dict['_neg_paths_per_epoch_validation']
        _training_split = .7
        _validation_split = .8
        _index = None

    elif dataset == 'qald':
        _dataset_specific_data_dir = 'data/data/qald/'
        _model_specific_data_dir = 'data/data/core_chain_pairwise/qald/'
        if not runtime:
            _file = 'combined_qald.json'
            id_train = json.load(
                open(os.path.join(_dataset_specific_data_dir % {'dataset': dataset}, "qald_id_big_data_train.json")))
            json.dump(id_train, open(os.path.join(_dataset_specific_data_dir % {'dataset': dataset}, _file), 'w+'))
        else:
            _file = 'qald_id_big_data_test.json'


        _max_sequence_length = parameter_dict['max_length']
        _neg_paths_per_epoch_train = parameter_dict['_neg_paths_per_epoch_train']
        _neg_paths_per_epoch_validation = parameter_dict['_neg_paths_per_epoch_validation']
        _training_split = .7
        _validation_split = .8
        if not runtime:
            _index = int(7.0 * (len(id_train)) / 8.0) - 1
        else:
            _index = -1


    elif dataset == 'transfer-a':
        _data_dir = 'data/data/'
        _dataset_specific_data_dir = 'data/data/transfer-a/'
        _model_specific_data_dir = 'data/data/core_chain_pairwise/transfer-a/'
        _max_sequence_length = parameter_dict['max_length']
        _neg_paths_per_epoch_train = parameter_dict['_neg_paths_per_epoch_train']
        _neg_paths_per_epoch_validation = parameter_dict['_neg_paths_per_epoch_validation']
        _training_split = .7
        _validation_split = .8
        _file, _index = ptl.transfer_a()

    elif dataset == 'transfer-b':
        _data_dir = 'data/data/'
        _dataset_specific_data_dir = 'data/data/transfer-b/'
        _model_specific_data_dir = 'data/data/core_chain_pairwise/transfer-b/'
        _max_sequence_length = parameter_dict['max_length']
        _neg_paths_per_epoch_train = parameter_dict['_neg_paths_per_epoch_train']
        _neg_paths_per_epoch_validation = parameter_dict['_neg_paths_per_epoch_validation']
        _training_split = .7
        _validation_split = .8
        _file, _index = ptl.transfer_b()

    elif dataset == 'transfer-c':
        _data_dir = 'data/data/'
        _dataset_specific_data_dir = 'data/data/transfer-c/'
        _model_specific_data_dir = 'data/data/core_chain_pairwise/transfer-c/'
        _max_sequence_length = parameter_dict['max_length']
        _neg_paths_per_epoch_train = parameter_dict['_neg_paths_per_epoch_train']
        _neg_paths_per_epoch_validation = parameter_dict['_neg_paths_per_epoch_validation']
        _training_split = .7
        _validation_split = .8
        _file, _index = ptl.transfer_c()

    elif dataset == 'transfer-d':
        _data_dir = 'data/data/'
        _dataset_specific_data_dir = 'data/data/transfer-d/'
        _model_specific_data_dir = 'data/data/core_chain_pairwise/transfer-d/'
        _max_sequence_length = parameter_dict['max_length']
        _neg_paths_per_epoch_train = parameter_dict['_neg_paths_per_epoch_train']
        _neg_paths_per_epoch_validation = parameter_dict['_neg_paths_per_epoch_validation']
        _training_split = .7
        _validation_split = .8
        _file, _index = ptl.transfer_d()

    elif dataset == 'transfer-proper-qald':
        print("the functionality is still not supported. Kill few kittens to get it to work or give me an ice cream")

    return _dataset_specific_data_dir,_model_specific_data_dir,_file,\
           _max_sequence_length,_neg_paths_per_epoch_train,_neg_paths_per_epoch_validation,_training_split,_validation_split,_index