import sys
sys.path.append("../")
from param_config import config
from gen_info import gen_info
from combine_feat import combine_feat, SimpleTransform

if __name__ == "__main__":

    feat_names = [

        ##############
        ## Query id ##
        ##############
        ("qid", SimpleTransform()),

        ################
        ## Word count ##
        ################
        ('count_of_query_unigram', SimpleTransform(config.count_feat_transform)
         ),
        ('count_of_unique_query_unigram',
         SimpleTransform(config.count_feat_transform)),
        ('ratio_of_unique_query_unigram', SimpleTransform()),
        ('count_of_query_bigram',
         SimpleTransform(config.count_feat_transform)),
        ('count_of_unique_query_bigram',
         SimpleTransform(config.count_feat_transform)),
        ('ratio_of_unique_query_bigram', SimpleTransform()),
        ('count_of_query_trigram',
         SimpleTransform(config.count_feat_transform)),
        ('count_of_unique_query_trigram',
# Example #2
0
import sys
sys.path.append("../")
from param_config import config
from gen_info import gen_info
from combine_feat import combine_feat, SimpleTransform

if __name__ == "__main__":

    # Name of the feature folder passed to gen_info (and to combine_feat,
    # when that call is re-enabled at the bottom of the script).
    feat_folder = "LSA_and_stats_feat_May03_CV_random"

    def count_transform():
        """Return a new SimpleTransform built from config.count_feat_transform."""
        return SimpleTransform(config.count_feat_transform)

    # List of (feature name, transform) pairs. A fresh transform instance is
    # created for every entry, in list order. As the script stands, this list
    # is only referenced by the commented-out combine_feat call below.
    feat_names = [

        ################
        ## Word count ##
        ################
        # question1 unigrams
        ("count_of_question1_unigram", count_transform()),
        ("count_of_unique_question1_unigram", count_transform()),
        ("ratio_of_unique_question1_unigram", SimpleTransform()),
        # question1 bigrams
        ("count_of_question1_bigram", count_transform()),
        ("count_of_unique_question1_bigram", count_transform()),
        ("ratio_of_unique_question1_bigram", SimpleTransform()),
        # question1 trigrams
        ("count_of_question1_trigram", count_transform()),
        ("count_of_unique_question1_trigram", count_transform()),
        ("ratio_of_unique_question1_trigram", SimpleTransform()),
        # digits in question1
        ("count_of_digit_in_question1", count_transform()),

        # Disabled entries (kept for reference):
        # ('question1_bow_common_vocabulary_question2_bow_common_vocabulary_bow_common_svd100_cosine_sim', SimpleTransform()),
        # ('question1_bow_common_vocabulary_question2_bow_common_vocabulary_bow_common_svd150_cosine_sim', SimpleTransform()),

        # ('question1_tfidf_common_vocabulary_individual_svd100', SimpleTransform()),
        # ('question2_tfidf_common_vocabulary_individual_svd100', SimpleTransform()),
        # ('question1_tfidf_common_vocabulary_individual_svd150', SimpleTransform()),
        # ('question2_tfidf_common_vocabulary_individual_svd150', SimpleTransform()),

        # ('question1_bow_common_vocabulary_individual_svd100', SimpleTransform()),
        # ('question2_bow_common_vocabulary_individual_svd100', SimpleTransform()),
        # ('question1_bow_common_vocabulary_individual_svd150', SimpleTransform()),
        # ('question2_bow_common_vocabulary_individual_svd150', SimpleTransform()),

        #########################
        ## Cooccurrence TF-IDF ##
        #########################
        # All entries in this section are currently disabled.
        # ('question1_unigram_question2_unigram', SimpleTransform()),
        # ('question1_unigram_question2_bigram', SimpleTransform()),
        # ('question1_bigram_question2_unigram', SimpleTransform()),
        # ('question1_bigram_question2_bigram', SimpleTransform()),

        ######################
        ## word match share ##
        ######################
        ("ratio_of_question1_question2_unigram_share", SimpleTransform()),
        ("ratio_of_question1_question2_unigram_share_tfidf", SimpleTransform()),
    ]

    # Only gen_info is executed; the combine step is intentionally left
    # commented out, as in the original script.
    gen_info(feat_path_name=feat_folder)
    # combine_feat(feat_names, feat_path_name=feat_folder)
# Example #4
0
import sys
sys.path.append("../")
from param_config import config
from gen_info import gen_info
from combine_feat import combine_feat, SimpleTransform

if __name__ == "__main__":

    feat_names = [

        ################
        ## Word count ##
        ################
        ('count_of_question1_unigram',
         SimpleTransform(config.count_feat_transform)),
        # ('count_of_unique_question1_unigram', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question1_unigram', SimpleTransform()),
        ('count_of_question1_bigram',
         SimpleTransform(config.count_feat_transform)),
        # ('count_of_unique_question1_bigram', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question1_bigram', SimpleTransform()),
        ('count_of_question1_trigram',
         SimpleTransform(config.count_feat_transform)),
        ('count_of_unique_question1_trigram',
         SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question1_trigram', SimpleTransform()),

        # ('count_of_digit_in_question1', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_digit_in_question1', SimpleTransform()),
        ('count_of_question2_unigram',
# Example #5
0
import sys
sys.path.append("../")
from param_config import config
from gen_info import gen_info
from combine_feat import combine_feat, SimpleTransform

            
if __name__ == "__main__":

    feat_names = [

        ################
        ## Word count ##
        ################
        ('count_of_question1_unigram', SimpleTransform(config.count_feat_transform)),
        # ('count_of_unique_question1_unigram', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question1_unigram', SimpleTransform()),

        ('count_of_question1_bigram', SimpleTransform(config.count_feat_transform)),
        # ('count_of_unique_question1_bigram', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question1_bigram', SimpleTransform()),

        ('count_of_question1_trigram', SimpleTransform(config.count_feat_transform)),
        ('count_of_unique_question1_trigram', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question1_trigram', SimpleTransform()),

        # ('count_of_digit_in_question1', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_digit_in_question1', SimpleTransform()),

        ('count_of_question2_unigram', SimpleTransform(config.count_feat_transform)),
# Example #6
0
from param_config import config
from combine_feat import combine_feat, SimpleTransform

if __name__ == "__main__":

    feat_names = [

        ##############
        ## Query id ##
        ##############
        #        ("qid", SimpleTransform()),

        ################
        ## Question   ##
        ################
        ('q1_who', SimpleTransform()),
        ('q2_who', SimpleTransform()),
        ('who_both', SimpleTransform()),
        ('q1_where', SimpleTransform()),
        ('q2_where', SimpleTransform()),
        ('where_both', SimpleTransform()),
        ('q1_when', SimpleTransform()),
        ('q2_when', SimpleTransform()),
        ('when_both', SimpleTransform()),
        ('q1_why', SimpleTransform()),
        ('q2_why', SimpleTransform()),
        ('why_both', SimpleTransform()),
        ('question1_can', SimpleTransform()),
        ('question2_can', SimpleTransform()),
        ('question1_could', SimpleTransform()),
        ('question2_could', SimpleTransform()),
# Example #7
0
import sys
sys.path.append("../")
from param_config import config
from gen_info import gen_info
from combine_feat import combine_feat, SimpleTransform

if __name__ == "__main__":

    feat_names = [

        ################
        ## Word count ##
        ################
        ('count_of_question1_unigram',
         SimpleTransform(config.count_feat_transform)),
        ('count_of_unique_question1_unigram',
         SimpleTransform(config.count_feat_transform)),
        ('ratio_of_unique_question1_unigram', SimpleTransform()),
        ('count_of_question1_bigram',
         SimpleTransform(config.count_feat_transform)),
        ('count_of_unique_question1_bigram',
         SimpleTransform(config.count_feat_transform)),
        ('ratio_of_unique_question1_bigram', SimpleTransform()),
        ('count_of_question1_trigram',
         SimpleTransform(config.count_feat_transform)),
        ('count_of_unique_question1_trigram',
         SimpleTransform(config.count_feat_transform)),
        ('ratio_of_unique_question1_trigram', SimpleTransform()),
        ('count_of_digit_in_question1',
         SimpleTransform(config.count_feat_transform)),
"""

import sys
sys.path.append("../")
from param_config import config
from gen_info import gen_info
from combine_feat import combine_feat, SimpleTransform

            
if __name__ == "__main__":

    feat_names = [

        # ## id feat
        ("qid", SimpleTransform()),

        ################
        ## Word count ##
        ################
        ('count_of_query_unigram', SimpleTransform(config.count_feat_transform)),
        ('count_of_unique_query_unigram', SimpleTransform(config.count_feat_transform)),
        ('ratio_of_unique_query_unigram', SimpleTransform()),
        ('count_of_query_bigram', SimpleTransform(config.count_feat_transform)),
        ('count_of_unique_query_bigram', SimpleTransform(config.count_feat_transform)),
        ('ratio_of_unique_query_bigram', SimpleTransform()),
        ('count_of_query_trigram', SimpleTransform(config.count_feat_transform)),
        ('count_of_unique_query_trigram', SimpleTransform(config.count_feat_transform)),
        ('ratio_of_unique_query_trigram', SimpleTransform()),
        ('count_of_digit_in_query', SimpleTransform(config.count_feat_transform)),
        ('ratio_of_digit_in_query', SimpleTransform()),
# Example #9
0
import sys
sys.path.append("../")
from param_config import config
from gen_info import gen_info
from combine_feat import combine_feat, SimpleTransform

            
if __name__ == "__main__":

    feat_names = [

        ################
        ## Word count ##
        ################
        ('count_of_question1_unigram', SimpleTransform(config.count_feat_transform)),
        ('count_of_unique_question1_unigram', SimpleTransform(config.count_feat_transform)),
        ('ratio_of_unique_question1_unigram', SimpleTransform()),

        ('count_of_question1_bigram', SimpleTransform(config.count_feat_transform)),
        ('count_of_unique_question1_bigram', SimpleTransform(config.count_feat_transform)),
        ('ratio_of_unique_question1_bigram', SimpleTransform()),

        ('count_of_question1_trigram', SimpleTransform(config.count_feat_transform)),
        ('count_of_unique_question1_trigram', SimpleTransform(config.count_feat_transform)),
        ('ratio_of_unique_question1_trigram', SimpleTransform()),

        ('count_of_digit_in_question1', SimpleTransform(config.count_feat_transform)),
        ('ratio_of_digit_in_question1', SimpleTransform()),

        ('count_of_question2_unigram', SimpleTransform(config.count_feat_transform)),
# Example #10
0
        ## Word count ##
        ################
        # ('count_of_question1_unigram', SimpleTransform(config.count_feat_transform)),
        # ('count_of_unique_question1_unigram', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question1_unigram', SimpleTransform()),

        # ('count_of_question1_bigram', SimpleTransform(config.count_feat_transform)),
        # ('count_of_unique_question1_bigram', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question1_bigram', SimpleTransform()),

        # ('count_of_question1_trigram', SimpleTransform(config.count_feat_transform)),
        # ('count_of_unique_question1_trigram', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question1_trigram', SimpleTransform()),

        # ('count_of_digit_in_question1', SimpleTransform(config.count_feat_transform)),
        ('ratio_of_digit_in_question1', SimpleTransform()),

        # ('count_of_question2_unigram', SimpleTransform(config.count_feat_transform)),
        # ('count_of_unique_question2_unigram', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question2_unigram', SimpleTransform()),

        # ('count_of_question2_bigram', SimpleTransform(config.count_feat_transform)),
        # ('count_of_unique_question2_bigram', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question2_bigram', SimpleTransform()),

        # ('count_of_question2_trigram', SimpleTransform(config.count_feat_transform)),
        # ('count_of_unique_question2_trigram', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question2_trigram', SimpleTransform()),

        # ('count_of_digit_in_question2', SimpleTransform(config.count_feat_transform)),
        ('ratio_of_digit_in_question2', SimpleTransform()),
# Example #11
0
import sys
sys.path.append("../")
from param_config import config
from gen_info import gen_info
from combine_feat import combine_feat, SimpleTransform

if __name__ == "__main__":

    feat_names = [

        ################
        ## Word count ##
        ################
        ('count_of_question1_unigram',
         SimpleTransform(config.count_feat_transform)),
        # ('count_of_unique_question1_unigram', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question1_unigram', SimpleTransform()),
        ('count_of_question1_bigram',
         SimpleTransform(config.count_feat_transform)),
        # ('count_of_unique_question1_bigram', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question1_bigram', SimpleTransform()),
        ('count_of_question1_trigram',
         SimpleTransform(config.count_feat_transform)),
        ('count_of_unique_question1_trigram',
         SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_unique_question1_trigram', SimpleTransform()),

        # ('count_of_digit_in_question1', SimpleTransform(config.count_feat_transform)),
        # ('ratio_of_digit_in_question1', SimpleTransform()),
        ('count_of_question2_unigram',