store.py

import time
import pickle
import random
random.seed(1234)
import numpy as np
from tqdm import tqdm
from sklearn import preprocessing
import matplotlib.pyplot as plt
from metrics import jaccard, precision, jaccard_sim, print_all_metrics

from greedy import kMIQP as greedy_kMIQP
from gurobi import kMIQP as gurobi_kMIQP

 
min_max_scaler = preprocessing.MinMaxScaler()
def _preprocess(one_tuple):
  groundtruth, preds, scores = one_tuple

  #scores = np.exp(scores)
  #scores = min_max_scaler.fit_transform(np.reshape(scores, [-1, 1]))
  #scores = scores.flatten()

  M = []
  for i in range(len(preds)):
    for j in range(i+1, len(preds)):
      M.append((i, j, jaccard_sim(preds[i], preds[j])))
  return scores, M


def _watch_log(res):
  for one_tuple in res:
    r, M = _preprocess(one_tuple)
    vx, max_res = kMIQP(r, M, lamb=1.0, k=10, outputFlag=True)
    print(vx, max_res)
    break


def _watch_time_cost(res):
  start_time = time.time()
  T = 20
  for one_tuple in res[:T]:
    r, M = _preprocess(one_tuple)
    vx, max_res = kMIQP(r, M, lamb=1.0, k=10)
    print(vx, max_res)
  cost_time = time.time() - start_time
  print('User Per Second: %.4fs' % (cost_time / T))


def _watch_converge(res):
  random.shuffle(res)
  tqdmInput = tqdm(res, ncols=77, leave=True)
  prec, jacc = 0.0, 0.0
  for iter, one_tuple in enumerate(tqdmInput):
    r, M = _preprocess(one_tuple)
    vx, max_res = kMIQP(r, M, lamb=1.0, k=10)

    groundtruth, preds, scores = one_tuple
    preds = [preds[x] for x in vx]

    prec += precision(groundtruth, preds)
    jacc += jaccard(preds)

    tqdmInput.set_description('Prec@10: %.3f%% Div: %.3f'
        % (prec*100/(iter+1), jacc/(iter+1)))

def reduce_by_kMIQP(algoname,res, source_file, save_path=None):
    outputs = []
    k = 10
    pd=[]
    div=[]
    xa=[]
    for li in np.arange(0,1,0.05):
        lamb=li
        xa.append(lamb)
        for one_tuple in tqdm(res, ncols=77):
            r, M = _preprocess(one_tuple)
            if algoname=='greedy':
              vx, max_res = greedy_kMIQP(r, M, lamb, k=k)
            elif algoname=='gurobi':
              vx, max_res = gurobi_kMIQP(r, M, lamb, k=k)

            #vx, max_res = kMIQP(r, M, lamb, k=k)
            groundtruth, preds, scores = one_tuple
            preds = [preds[x] for x in vx]
            outputs.append((groundtruth, preds, max_res))
        if save_path is None:
            prec, jacc = 0.0, 0.0
            for groundtruth, preds, scores in outputs:
                preds=preds[:k]
                jacc += jaccard(preds)
                prec += precision(groundtruth, preds)
            pd.append(prec*100/len(outputs))
            div.append(jacc/len(outputs))
        else:
            with open(save_path, 'wb') as f:
                pickle.dump(outputs, f, pickle.HIGHEST_PROTOCOL)
    
    
    return xa,pd,div
  

if __name__ == '__main__':
  #source_file = 'res_steam_50.pkl'
  #source_file = 'res_ele_50.pkl'
  #source_file = 'res_clo_50.pkl'
  source_file = 'res_ali_50.pkl'
  target_file = None
  # target_file = 'res_ele_05_MIQP.pkl'
  with open(source_file, 'rb') as f:
    res = pickle.load(f)
 
  # _watch_log(res)
  # _watch_time_cost(res)
  # _watch_converge(res)
  '''
  greedy_x,greedy_p,greedy_div=reduce_by_kMIQP('greedy',res, source_file,target_file)
  print(greedy_x)
  print(greedy_p)
  print(greedy_div)
  '''
  
  gurobi_x,gurobi_p,gurobi_div=reduce_by_kMIQP('gurobi',res, source_file,target_file)
  print(gurobi_x)
  print(gurobi_p)
  print(gurobi_div)
  
'''
  with open('new_clo_k=10_0to1.pkl', 'wb') as f:
    pickle.dump(greedy_p, f, pickle.HIGHEST_PROTOCOL)
    pickle.dump(greedy_div, f, pickle.HIGHEST_PROTOCOL)
    pickle.dump(gurobi_p, f, pickle.HIGHEST_PROTOCOL)
    pickle.dump(gurobi_div, f, pickle.HIGHEST_PROTOCOL)
    '''