def create_index(self):
        try:
            self.start_time = time.time()
            if not os.path.exists("output"):
                os.makedirs("output")

            for i in range(0,self.num_files):
                print "Indexing File: " + str(i)
                length = 0
                content_start = 0
                content_end = 0
                index_counter = 0

                index = self.open_index_file(i)
                content = self.open_data_file(i)

                while content_end < len(content) and index_counter < len(index):
                    content_start = content_end
                    details = index[index_counter].split()

                    url = details[0]
                    length = int(details[3])
                    status = details[6]

                    index_counter += 1
                    self.page_id += 1
                    content_end += length

                    if not status == 'ok':
                        continue

                    try:
                        page = content[content_start:content_end]
                        c_page = page
                        tokenized = parser.parser(url,page,c_page,length+1,length+1)[1]

                        self.doc_id_url_file.write(str(self.page_id) + ": " + str(url) + "\n")

                        self.interim_index = intermediate_posting(tokenized,self.page_id)
                    except TypeError as e:
                        pass

                interim_index_creator(self.interim_index,i)

                merge_interim(i)

                #Delete intermediate files

                os.system('rm output/index_'+str(i)+'.txt')

                 #Making the final file which will contain the final index
            os.system('mv output/index_X' + str(self.num_files-1) + '.txt INDEX.txt')
            self.doc_id_url_file.close()
            self.time_elapsed = time.time() - self.start_time
            print "Time Elapsed: " + str(self.time_elapsed)
            os.rmdir("output")
        except Exception as e:
            print "Exception: " + str(e)
Example #2
0
 def init_team(self):
   # parser & preprocessing
   self.params['stamp'] = self.params.get('stamp') or "%s_%s" % (self.params['alg'], self.timestamp)
   self.params['data_cache'] = "%s/data/cache/data_cache_size%.2f_split%i_x%.2fy%.2f.pkl" % (self.params['root'], self.params['size'], self.params['train_test_split_time'], self.params['x_step'], self.params['y_step'])
   self.pas = parser.parser(self.params)
   if not os.path.exists(self.params['data_cache']):
     df_train, df_valid, _ = self.pas.get_data()
     # self.pas.init_data_cache(pd.concat([df_train, df_valid]), self.params)
     self.pas.init_data_cache(df_train, self.params)
   # workers
   self.tra = trainer.trainer(self.params)
   self.eva = evaluator.evaluator(self.params)
   print("=====[Start] @ %s=====" % (datetime.now()))
   for k, v in self.params.items(): print("%s = %s" % (k,v))
   print("="*50)
Example #3
0
 def init_team(self):
     # parser & preprocessing
     self.params['stamp'] = self.params.get(
         'stamp') or "%s_%s" % (self.params['alg'], self.timestamp)
     self.params[
         'data_cache'] = "%s/data/cache/data_cache_size%.2f_split%i_x%.2fy%.2f.pkl" % (
             self.params['root'], self.params['size'],
             self.params['train_test_split_time'], self.params['x_step'],
             self.params['y_step'])
     self.pas = parser.parser(self.params)
     if not os.path.exists(self.params['data_cache']):
         df_train, df_valid, _ = self.pas.get_data()
         # self.pas.init_data_cache(pd.concat([df_train, df_valid]), self.params)
         self.pas.init_data_cache(df_train, self.params)
     # workers
     self.tra = trainer.trainer(self.params)
     self.eva = evaluator.evaluator(self.params)
     print("=====[Start] @ %s=====" % (datetime.now()))
     for k, v in self.params.items():
         print("%s = %s" % (k, v))
     print("=" * 50)
Example #4
0
 def getmail(self, content, target):
     return parser.parser(content, target).email()
def main():
    """
    None -> None
    This serves as the main program.
    """

    # Initialize classes. Argparser, statistics, information collector, graph and parser.
    arg_parser = argparser()
    stats_record = statistics()
    info_collector = collector()
    epi_graph = graph()
    file_parser = parser()

    # Get the options from the arguments passed in by the user.
    print("Gathering simulation parameters...")
    options = arg_parser.collect_and_return_args()
    options.R_0 = abs(float(options.R_0))
    options.life_time = abs(float(options.life_time))
    options.death_rate = abs(float(options.death_rate))
    options.infected_count = abs(int(options.infected_count))
    options.daily_travel_percentage = abs(
        float(options.daily_travel_percentage))
    travel_p = options.daily_travel_percentage
    if (travel_p >= .003):
        os.system('cls' if os.name == 'nt' else 'clear')
        raise Exception(
            "ERROR: Daily travel percentage must be less than .003.")
    # Get the total amount of initially infected people.
    initial_inf_count = abs(options.infected_count)
    file_parser.open_and_read_city_file(
        options.cities_file)  # Read the city file and save info into parser.
    file_parser.open_and_read_plane_file(
        options.planes_file)  # Read the plane file and save info into parser.
    # Get the total number of hours the program should simulate based on the number of days it should run.
    days_to_run = abs(int(round(float(options.sim_time))))

    if (options.life_time == 0):
        os.system('cls' if os.name == 'nt' else 'clear')
        raise Exception("ERROR: Life time must be greater than zero.")
    hours_to_run = (days_to_run * 24)

    cities = list(
    )  # Create a list to hold all city classes used in simulation.
    # Declare rate of reproduction, hour, and day variables for the main loop.
    hour = 1
    day = 1
    total_person_count = 0
    if (days_to_run < 2):
        os.system('cls' if os.name == 'nt' else 'clear')
        raise Exception(
            "ERROR: Epidemic simulation needs to run longer than 2 days.")
    # Create list of cities.
    for c in file_parser.cities_list:
        nc = city(c, file_parser.planes_list, travel_p, options)
        cities.append(nc)
        stats_record.add_city(nc)

    # Add cities as locations to visit and calculate distance between cities.
    for i in cities:
        for j in cities:
            i.add_cities(j)
        total_person_count += len(i.people)
    # Infect the correct amount of people.
    num_inf = 0
    while (num_inf < initial_inf_count):
        # Choose the city and person randomly to infect.
        city_to_inf = random.choice(cities)
        #choose a random person to infect in that city
        person_to_inf = random.choice(city_to_inf.people)
        #check to make sure that person is not already infected
        if (person_to_inf.infected == True):
            #if that person is already infected continue and find somebody who is not
            continue
        #once you found somebody infect them
        person_to_inf.infect()
        #add to the infected count and decrease the healthy count for that city
        city_to_inf.inf_count += 1
        city_to_inf.healthy_count -= 1
        num_inf += 1

    # Clear the system to display proper program information.
    os.system('cls' if os.name == 'nt' else 'clear')

    # indexes for totals, used in people totals
    dead_count_ind = 0
    infected_count_ind = 1
    immune_count_ind = 2
    healthy_count_ind = 3

    infected_travelers_per_day = 0

    try:
        while (stats_record.Re > 0.3):

            # Program has run for the total number of hours requested, exit.
            if (hours_to_run == hour):
                break

            # Increment hour after checking if the simulation reached the end.
            hour += 1

            # totals of people status
            people_totals = [0, 0, 0, 0]
            flight_total = 0
            healthy_each_day = 0
            # Call update methods for city objects and record data.
            for location in cities:
                stats_record.add_vessels(location.tick())
                # If end of day, add totals for each location.
                people_totals[dead_count_ind] += location.dead_count
                people_totals[infected_count_ind] += location.inf_count
                people_totals[immune_count_ind] += location.immune_count
                people_totals[healthy_count_ind] += location.healthy_count
                healthy_each_day += location.healthy_count
                flight_total += location.flights_counter
                if (hour % 24 == 0):
                    info_collector.track_healthy(location.healthy_count,
                                                 location.name)
                    infected_travelers_per_day += location.sent_infected_people
                    location.sent_infected_people = 0
                    location.flights_counter = 0

            stats_record.Re = float(people_totals[healthy_count_ind] /
                                    stats_record.totalPop) * options.R_0
            if not people_totals[infected_count_ind]:
                break

            # Collect daily contagion information for graphing purposes.

            if (hour % 24 == 0):
                info_collector.add_to_daysplot(day)
                info_collector.add_to_dplot(people_totals[dead_count_ind])
                info_collector.add_to_iplot(people_totals[infected_count_ind])
                info_collector.add_to_implot(people_totals[immune_count_ind])
                info_collector.add_flights(flight_total)
                info_collector.add_infected_travelers(
                    infected_travelers_per_day)
                infected_travelers_per_day = 0

                info_collector.total_healthy.append(healthy_each_day)
                day += 1

            # Call update method for vÆ’essel objects and update the active and inactive vessel lists.
            for vessel in stats_record.activevessels:
                if vessel.tick():
                    stats_record.activevessels.remove(
                        vessel)  #remove an active flight from actives list
                    stats_record.inactivevessels.append(
                        vessel)  #add flight to inactive flights list

            # Display the current contagion information
            stats_record.curr_contagion_info(hour, hours_to_run)

    except:
        print("\nWARNING: Keyboard interrupt. Printing statistics...")
        stats_record.print_stats(days_to_run, total_person_count)
        sys.stdout.write("\n")
        return

    #print overal simulation statistics
    stats_record.print_stats(days_to_run, total_person_count)
    sys.stdout.write("\n")
    #produce a time series graph of the contagion spreading over the period of time the simulation modeled.
    stats_record.print_time_series_table(info_collector.days_plot,
                                         info_collector.immune_plot,
                                         info_collector.infected_plot,
                                         info_collector.dead_plot)
    epi_graph.create_and_show_graphs(
        info_collector.days_plot, info_collector.immune_plot,
        info_collector.infected_plot, info_collector.dead_plot,
        info_collector.healthy_city_info, info_collector.flight_info,
        info_collector.infected_travelers_plot)
    sys.stdout.write("\n")

    return
Example #6
0
File: main.py Project: Shruubi/cml
import sys
import os
from lib.filehandler import FileHandler
from lib.parser import parser

#ensure that we have more than one command line argument
if(len(sys.argv) == 1):
	print("error, no file specified")
	sys.exit()

#continue on here
file = FileHandler(sys.argv[1], "r")
contents = file.fetchList()

#init our parser
parser = parser(contents)
parser.parse()

outputFilename = sys.argv[1][:sys.argv[1].find(".")+1]
outputFile = outputFilename + "c"
output = FileHandler(outputFile, "w+")
for line in parser.getGenerated():
    output.getFile().write("%s\n" % line)
output.cleanup()

os.system("gcc " + outputFile + " -o " + outputFilename + "o")
print("successfully converted and compiled")