def my_mapper_simulation(input_directory, output_directory, my_mapper_input_parameters):
    """Apply my_mapper.my_map to every entry of input_directory, one output file per entry.

    The results go to the folder "1. my_map_simulation" inside
    output_directory. That folder is removed first if it already exists, so
    every call starts from an empty folder. An input entry called <name>
    produces an output file called "map_<name>".

    Args:
        input_directory: Path of the folder to process. Every entry returned
            by os.listdir is opened for reading as UTF-8 text.
        output_directory: Path of the folder in which the
            "1. my_map_simulation" folder is (re)created.
        my_mapper_input_parameters: Forwarded unchanged as the third argument
            of my_mapper.my_map.
    """
    # 1. We create the map_simulation folder
    # os.path.join yields the same path as plain concatenation when the
    # directory ends with a separator, and a correct one when it does not.
    simulation_directory = os.path.join(output_directory, "1. my_map_simulation")

    # 1.1. If it already existed, then we remove it
    if os.path.exists(simulation_directory):
        shutil.rmtree(simulation_directory)

    # 1.2. We create it again
    os.makedirs(simulation_directory)

    # 2. We collect the list of files we have to process
    file_names = os.listdir(input_directory)

    # 3. We process each file sequentially
    for file_name in file_names:
        input_path = os.path.join(input_directory, file_name)
        output_path = os.path.join(simulation_directory, "map_" + file_name)

        # 3.1. We open the file to be read
        # 3.2. We open the file we want to write to
        # The with-blocks close both streams (3.4) even if my_map raises.
        with codecs.open(input_path, "r", encoding='utf-8') as my_input_stream:
            with codecs.open(output_path, "w", encoding='utf-8') as my_output_stream:
                # 3.3. We process it
                my_mapper.my_map(my_input_stream, my_output_stream, my_mapper_input_parameters)
def my_mapper_simulation(input_directory, output_directory, my_mapper_input_parameters):
    """Apply my_mapper.my_map to every entry of input_directory into a single results file.

    All the output is written to the file "my_mapper_results.txt" inside
    output_directory, which is created (or truncated) before the inputs are
    listed.

    NOTE: because the results file is created before os.listdir runs, using
    the same folder as input_directory and output_directory makes the results
    file one of the inputs.

    Args:
        input_directory: Path of the folder to process. Every entry returned
            by os.listdir is opened for reading as UTF-8 text.
        output_directory: Path of the folder where "my_mapper_results.txt" is
            written.
        my_mapper_input_parameters: Forwarded unchanged as the third argument
            of my_mapper.my_map.
    """
    # 1. We create the results file
    # os.path.join yields the same path as plain concatenation when the
    # directory ends with a separator, and a correct one when it does not.
    results_path = os.path.join(output_directory, "my_mapper_results.txt")

    # The with-block closes the results file (step 4) even if a step fails.
    with codecs.open(results_path, "w", encoding='utf-8') as my_output_stream:
        # 2. We collect the list of files we have to process
        file_names = os.listdir(input_directory)

        # 3. We process each file sequentially
        for file_name in file_names:
            input_path = os.path.join(input_directory, file_name)

            # 3.1. We open the file to be read (closed on leaving the block)
            with codecs.open(input_path, "r", encoding='utf-8') as my_input_stream:
                # 3.2. We process it
                my_mapper.my_map(my_input_stream, my_output_stream, my_mapper_input_parameters)
def simulating_my_map(directory, extension, output_stream, languages, num_top_entries):
    """Apply my_mapper.my_map to every file selected from directory.

    The files are chosen by
    select_files_from_directory_with_concrete_extension(directory, extension);
    each returned item is used as a path and opened for reading as UTF-8 text.
    output_stream is left open: closing it is the caller's job.

    Args:
        directory: Forwarded to the file-selection helper.
        extension: Forwarded to the file-selection helper.
        output_stream: Passed as the last argument of my_mapper.my_map for
            every file.
        languages: Forwarded unchanged as the second argument of
            my_mapper.my_map.
        num_top_entries: Forwarded unchanged as the third argument of
            my_mapper.my_map.
    """
    # 1. We get the files to be processed
    input_files = select_files_from_directory_with_concrete_extension(directory, extension)

    # 2. We process them
    for input_file in input_files:
        # 2.1. We open the file to be read
        # The with-block closes it (2.3) even if my_map raises.
        with codecs.open(input_file, "r", encoding='utf-8') as input_stream:
            # 2.2. We process it
            my_mapper.my_map(input_stream, languages, num_top_entries, output_stream)
def simulating_my_map(directory, extension, output_stream):
    """Apply my_mapper.my_map to every file selected from directory, then close output_stream.

    The files are chosen by
    select_files_from_directory_with_concrete_extension(directory, extension);
    each returned item is used as a path and opened in text mode with the
    platform default encoding.

    This function closes output_stream itself, so the caller must not write
    to it afterwards. It is closed even when processing fails, so that data
    already written is flushed and the handle is not leaked.

    Args:
        directory: Forwarded to the file-selection helper.
        extension: Forwarded to the file-selection helper.
        output_stream: Passed as the second argument of my_mapper.my_map for
            every file; closed before returning.
    """
    try:
        # 1. We get the files to be processed
        input_files = select_files_from_directory_with_concrete_extension(
            directory, extension)

        # 2. We process them
        for input_file in input_files:
            # 2.1. We open the file to be read
            # The with-block closes it (2.3) even if my_map raises.
            with open(input_file, "r") as input_stream:
                # 2.2. We process it
                my_mapper.my_map(input_stream, output_stream)
    finally:
        # 3. We close the output stream
        output_stream.close()