def wordlist_dir_dialog(self):
    """
    Pop up the "open a file" dialog and ask which wordlist file to use.

    The dialog result is stored in ``self.corpus_filename``. If it is not
    a string (presumably the user cancelled the dialog -- confirm against
    ``_get_filename_from_dialog``), the method returns right away.
    Otherwise the wordlist is read into ``self.lexicon``, the lexicon tree
    is initialized, the main window is reloaded with blank widgets, and
    the selected path is shown in the status bar.
    """
    self.corpus_filename = self._get_filename_from_dialog(ftype='wordlist')
    process_all_gui_events()

    # Anything other than a string means there is no usable file path.
    if not isinstance(self.corpus_filename, str):
        return

    # note that self.corpus_filename is an absolute full path
    self.corpus_name = os.path.basename(self.corpus_filename)
    self.corpus_stem_name = Path(self.corpus_name).stem

    self.lexicon = read_wordlist(self.corpus_filename)
    self.initialize_lexicon_tree()
    self.load_main_window(major_display=QWidget(),
                          parameter_window=QWidget())
    process_all_gui_events()

    self.status.clearMessage()
    self.status.showMessage(
        'Wordlist selected: {}'.format(self.corpus_filename))
def test_read_wordlist():
    """read_wordlist() on the test wordlist path must yield a Lexicon."""
    lexicon = read_wordlist(wordlist_path)
    assert isinstance(lexicon, Lexicon)
def test_wordlist_from_wordlist_file():
    """wordlist() on a Lexicon read from a wordlist file returns a list."""
    lxa_object = lxa.read_wordlist(wordlist_path)
    # TODO: not actually testing contents...
    assert isinstance(lxa_object.wordlist(), list)
def main():
    """
    Run the Linguistica command-line workflow from start to finish.

    Steps, in order: decide whether the input is a wordlist or a corpus
    text, obtain the input file path, settle on an output directory
    (created if missing), obtain the encoding, build the Linguistica
    object, optionally change its parameters, run all modules, and write
    all results to the output directory.

    The ``determine_*`` / ``get_*`` helpers are defined elsewhere;
    presumably they prompt the user on the console -- confirm there.
    """
    print(
        '\n================================================================\n'
        'Welcome to Linguistica {}!\n'
        '================================================================'.
        format(lxa_version))

    # --------------------------------------------------------------------------
    # determine if file is a wordlist or a corpus text

    use_wordlist = determine_use_wordlist()

    print('--------------------------------------------')

    # --------------------------------------------------------------------------
    # get file path

    file_abspath = get_file_abspath()

    print('\nFull file path:\n{}'.format(file_abspath))
    print('--------------------------------------------')

    # --------------------------------------------------------------------------
    # determine output directory

    # The default lives next to the input file; get_output_dir may replace it.
    output_dir = os.path.join(os.path.dirname(file_abspath), 'lxa_outputs')
    print('\nDefault output directory:\n{}'.format(output_dir))
    output_dir = get_output_dir(output_dir)

    # makedirs rather than mkdir: the chosen directory may have parents that
    # do not exist yet, and exist_ok makes an already-present directory a
    # no-op without a separate (race-prone) isdir check.
    os.makedirs(output_dir, exist_ok=True)

    print('--------------------------------------------')

    # --------------------------------------------------------------------------
    # change encoding, if instructed

    encoding = get_encoding()

    print('--------------------------------------------')

    # --------------------------------------------------------------------------
    # create the Linguistica object

    if use_wordlist:
        lxa_object = lxa.read_wordlist(file_abspath, encoding=encoding)
    else:
        lxa_object = lxa.read_corpus(file_abspath, encoding=encoding)

    # --------------------------------------------------------------------------
    # change parameters, if instructed

    print('\nParameters:\n{}'.format(pformat(lxa_object.parameters())))

    new_parameter_value_pairs = get_new_parameters()

    if new_parameter_value_pairs:
        lxa_object.change_parameters(**dict(new_parameter_value_pairs))

        print('\nParameters after the changes:\n{}'.format(
            pformat(lxa_object.parameters())))

    print('--------------------------------------------')

    # --------------------------------------------------------------------------
    # run all Linguistica modules on the given file

    print('\nRunning all Linguistica modules on the given file:')

    lxa_object.run_all_modules(verbose=True)

    print('--------------------------------------------')

    # --------------------------------------------------------------------------
    # output results as files

    print('\nGenerating output files...\n')

    lxa_object.output_all_results(directory=output_dir, verbose=True)

    print('\nResults are in ' + output_dir)
def main():
    """
    Drive the Linguistica command-line session.

    The function prints a welcome banner, then: determines whether the
    input file is a wordlist or a corpus text, gets its path, picks and
    creates the output directory, gets the encoding, constructs the
    Linguistica object with the matching reader, applies any parameter
    changes, runs every module, and outputs all results as files.

    Helper functions called here (``determine_use_wordlist``,
    ``get_file_abspath``, ``get_output_dir``, ``get_encoding``,
    ``get_new_parameters``) are not defined in this block; they
    presumably interact with the user -- verify in their definitions.
    """
    print('\n================================================================\n'
          'Welcome to Linguistica {}!\n'
          '================================================================'
          .format(lxa_version))

    # --------------------------------------------------------------------------
    # determine if file is a wordlist or a corpus text

    use_wordlist = determine_use_wordlist()

    print('--------------------------------------------')

    # --------------------------------------------------------------------------
    # get file path

    file_abspath = get_file_abspath()

    print('\nFull file path:\n{}'.format(file_abspath))
    print('--------------------------------------------')

    # --------------------------------------------------------------------------
    # determine output directory

    # Start from "lxa_outputs" beside the input file; get_output_dir returns
    # the directory that is actually used.
    output_dir = os.path.join(os.path.dirname(file_abspath), 'lxa_outputs')
    print('\nDefault output directory:\n{}'.format(output_dir))
    output_dir = get_output_dir(output_dir)

    # Create the directory together with any missing parents. exist_ok=True
    # replaces the former isdir-then-mkdir sequence, which could not create
    # nested paths and left a gap between the check and the creation.
    os.makedirs(output_dir, exist_ok=True)

    print('--------------------------------------------')

    # --------------------------------------------------------------------------
    # change encoding, if instructed

    encoding = get_encoding()

    print('--------------------------------------------')

    # --------------------------------------------------------------------------
    # create the Linguistica object

    if use_wordlist:
        lxa_object = lxa.read_wordlist(file_abspath, encoding=encoding)
    else:
        lxa_object = lxa.read_corpus(file_abspath, encoding=encoding)

    # --------------------------------------------------------------------------
    # change parameters, if instructed

    print('\nParameters:\n{}'.format(pformat(lxa_object.parameters())))

    new_parameter_value_pairs = get_new_parameters()

    if new_parameter_value_pairs:
        lxa_object.change_parameters(**dict(new_parameter_value_pairs))

        print('\nParameters after the changes:\n{}'
              .format(pformat(lxa_object.parameters())))

    print('--------------------------------------------')

    # --------------------------------------------------------------------------
    # run all Linguistica modules on the given file

    print('\nRunning all Linguistica modules on the given file:')

    lxa_object.run_all_modules(verbose=True)

    print('--------------------------------------------')

    # --------------------------------------------------------------------------
    # output results as files

    print('\nGenerating output files...\n')

    lxa_object.output_all_results(directory=output_dir, verbose=True)

    print('\nResults are in ' + output_dir)