コード例 #1
0
    def setUp(self, path, structure_file, input_file):
        """Build the fixtures shared by the structure-extraction tests.

        :param str path: Prefix prepended verbatim to both file names (no
            separator is inserted between the prefix and the name).
        :param str structure_file: Name of the JSON file that describes the
            XML structure.
        :param str input_file: Name of the XML file to test.

        """
        database.clean()
        self.path = path
        self.structure_file = path + structure_file
        self.input_file = path + input_file

        string_processor.project = Project()

        # The project under test owns a single document file: the XML input.
        project = Project()
        self.input_project = project
        project.document_files.append(DocumentFile(path=self.input_file))
        project.save()

        with open(self.structure_file) as structure_handle:
            self.json = json.load(structure_handle)

        self.xml = etree.parse(self.input_file)
        self.extractor = StructureExtractor(
            project, self.structure_file, string_processor)
コード例 #2
0
    def setUp(self, path, structure_file, input_file):
        """Prepare the common state used by the extractor tests.

        :param str path: Prefix joined by plain concatenation with both file
            names.
        :param str structure_file: The file with a JSON description of the
            XML structure.
        :param str input_file: The XML file to test.

        """
        database.clean()
        self.path = path
        self.structure_file = path + structure_file
        self.input_file = path + input_file

        string_processor.project = Project()

        # Separate Project instance that carries the XML input document.
        input_project = Project()
        self.input_project = input_project
        input_project.document_files.append(
            DocumentFile(path=self.input_file))
        input_project.save()

        with open(self.structure_file) as json_handle:
            self.json = json.load(json_handle)

        self.xml = etree.parse(self.input_file)
        self.extractor = StructureExtractor(
            input_project,
            self.structure_file,
            string_processor,
        )
コード例 #3
0
 def setUpClass(self, text=""):
     """Store the example text together with its tokenized and raw-parsed forms.

     :param str text: The example to tokenize and parse; defaults to an
         empty string.
     """
     database.clean()
     t.project = Project()

     self.example = text
     # Both results are computed from the same example text.
     self.result = t.tokenize(text)
     self.raw = t.parser.raw_parse(text)
コード例 #4
0
    def test_sanity(self):
        """Method should output the same result as running raw_parse directly
        when run on a normal sentence text.
        """
        database.clean()
        text = "The fox is brown."
        result = t.parse_with_error_handling(text)
        expected_result = t.parser.raw_parse(text)

        # assertEqual replaces the deprecated failUnless alias and shows both
        # values in the failure message instead of just "False is not true".
        self.assertEqual(result, expected_result)
コード例 #5
0
 def setUpClass(self, text=""):
     """Store the example text and its raw parse.

     :param str text: The example to parse; defaults to an empty string.
     """
     database.clean()
     t.project = Project()

     self.example = text
     # TODO: self.result used to be filled in by t.tokenize(), which no
     # longer exists (it was making a redundant parser call).
     self.raw = t.parser.raw_parse(text)
コード例 #6
0
 def setUpClass(self, text=""):
     """Keep the example text and the result of raw-parsing it.

     :param str text: The example to parse; defaults to an empty string.
     """
     database.clean()
     t.project = Project()

     example = text
     self.example = example
     # TODO: t.tokenize() was removed because it made a redundant parser
     # call, so self.result is no longer set here.
     self.raw = t.parser.raw_parse(example)
コード例 #7
0
    def test_sanity(self):
        """Method should output the same result as running raw_parse directly
        when run on a normal sentence text.
        """
        database.clean()
        text = "The fox is brown."
        result = t.parse_with_error_handling(text)
        expected_result = t.parser.raw_parse(text)

        # failUnless is a deprecated alias that newer unittest versions no
        # longer provide; assertEqual also reports both operands on failure.
        self.assertEqual(result, expected_result)
コード例 #8
0
    def setUp(self):
        """Obtain a SequenceProcessor built around an autospecced Project.

        Also prepares three ``Word`` objects (lemma equal to the surface
        form) and the sentence string made of the same three words.
        """
        database.clean()
        project_mock = mock.create_autospec(Project)
        self.project = project_mock
        self.seq_proc = SequenceProcessor(project_mock)

        self.words = [
            Word(lemma=token, word=token)
            for token in ("first", "second", "third")
        ]
        self.string = "first second third"
コード例 #9
0
ファイル: testmodels.py プロジェクト: xiaobaozi34/wordseer
    def setUpClass(cls):
        """Create one instance of each set model and commit them all."""
        database.clean()

        cls.set = Set()
        cls.sequenceset = SequenceSet()
        cls.sentenceset = SentenceSet()
        cls.documentset = DocumentSet()

        fixtures = [
            cls.set,
            cls.sequenceset,
            cls.sentenceset,
            cls.documentset,
        ]
        db.session.add_all(fixtures)
        db.session.commit()
コード例 #10
0
    def setUp(self):
        """Get the documentparser instance.

        ``SequenceProcessor`` is patched inside the documentparser module
        only while the ``DocumentParser`` is being constructed.
        """
        database.clean()
        project = Project()
        self.project = project
        project.save()

        string_processor_mock = MagicMock()
        self.mock_str_proc = string_processor_mock
        patch_target = "app.preprocessor.documentparser.SequenceProcessor"
        with patch(patch_target):
            self.docparser = documentparser.DocumentParser(
                string_processor_mock, project)
コード例 #11
0
    def setUpClass(cls):
        """Persist one ``Set`` and one of each set subtype for the tests."""
        database.clean()

        cls.set = Set()
        cls.sequenceset = SequenceSet()
        cls.sentenceset = SentenceSet()
        cls.documentset = DocumentSet()

        # Add every fixture to the session, then commit them together.
        all_sets = [cls.set, cls.sequenceset, cls.sentenceset, cls.documentset]
        db.session.add_all(all_sets)
        db.session.commit()
コード例 #12
0
ファイル: testuploader.py プロジェクト: xiaobaozi34/wordseer
    def setUp(self):
        """Clear the database and put a new user's id into the client session.
        """
        self.client = application.test_client()
        database.clean()

        user = user_datastore.create_user(
            email="*****@*****.**", password="******")
        self.user = user
        db.session.commit()

        # Store the user's id and the "_fresh" flag in the test client session.
        with self.client.session_transaction() as session_data:
            session_data["user_id"] = user.id
            session_data["_fresh"] = True
コード例 #13
0
    def setUp(self):
        """Get the documentparser instance.

        The parser is built with a ``MagicMock`` string processor while
        ``SequenceProcessor`` is patched in the documentparser module.
        """
        database.clean()
        saved_project = Project()
        self.project = saved_project
        saved_project.save()

        str_proc = MagicMock()
        self.mock_str_proc = str_proc
        with patch("app.preprocessor.documentparser.SequenceProcessor"):
            parser = documentparser.DocumentParser(str_proc, saved_project)
            self.docparser = parser
コード例 #14
0
    def setUp(self):
        """Clear the database, create a user and record it in the session.
        """
        self.client = application.test_client()
        database.clean()

        user = user_datastore.create_user(
            email="*****@*****.**",
            password="******",
        )
        self.user = user
        db.session.add(user)
        db.session.commit()

        with self.client.session_transaction() as session_data:
            # Add the user to the session again before reading its id.
            db.session.add(user)
            session_data["user_id"] = user.id
            session_data["_fresh"] = True
コード例 #15
0
ファイル: testutils.py プロジェクト: Wordseer/wordseer
    def setUpClass(cls):
        """Create four words, three sequences and two sequence sets.

        ``word1`` and ``word3`` share the lemma "bar".  The first sequence
        set holds the sequences built from word1+word2 and word4; the second
        holds the sequence built from word3.
        """
        database.clean()
        cls.word1 = Word(lemma="bar")
        cls.word2 = Word(lemma="baz")
        cls.word3 = Word(lemma="bar")
        cls.word4 = Word(lemma="qux")

        first_seq = Sequence(words=[cls.word1, cls.word2])
        second_seq = Sequence(words=[cls.word4])
        third_seq = Sequence(words=[cls.word3])
        cls.sequenceset1 = SequenceSet(sequences=[first_seq, second_seq])
        cls.sequenceset2 = SequenceSet(sequences=[third_seq])

        to_persist = [
            first_seq, second_seq, third_seq,
            cls.sequenceset1, cls.sequenceset2,
            cls.word1, cls.word2, cls.word3, cls.word4,
        ]
        db.session.add_all(to_persist)
        db.session.commit()
コード例 #16
0
ファイル: testuploader.py プロジェクト: Wordseer/wordseer
 def setUp(self):
     """Create two users, each admin of one project; user1 is in the session.
     """
     database.clean()
     self.client = application.test_client()

     first_user = self.user1 = user_datastore.create_user(
         email="*****@*****.**", password="******")
     second_user = self.user2 = user_datastore.create_user(
         email="*****@*****.**", password="******")
     db.session.commit()

     with self.client.session_transaction() as session_data:
         session_data["user_id"] = first_user.get_id()
         session_data["_fresh"] = True

     first_project = self.project1 = Project(name="Foos project")
     second_project = self.project2 = Project(name="Bars project")

     # Each user is attached to a different project with the admin role.
     first_user.add_project(first_project, ProjectsUsers.ROLE_ADMIN)
     second_user.add_project(second_project, ProjectsUsers.ROLE_ADMIN)
     first_project.save()
     second_project.save()
コード例 #17
0
 def setUp(self):
     """Set up two users with one admin-owned project each.

     The id of ``user1`` is stored in the test client's session.
     """
     database.clean()
     self.client = application.test_client()

     owner_one = self.user1 = user_datastore.create_user(
         email="*****@*****.**",
         password="******",
     )
     owner_two = self.user2 = user_datastore.create_user(
         email="*****@*****.**",
         password="******",
     )
     db.session.commit()

     with self.client.session_transaction() as session_data:
         session_data["user_id"] = owner_one.get_id()
         session_data["_fresh"] = True

     foos = self.project1 = Project(name="Foos project")
     bars = self.project2 = Project(name="Bars project")
     owner_one.add_project(foos, ProjectsUsers.ROLE_ADMIN)
     owner_two.add_project(bars, ProjectsUsers.ROLE_ADMIN)
     foos.save()
     bars.save()
コード例 #18
0
    def setUpClass(cls):
        """Reset the DB and create a dummy project and document.

        A user and a project named "Bars project" are persisted, then a
        temporary file containing ``foobar`` is created and registered as a
        ``DocumentFile`` of that project.  The descriptor, open file object,
        path and base name are kept on the class as ``file_handle``,
        ``file``, ``file_path`` and ``file_name``.
        """
        database.clean()
        cls.client = application.test_client()
        user = User()
        db.session.add(user)
        db.session.commit()
        project = Project(name="Bars project", users=[user])
        project.save()

        cls.file_handle, cls.file_path = tempfile.mkstemp()
        cls.file = os.fdopen(cls.file_handle, "r+")
        cls.file.write("foobar")
        # The handle stays open on the class, so flush the buffered text to
        # disk now; otherwise code that opens cls.file_path may see an empty
        # file.
        cls.file.flush()
        cls.file_name = os.path.split(cls.file_path)[1]

        document_file = DocumentFile(projects=[project], path=cls.file_path)
        document_file.save()
コード例 #19
0
ファイル: testuploader.py プロジェクト: xiaobaozi34/wordseer
    def setUp(self):
        """Reset the DB and create a dummy project and document.

        A user and a project named "Bars project" are persisted, then a
        temporary file containing ``foobar`` is created and registered as a
        ``DocumentFile`` of that project.  The descriptor, open file object,
        path and base name are kept on the instance as ``file_handle``,
        ``file``, ``file_path`` and ``file_name``.
        """
        database.clean()
        self.client = application.test_client()
        user = User()
        db.session.add(user)
        db.session.commit()
        project = Project(name="Bars project", user=user)
        project.save()

        self.file_handle, self.file_path = tempfile.mkstemp()
        self.file = os.fdopen(self.file_handle, "r+")
        self.file.write("foobar")
        # The handle stays open on the instance, so flush the buffered text
        # to disk now; otherwise code that opens self.file_path may see an
        # empty file.
        self.file.flush()
        self.file_name = os.path.split(self.file_path)[1]

        document_file = DocumentFile(projects=[project], path=self.file_path)
        document_file.save()
コード例 #20
0
    def setUpClass(cls):
        """Persist the word, sequence and sequence-set fixtures.

        Four words are created (two of them with the lemma "bar"), grouped
        into three sequences, which in turn are split over two sequence sets.
        """
        database.clean()
        cls.word1 = Word(lemma="bar")
        cls.word2 = Word(lemma="baz")
        cls.word3 = Word(lemma="bar")
        cls.word4 = Word(lemma="qux")

        seq_bar_baz = Sequence(words=[cls.word1, cls.word2])
        seq_qux = Sequence(words=[cls.word4])
        seq_bar = Sequence(words=[cls.word3])
        cls.sequenceset1 = SequenceSet(sequences=[seq_bar_baz, seq_qux])
        cls.sequenceset2 = SequenceSet(sequences=[seq_bar])

        fixtures = [seq_bar_baz, seq_qux, seq_bar]
        fixtures += [cls.sequenceset1, cls.sequenceset2]
        fixtures += [cls.word1, cls.word2, cls.word3, cls.word4]
        db.session.add_all(fixtures)
        db.session.commit()
コード例 #21
0
    def setUp(self):
        """Replace two ``colproc`` functions with autospecced mocks and build
        the default log dict and argument list.
        """
        database.clean()

        # Swap each function on the colproc module for an autospec of itself.
        for func_name in ("parse_documents", "extract_record_metadata"):
            autospecced = mock.create_autospec(getattr(colproc, func_name))
            setattr(colproc, func_name, autospecced)

        # The dict stands in for the "logging database"; every stage is
        # marked "true".
        stage_keys = (
            "finished_recording_text_and_metadata",
            "finished_grammatical_processing",
            "finished_sequence_processing",
            "word_counts_done",
            "tfidf_done",
            "word_similarity_calculations_done",
        )
        self.log_dict = dict.fromkeys(stage_keys, "true")

        # Arguments for calling process()
        self.args = ["", "", "", False]
コード例 #22
0
    def setUp(self):
        """Parse the brief example and build a StructureExtractor for it."""
        database.clean()
        self.path = "tests/data/plays/"
        self.structure_file = self.path + "structure.json"
        self.input_file = self.path + "brief_example.xml"

        # One Project is shared by the test instance and by ``t``.
        project = Project()
        self.input_project = project
        t.project = project

        project.document_files.append(DocumentFile(path=self.input_file))
        project.save()

        with open(self.structure_file) as structure_handle:
            self.json = json.load(structure_handle)

        self.xml = etree.parse(self.input_file)
        self.extractor = StructureExtractor(
            project, self.structure_file, t)
コード例 #23
0
    def setUp(self):
        """Parse the brief example.

        Loads the JSON structure description and the XML input from
        ``tests/data/plays/`` and creates the extractor under test.
        """
        database.clean()
        self.path = "tests/data/plays/"
        self.structure_file = self.path + "structure.json"
        self.input_file = self.path + "brief_example.xml"

        input_project = Project()
        self.input_project = input_project
        t.project = input_project

        input_project.document_files.append(
            DocumentFile(path=self.input_file))
        input_project.save()

        with open(self.structure_file) as json_handle:
            self.json = json.load(json_handle)

        self.xml = etree.parse(self.input_file)
        self.extractor = StructureExtractor(
            input_project,
            self.structure_file,
            t,
        )
コード例 #24
0
    def setUp(self):
        """Mock ``colproc.parse_documents`` and
        ``colproc.extract_record_metadata`` and prepare the log dict and
        argument list.
        """
        database.clean()

        parse_documents_mock = mock.create_autospec(colproc.parse_documents)
        colproc.parse_documents = parse_documents_mock
        metadata_mock = mock.create_autospec(colproc.extract_record_metadata)
        colproc.extract_record_metadata = metadata_mock

        # Set up the dict that is our "logging database": all stages are
        # recorded as "true".
        log_dict = {}
        log_dict["finished_recording_text_and_metadata"] = "true"
        log_dict["finished_grammatical_processing"] = "true"
        log_dict["finished_sequence_processing"] = "true"
        log_dict["word_counts_done"] = "true"
        log_dict["tfidf_done"] = "true"
        log_dict["word_similarity_calculations_done"] = "true"
        self.log_dict = log_dict

        # Arguments for calling process()
        self.args = ["", "", "", False]
コード例 #25
0
    def setUp(self):
        """Create two users, a project for user2 and a document file in it.

        ``user1`` is the user whose id is stored in the test client's
        session; the project "Bars project" is attached to ``user2`` with the
        admin role.  A temporary file containing ``foobar`` is registered as
        a ``DocumentFile`` of that project; its path is kept in
        ``self.file_path``.
        """
        database.clean()
        self.client = application.test_client()
        self.user1 = user_datastore.create_user(email="*****@*****.**",
                                                password="******")
        self.user2 = user_datastore.create_user(email="*****@*****.**",
                                                password="******")
        db.session.commit()
        with self.client.session_transaction() as sess:
            sess["user_id"] = self.user1.get_id()
            sess["_fresh"] = True

        self.project = Project(name="Bars project")
        self.user2.add_project(self.project, role=ProjectsUsers.ROLE_ADMIN)

        file_descriptor, file_path = tempfile.mkstemp()
        # Close the handle as soon as the content is written so the data is
        # on disk before the path is registered and no descriptor leaks.
        with os.fdopen(file_descriptor, "r+") as temp_file:
            temp_file.write("foobar")

        self.file_path = file_path
        self.document_file = DocumentFile(projects=[self.project],
                                          path=self.file_path)
        self.document_file.save()
コード例 #26
0
ファイル: testuploader.py プロジェクト: xiaobaozi34/wordseer
    def setUp(self):
        """Create two users, a project owned by user2 and a document file.

        ``user1`` is the user whose id is stored in the test client's
        session; the project "Bars project" is created with ``user2`` as its
        user.  A temporary file containing ``foobar`` is registered as a
        ``DocumentFile`` of that project; its path is kept in
        ``self.file_path``.
        """
        database.clean()
        self.client = application.test_client()
        self.user1 = user_datastore.create_user(email="*****@*****.**",
            password="******")
        self.user2 = user_datastore.create_user(email="*****@*****.**",
            password="******")
        db.session.commit()
        with self.client.session_transaction() as sess:
            sess["user_id"] = self.user1.get_id()
            sess["_fresh"] = True

        self.project = Project(name="Bars project", user=self.user2)
        self.project.save()

        file_descriptor, file_path = tempfile.mkstemp()
        # Close the handle as soon as the content is written so the data is
        # on disk before the path is registered and no descriptor leaks.
        with os.fdopen(file_descriptor, "r+") as temp_file:
            temp_file.write("foobar")

        self.file_path = file_path
        self.document_file = DocumentFile(projects=[self.project],
                path=self.file_path)
        self.document_file.save()
コード例 #27
0
    t.start()

if __name__ == '__main__':
    # Command-line entry point.  The first argument selects the action:
    # 'createdb', 'wenxue', 'singtao', 'list' or 'clean <arg>'; any other
    # value is passed to fetch().  With no argument the usage text is shown.

    # Import Psyco if available
    try:
        import psyco

        psyco.full()
    except ImportError:
        pass

    if len(sys.argv) == 1:
        usage()
    else:
        command = sys.argv[1]
        if command == 'createdb':
            database.create()
        elif command == 'wenxue':
            wenxue()
        elif command == 'singtao':
            singtao()
        elif command == 'list':
            database.list_news()
        elif command == 'clean':
            if len(sys.argv) > 2:
                database.clean(sys.argv[2])
            else:
                # 'clean' needs one more argument; show the usage text
                # instead of failing with an IndexError on sys.argv[2].
                usage()
        else:
            fetch(command, debug=False)

    # wait all threads done
    q.join()
コード例 #28
0
import eupol
import eurojust
import f4e
import satcen
import ema
import cpvo
import esma
import bbi
import eba
import cdt
import eacea
import etf
import efsa
import eiopa

# Clean the database at import time, before any scraper thread is created.
database.clean()

# Log at INFO level and include the thread name in every record.
logging.basicConfig(
    level=logging.INFO,
    format='[%(levelname)s] (%(threadName)-10s) %(message)s',
)

# One Thread object per scraper function.  The threads are only constructed
# here; nothing in this part of the file starts them.
epsoThread = threading.Thread(target=epso.scrapEPSO)

eupolThread = threading.Thread(target=eupol.scrapEUROPOL)

eujustThread = threading.Thread(target=eurojust.scrapEurojust)

emsaThread = threading.Thread(target=emsa.scrapEMSA)

f4eThread = threading.Thread(target=f4e.scrapF4E)
コード例 #29
0
 def setUp(self):
     """Mock out the parser for testing.
     """
     # NOTE(review): the visible body only cleans the database; no parser
     # mocking happens here. Confirm whether the docstring is stale.
     database.clean()
コード例 #30
0
 def setUp(self):
     """Obtain a SequenceProcessor bound to a newly created ``Project``.
     """
     database.clean()
     project = Project()
     self.project = project
     self.seq_proc = SequenceProcessor(project)
コード例 #31
0
 def setUp(self):
     """Call ``database.clean()`` as the only setup step."""
     database.clean()
コード例 #32
0
 def setUp(self):
     """Clean the database.

     This is the only setup step; it delegates to ``database.clean()``.
     """
     database.clean()
コード例 #33
0
ファイル: JobScrapper.py プロジェクト: agitheo/EUJobs
import eupol
import eurojust
import f4e
import satcen
import ema
import cpvo
import esma
import bbi
import eba
import cdt
import eacea
import etf
import efsa
import eiopa

# Clean the database at import time, before any scraper thread is created.
database.clean()

# Log at INFO level and include the thread name in every record.
logging.basicConfig(
    level=logging.INFO,
    format='[%(levelname)s] (%(threadName)-10s) %(message)s',
)

# One Thread object per scraper function; they are constructed but not
# started in this part of the file.
epsoThread = threading.Thread(target=epso.scrapEPSO)
eupolThread = threading.Thread(target=eupol.scrapEUROPOL)
eujustThread = threading.Thread(target=eurojust.scrapEurojust)
emsaThread = threading.Thread(target=emsa.scrapEMSA)
f4eThread = threading.Thread(target=f4e.scrapF4E)
コード例 #34
0
ファイル: testmodels.py プロジェクト: xiaobaozi34/wordseer
 def setUp(self):
     """Clean the current database.

     The only setup step is a call to ``database.clean()``.
     """
     database.clean()
コード例 #35
0
ファイル: testmodels.py プロジェクト: xiaobaozi34/wordseer
 def setUp(self):
     """Clean the current database.

     Also installs a newly constructed ``Project`` as
     ``Project.active_project``.
     """
     database.clean()
     # Assigned on the Project class itself, so the value is shared by all
     # code that reads Project.active_project, not only this test instance.
     Project.active_project = Project()
コード例 #36
0
ファイル: testlogger.py プロジェクト: Wordseer/wordseer
 def setUp(self):
     """Clean the database.

     Delegates to ``database.clean()``; no other state is prepared here.
     """
     database.clean()
コード例 #37
0
 def setUp(self):
     """Clean the current database.

     Delegates to ``database.clean()``; nothing else is set up here.
     """
     database.clean()
コード例 #38
0
 def setUp(self):
     """Clean the database by calling ``database.clean()``."""
     database.clean()
コード例 #39
0
 def setUp(self):
     """Mock out the parser for testing.
     """
     # NOTE(review): only the database is cleaned in the visible body; the
     # mocking the docstring mentions is not done here. Confirm whether the
     # docstring is out of date.
     database.clean()
コード例 #40
0
 def setUp(self):
     """Clean the current database.

     Afterwards a new ``Project`` instance is stored in
     ``Project.active_project``.
     """
     database.clean()
     # Class attribute assignment: affects every reader of
     # Project.active_project, not just this instance.
     Project.active_project = Project()