def testMinimalExample(self):
     """Extract minimalExample.tex with an empty option list; expect "".

     The fixture path is relative ('..'/testFiles), so it is resolved
     against the current working directory when the test runs.
     """
     tex_path = os.path.abspath(
         os.path.join('..', 'testFiles', 'minimalExample.tex'))
     parsed = sortArgs([])
     # compileRegex is fed the sortArgs results in the order 0, 1, 3, 4, 2.
     rep_re, ext_re, punc_re, del_re = compileRegex(
         parsed[0], parsed[1], parsed[3], parsed[4], parsed[2])
     extracted = extractText(tex_path, rep_re, ext_re, punc_re, del_re)
     self.assertEqual(extracted, "")
 def testSampleOneReplaceClass(self):
     """Extract example1.tex with --replace-class hword Header.

     The expected text shows "Header" in place of each heading word.
     The fixture path is relative ('..'/testFiles), so it is resolved
     against the current working directory when the test runs.
     """
     tex_path = os.path.abspath(
         os.path.join('..', 'testFiles', 'example1.tex'))
     parsed = sortArgs(["--replace-class", "hword", "Header"])
     # compileRegex is fed the sortArgs results in the order 0, 1, 3, 4, 2.
     rep_re, ext_re, punc_re, del_re = compileRegex(
         parsed[0], parsed[1], parsed[3], parsed[4], parsed[2])
     extracted = extractText(tex_path, rep_re, ext_re, punc_re, del_re)
     expected = (
         "Header Header Header This is a sample document to test expected extraction."
         " Header Header Header This is section one. Header Header This is section two."
     )
     self.assertEqual(extracted, expected)
 def testSampleOneIgnoreDefault(self):
     """Extract example1.tex with default extraction ignored and only
     the "word" class extracted.

     The expected text contains the body sentences without any headings.
     The fixture path is relative ('..'/testFiles), so it is resolved
     against the current working directory when the test runs.
     """
     tex_path = os.path.abspath(
         os.path.join('..', 'testFiles', 'example1.tex'))
     parsed = sortArgs(["--ignore-default-extraction", "--extract-class", "word"])
     # compileRegex is fed the sortArgs results in the order 0, 1, 3, 4, 2.
     rep_re, ext_re, punc_re, del_re = compileRegex(
         parsed[0], parsed[1], parsed[3], parsed[4], parsed[2])
     extracted = extractText(tex_path, rep_re, ext_re, punc_re, del_re)
     expected = (
         "This is a sample document to test expected extraction."
         " This is section one. This is section two."
     )
     self.assertEqual(extracted, expected)
 def testSampleOneNoPunc(self):
     """Extract example1.tex with --no-punctuation.

     The expected text is the document's words with no sentence-ending
     periods.
     The fixture path is relative ('..'/testFiles), so it is resolved
     against the current working directory when the test runs.
     """
     tex_path = os.path.abspath(
         os.path.join('..', 'testFiles', 'example1.tex'))
     parsed = sortArgs(["--no-punctuation"])
     # compileRegex is fed the sortArgs results in the order 0, 1, 3, 4, 2.
     rep_re, ext_re, punc_re, del_re = compileRegex(
         parsed[0], parsed[1], parsed[3], parsed[4], parsed[2])
     extracted = extractText(tex_path, rep_re, ext_re, punc_re, del_re)
     expected = (
         "Sample Article One This is a sample document to test expected extraction"
         " Section One Title This is section one Section Two This is section two"
     )
     self.assertEqual(extracted, expected)
 def testSample2ReplaceInlineMath(self):
     """Extract example2.tex with --replace-inline-math inline_math.

     The expected text carries the token "inline_math" inside the
     inline-equation sentence.
     The fixture path is relative ('..'/testFiles), so it is resolved
     against the current working directory when the test runs.
     """
     tex_path = os.path.abspath(
         os.path.join('..', 'testFiles', 'example2.tex'))
     parsed = sortArgs(["--replace-inline-math", "inline_math"])
     # compileRegex is fed the sortArgs results in the order 0, 1, 3, 4, 2.
     rep_re, ext_re, punc_re, del_re = compileRegex(
         parsed[0], parsed[1], parsed[3], parsed[4], parsed[2])
     extracted = extractText(tex_path, rep_re, ext_re, punc_re, del_re)
     expected = (
         "Sample Article Two This is a sample document to test expected extraction."
         " Section One Title This is section one. This is an inline equation inline_math with text surrounding it."
         " This is a normal equation This is a figure"
     )
     self.assertEqual(extracted, expected)
 def testSample2PuncFile(self):
     """Extract example2.tex using samplePuncFile.txt as --punctuation-file.

     The expected text ends with a colon after "This is a figure".
     Both fixture paths are relative ('..'/testFiles), so they are resolved
     against the current working directory when the test runs.
     """
     tex_path = os.path.abspath(
         os.path.join('..', 'testFiles', 'example2.tex'))
     punc_path = os.path.abspath(
         os.path.join('..', 'testFiles', 'samplePuncFile.txt'))
     parsed = sortArgs(["--punctuation-file", punc_path])
     # compileRegex is fed the sortArgs results in the order 0, 1, 3, 4, 2.
     rep_re, ext_re, punc_re, del_re = compileRegex(
         parsed[0], parsed[1], parsed[3], parsed[4], parsed[2])
     extracted = extractText(tex_path, rep_re, ext_re, punc_re, del_re)
     expected = (
         "Sample Article Two This is a sample document to test expected extraction."
         " Section One Title This is section one. This is an inline equation with text surrounding it."
         " This is a normal equation This is a figure:"
     )
     self.assertEqual(extracted, expected)