Example #1
0
 def testSimple(self):
     """Check one known getCost value and two argument pairs that must raise.

     getCost(1283, 1298) is expected to equal -5447; the pairs (-1, 101)
     and (1, 100000001) are each expected to raise RuntimeError.
     """
     connector = Connector(getDataLoader())
     cost = connector.getCost(1283, 1298)
     self.assertEqual(-5447, cost)
     # Same two failing calls as before, in the same order.
     for left, right in ((-1, 101), (1, 100000001)):
         self.assertRaises(RuntimeError, connector.getCost, left, right)
Example #2
0
 def post(self, request, *args, **kwargs):
     """Process the posted text and reply with the extracted words as JSON.

     Reads 'text', 'word', 'reading', 'definition', 'sentence' and
     'unknownWordsOnly' from ``request.POST``. The text is passed to
     ``TextProcessor.do`` and each produced item is turned into a
     ``(word, reading, definition, sentence, isKnown)`` entry, where
     ``isKnown`` comes from ``self.getWordStatus(word)``. When
     'unknownWordsOnly' converts to a non-zero integer, entries whose
     ``isKnown`` is truthy are left out.

     Returns an ``HttpResponse`` with status 200 and the JSON-encoded
     list, or ``None`` when ``request.method`` is not 'POST'.
     """
     logging.info('Get a message!')
     if request.method != 'POST':
         return None

     form = request.POST
     userText = form['text']
     addWord = form['word']
     addReading = form['reading']
     addDefinition = form['definition']
     addSentence = form['sentence']
     unknownWordsOnly = form['unknownWordsOnly']

     logger = logging.getLogger('console')
     logger.info('POST settings: userTextLen:%s, word:%s, reading:%s, '
                 'definition:%s, sentence:%s, unknownWordsOnly:%s',
                 len(userText), addWord, addReading, addDefinition,
                 addSentence, unknownWordsOnly)
     # The raw value is logged above; the integer form drives the filter.
     unknownWordsOnly = int(unknownWordsOnly)

     result = []
     textProc = TextProcessor(getDataLoader())
     contents = textProc.do(userText, Settings.NoExcessiveReading(), True)
     # The start position is produced by the processor but not sent back.
     for word, _startPos, reading, definition, sentence in contents:
         isKnown = self.getWordStatus(word)
         if not unknownWordsOnly or not isKnown:
             result.append((word, reading, definition, sentence, isKnown))
     logger.info('# of words to return: %d', len(result))

     data = simplejson.dumps(result)
     # 'content_type' replaces the 'mimetype' keyword, which newer Django
     # releases no longer accept.
     return HttpResponse(data, content_type="application/json", status=200)
Example #3
0
 def testCharCategories(self):
     """Check the full category list and the categories of four sample characters."""
     prop = CharProperty(getDataLoader())

     allCategories = [
         'DEFAULT', 'SPACE', 'KANJI', 'SYMBOL',
         'NUMERIC', 'ALPHA', 'HIRAGANA', 'KATAKANA',
         'KANJINUMERIC', 'GREEK', 'CYRILLIC',
     ]
     self.assertEqual(allCategories, prop.getCategories())

     # (character, expected category list), checked in this order.
     samples = (
         (' ', ['SPACE']),
         ('1', ['NUMERIC']),
         ('a', ['ALPHA']),
         ('吗', ['KANJI']),
     )
     for char, expected in samples:
         self.assertEqual(expected, prop.getCharCaterogies(char))
Example #4
0
 def __init__(self):
   """Register the URL routes and, when possible, create the text processor.

   The WSGI application is initialised with debug enabled. Afterwards
   get_url() is called: if neither it nor the processor construction
   raises InvalidBackendError, 'Starting backend' is logged and
   self.textProc is set; otherwise 'Starting frontend' is logged and
   self.textProc is not assigned here.
   """
   routes = [
       ('/', MainPage),
       ('/mydeck', DeckPage),
       ('/about', AboutPage),
       ('/addcard', AddCardPage),
       ('/deletecard', DeleteCardPage),
       ('/export', ExportDeckPage),
       ('/backend', BackendPage),
   ]
   webapp2.WSGIApplication.__init__(self, routes, debug=True)
   try:
       get_url()
       logging.info('Starting backend')
       self.textProc = TextProcessor(getDataLoader())
   except InvalidBackendError:
       logging.info('Starting frontend')
Example #5
0
def dryBurn():
    """Print the modules found by pkgutil, then process a sample sentence.

    First prints the second field of every entry yielded by
    ``pkgutil.iter_modules()`` followed by '<br>'. Then sets up logging,
    runs a fixed Japanese sample through ``TextProcessor.do`` and prints
    one UTF-8 encoded line per (word, reading, definition, sentence) item.
    """
    from pkgutil import iter_modules

    # Iterate directly instead of calling .next() under a bare except:
    # generators have no .next() on Python 3, so the old loop hid the
    # AttributeError and printed nothing there.
    for module_info in iter_modules():
        print(module_info[1], '<br>')

    setupLogger()
    contents = '船が検疫所に着いたのは'
    textProc = TextProcessor(getDataLoader())
    for word, reading, definition, sentence in textProc.do(contents, Settings.NoExcessiveReading(), True):
        line = text_type('{0:<10}  {1:<10}  {2:<10}  {3}\n').format(word, reading, definition, sentence)
        line = line.strip('\n')
        print(line.encode('utf-8'))
Example #6
0
def main():
    """Command-line entry point: list the words found in an input file.

    Positional argument: the input file name. Optional arguments:
    ``-d`` deck file name, ``-t`` tag, ``-o`` output file name. When
    ``-o`` is given, ``sys.stdout`` is redirected to that file (UTF-8)
    for the duration of the run. The input is read, decoded from UTF-8
    on Python 2, and passed with the deck and tag arguments to
    ``getUniqueCSVList``.
    """
    parser = argparse.ArgumentParser(description='Get the list word in the text.')
    parser.add_argument('inputfile', metavar='input file name',
                        help='input file name')
    parser.add_argument('-d', metavar='deck file name', required=False,
                        help='deck file name')
    parser.add_argument('-t', metavar='tag', required=False,
                        help='optional tag appended to the list')
    parser.add_argument('-o', metavar='output file name', required=False,
                        help='output file name')
    args = parser.parse_args()

    original_stdout = sys.stdout
    output = open(args.o, 'w', encoding='utf-8') if args.o else None
    if output is not None:
        sys.stdout = output
    try:
        setupLogger()
        with openInputFile(args.inputfile) as infile:
            contents = infile.read()
            if isPy2():
                contents = unicode(contents, 'utf-8')
            textProc = TextProcessor(getDataLoader())
            getUniqueCSVList(textProc, contents, args.d, args.t)
    finally:
        # Restore stdout and close the output file even when processing
        # fails, so the redirect does not leak past this call.
        if output is not None:
            sys.stdout = original_stdout
            output.close()
Example #7
0
 def setUp(self):
     """Create the DartsDictionary under test from the loaded 'jdict' data."""
     loader = getDataLoader()
     jdict = loader.load('jdict')
     self.dictionary = dartsdict.DartsDictionary(jdict)
Example #8
0
 def setUp(self):
     """Create the two sentence parsers used by the tests."""
     loader = getDataLoader()
     self.pyparser = PyPortSentenceParser(loader)
     self.exeparser = MecabSentenceParser()
Example #9
0
 def setUp(self):
     """Create the TextProcessor under test and lift the diff size limit."""
     # maxDiff = None makes unittest show complete diffs on failure.
     self.maxDiff = None
     loader = getDataLoader()
     self.textProc = TextProcessor(loader)
Example #10
0
 def setUp(self):
     """Store the default sample sentence and create the Viterbi instance."""
     self.defaultText = '船が検疫所に着いたのは、朝の四時頃にちがいない。'
     loader = getDataLoader()
     self.viterbi = Viterbi(loader)
Example #11
0
 def setUp(self):
     """Create the Viterbi instance under test and lift the diff size limit."""
     # maxDiff = None makes unittest show complete diffs on failure.
     self.maxDiff = None
     loader = getDataLoader()
     self.viterbi = Viterbi(loader)
Example #12
0
 def setUp(self):
     """Create the Tokenizer under test from the data loader."""
     loader = getDataLoader()
     self.tokenizer = Tokenizer(loader)