def testParseAll():
    """Parse every job document in the ``daily_job_webdev`` test collection.

    Opens the ``jobaly_daily_test`` database on ``localhost:27017`` through
    ``DbClient``, iterates over everything ``newCol.find()`` yields, prints a
    banner containing each document's ``_id`` and hands the document to
    ``JobDescParser.parseJobDesc``.

    This is a manual smoke test: nothing is asserted and nothing is returned.
    """
    srcBbClient = DbClient('localhost', 27017, "jobaly_daily_test")
    newCol = srcBbClient.getCollection("daily_job_webdev")

    # No single-job lookup by ``jid`` happens here: ``jid`` is not defined in
    # this function, and the loop below visits every document anyway.
    for job in newCol.find():
        # One pre-formatted argument prints the same text under the Python 2
        # print statement and the Python 3 print function.
        print("\n\n\n====== %s ============================\n" % (job["_id"],))
        # The parsed result is not inspected; the call itself is the check
        # (it should complete without raising for every stored job).
        JobDescParser.parseJobDesc(job)
def testParseAll():
    """Smoke-test ``JobDescParser.parseJobDesc`` against a whole collection.

    Connects via ``DbClient`` to ``localhost:27017``, database
    ``jobaly_daily_test``, collection ``daily_job_webdev``. For each document
    returned by ``find()`` a separator line with the document's ``_id`` is
    printed, then the document is parsed.

    Returns:
        None. Results are not checked; a raised exception is the only
        failure signal.
    """
    client = DbClient('localhost', 27017, "jobaly_daily_test")
    collection = client.getCollection("daily_job_webdev")

    # The function body never defines ``jid``, so there is deliberately no
    # ``findById`` call before the loop; every document is processed below.
    for job in collection.find():
        banner = "\n\n\n====== %s ============================\n" % (job["_id"],)
        # Parenthesised single-argument form: identical output whether
        # ``print`` is the Python 2 statement or the Python 3 function.
        print(banner)
        JobDescParser.parseJobDesc(job)
def testParseParagraph(jid="6718adb8b28b9b39"):
    """Parse one job document and print its paragraphs.

    Looks the job up with ``DbClient.findById`` in the ``daily_job_webdev``
    collection of the ``jobaly_daily_test`` database on ``localhost:27017``,
    parses it with ``JobDescParser.parseJobDesc`` and calls
    ``printParagraphs()`` on the result.

    Args:
        jid: Identifier passed to ``DbClient.findById``. The default is the
            id this function used when it took no arguments, so existing
            zero-argument calls behave as before.

    Returns:
        None. Output goes to wherever ``printParagraphs()`` writes.
    """
    # Other sample ids kept for manual experiments:
    #   "9e216b2d65bd864b", "matrixga/78237-51", "cybercod/CN-.NETwebDev-CA3",
    #   "f3c336fa35c28771", "10116717/638726", "ocs/54391", "0e230c368a34322b"
    srcBbClient = DbClient('localhost', 27017, "jobaly_daily_test")
    newCol = srcBbClient.getCollection("daily_job_webdev")

    job = DbClient.findById(newCol, jid)
    jobDesc = JobDescParser.parseJobDesc(job)
    jobDesc.printParagraphs()
def testParseParagraph(jid="6718adb8b28b9b39"):
    """Print the parsed paragraphs of a single job document.

    Args:
        jid: Identifier handed to ``DbClient.findById``. Defaults to the
            value that was previously hard-coded, so calling the function
            without arguments behaves as before.

    The job is fetched from collection ``daily_job_webdev`` in database
    ``jobaly_daily_test`` on ``localhost:27017``, parsed by
    ``JobDescParser.parseJobDesc``, and ``printParagraphs()`` is called on
    the parse result. Nothing is returned.
    """
    # Alternative ids that have been used with this test; pass one as ``jid``
    # to try it:
    #   "9e216b2d65bd864b"
    #   "matrixga/78237-51"
    #   "cybercod/CN-.NETwebDev-CA3"
    #   "f3c336fa35c28771"
    #   "10116717/638726"
    #   "ocs/54391"
    #   "0e230c368a34322b"
    client = DbClient('localhost', 27017, "jobaly_daily_test")
    collection = client.getCollection("daily_job_webdev")
    job = DbClient.findById(collection, jid)
    JobDescParser.parseJobDesc(job).printParagraphs()