def loadCouchDB(db_name, view_name, excel_name):
    """Dump the rows of a CouchDB view into an Excel workbook.

    Each view row becomes one spreadsheet row on the sheet titled
    "range names":

    * column 1 -- the row key rendered as text with ``[`` and ``]`` removed,
    * column 2 -- the result of ``getPolarity`` applied to the row value,
    * column 3 -- the row value itself.

    A second sheet titled 'coordinate' is appended (left empty) before the
    workbook is written to ``excel_name``.

    :param db_name: name of the database to open on the CouchDB server.
    :param view_name: name of the view whose rows are exported.
    :param excel_name: path of the workbook file to write.
    :return: an empty dict (nothing is ever stored in it).
    """
    server = Server("http://115.146.94.12:5984")
    server.resource.credentials = ('admin', 'admin')
    server.config()
    database = server[db_name]

    workbook = Workbook()
    sheet = workbook.active
    sheet.title = "range names"

    # Spreadsheet rows are numbered from 1.
    for line_no, entry in enumerate(database.view(view_name), 1):
        # Column 1: the key without its list brackets.
        coordinate = re.sub(r"\[|\]", "", str(entry.key))
        coordinate_ref = '%s%s' % (get_column_letter(1), line_no)
        sheet.cell(coordinate_ref).value = coordinate

        # Column 2: polarity derived from the row value.
        polarity_ref = '%s%s' % (get_column_letter(2), line_no)
        sheet.cell(polarity_ref).value = getPolarity(entry.value)

        # Column 3: the raw row value.
        text_ref = '%s%s' % (get_column_letter(3), line_no)
        sheet.cell(text_ref).value = entry.value

    # NOTE(review): the extra sheet is taken to be created once, after all
    # rows have been written -- confirm against the intended layout.
    workbook.create_sheet().title = 'coordinate'
    workbook.save(filename=excel_name)

    # The function never collects anything; callers get an empty dict.
    return {}
def loadCouchDB(db_name, view_name, start_key, end_key):
    """Read the ASCII-only rows of a CouchDB view within a key range.

    The view is queried with ``reduce=False`` between ``start_key`` and
    ``end_key``. Rows whose value contains any non-ASCII character are
    skipped; every other row is returned as ``key + "@@##$$" + value``.

    Reading is best-effort: if an error occurs while iterating the view it
    is logged (with traceback) and the rows collected so far are returned.
    ``KeyboardInterrupt`` and ``SystemExit`` are not intercepted.

    :param db_name: name of the database to open on the CouchDB server.
    :param view_name: name of the view to read.
    :param start_key: ``startkey`` passed to the view query.
    :param end_key: ``endkey`` passed to the view query.
    :return: list of ``"<key>@@##$$<text>"`` strings.
    """
    couch_server = Server("http://115.146.94.12:5984")
    couch_server.resource.credentials = ("admin", "admin")
    couch_server.config()
    db = couch_server[db_name]

    host = socket.gethostname()
    # Compiled once; matches any run of characters outside 7-bit ASCII.
    non_ascii = re.compile(r"[^\x00-\x7F]+")
    tweet_dict = []

    start_reading_db_time = time.time()
    try:
        logger.info("%s Start reading %s on database", host, view_name)
        for row in db.view(view_name, reduce=False, startkey=start_key, endkey=end_key):
            text = row.value
            if non_ascii.search(text) is None:
                tweet_dict.append(row.key + "@@##$$" + text)
    except Exception:
        # Keep whatever was read so far, but record why reading stopped.
        logger.exception("%s Reading %s error.", host, view_name)
    reading_db_time = time.time() - start_reading_db_time

    logger.info("%s Finished reading %s.", host, view_name)
    # Lazy %-formatting: the keys may be lists, numbers or None, which would
    # make string concatenation raise TypeError.
    logger.info(
        "%s Read %s from %s to %s for %ss.",
        host,
        view_name,
        start_key,
        end_key,
        reading_db_time,
    )
    return tweet_dict
__author__ = 'josh'

import sys

import couchdb
from couchdb import Server


def main(source_name, dbname):
    """Load ``key ###### count`` lines from a file into a CouchDB database.

    The database ``dbname`` is created if possible; if creation fails with
    ``PreconditionFailed`` the existing database of that name is used. Each
    non-blank line of ``source_name`` is split on ``" ###### "`` into a key
    and a count, and stored as the document ``{"count": count}`` under that
    key. The count is stored as the text read from the file.

    :param source_name: path of the input text file.
    :param dbname: name of the target database.
    :raises ValueError: if a non-blank line does not split into exactly
        two parts on the separator.
    """
    couch_server = Server("http://115.146.94.12:5984")
    couch_server.resource.credentials = ('admin', 'admin')
    couch_server.config()

    try:
        couch_db = couch_server.create(dbname)
    except couchdb.http.PreconditionFailed:
        # Creation was refused; fall back to opening the database by name.
        couch_db = couch_server[dbname]

    # The context manager guarantees the file is closed, even on error.
    with open(source_name) as source:
        for line in source:
            line = line.strip()
            if line == '':
                continue
            key, count = line.split(" ###### ")
            couch_db[key] = {"count": count}


if __name__ == "__main__":
    main(sys.argv[1], sys.argv[2])