-
Notifications
You must be signed in to change notification settings - Fork 0
/
AvroAppender.py
57 lines (47 loc) · 1.74 KB
/
AvroAppender.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
import Queue
import avro.schema
import time
import threading
from avro.datafile import DataFileReader, DataFileWriter
from avro.io import DatumReader, DatumWriter
schema = avro.schema.parse(open("log_schema.avsc").read())
class AvroAppender(threading.Thread):
def __init__(self, file):
threading.Thread.__init__(self)
self.avro_writer = DataFileWriter(open(file, "w"), DatumWriter(), schema)
self.queue = Queue.Queue()
self.should_stop = False
self.mutex = threading.Lock()
self.start()
def log_append(self, user, advertiser, **kwargs):
if user is not None and advertiser is not None:
record = dict(user=user, advertiser=advertiser)
if kwargs["ip"]:
record["ip"] = kwargs["ip"]
if kwargs["agent"]:
record["agent"] = kwargs["agent"]
if kwargs["time"]:
record["timestamp"] = float(kwargs["time"])
else:
record["timestamp"] = float(time.time())
if kwargs["keywords"]:
record["keywords"] = list(set([string.strip() for string in kwargs["keywords"].split(",")]))
self.queue.put_nowait(record)
else:
print "Missing user"
def close_appender(self):
self.mutex.acquire()
self.should_stop = True
self.mutex.release()
def run(self):
while True:
try:
record = self.queue.get(False, 1000)
self.avro_writer.append(record)
except Queue.Empty:
self.mutex.acquire()
stop = self.should_stop
self.mutex.release()
if stop:
break
self.avro_writer.close()