def consume(self, topic): #consumer=KafkaConsumer(topic,group_id=self.configs["group_id"],bootstrap_servers=self.configs["zookeeper"].split(","), auto_commit_enable=False) client=KafkaClient(self.configs["broker_list"].split(",")) consumer=SimpleConsumer(topic=topic,group=self.configs["group_id"],client=client, auto_commit=False) while(True): # message is (partition, msg). for msg, it has key, value as param. for message in consumer.get_messages(10): #print("[%s.consumer] %s-part-%d: value=%s" % (self.configs["group_id"],topic,message[0],message[1])) print("[%s.consumer] %s-part-%d: key=%s value=%s" % (self.configs["group_id"],topic, message[0], message[1].key,message[1].value))
def test_writer(): topic = '%s-mutations' % (uuid.uuid1().hex,) client = KafkaClient('kafka') producer = SimpleProducer(client) writer = KafkaWriter(producer, topic) inputs = list(transaction) writer.push(inputs) consumer = SimpleConsumer(client, 'test', topic, auto_offset_reset='smallest') outputs = map( writer.codec.decode, map( operator.attrgetter('message.value'), list(consumer.get_messages(count=3)), ), ) assert outputs == inputs
def test_handler(): topic = '%s-mutations' % (uuid.uuid1().hex,) codec = BinaryCodec(Message) client = KafkaClient('kafka') producer = SimpleProducer(client) writer = KafkaWriter(producer, topic, codec) inputs = list(transaction) writer.push(inputs) consumer = SimpleConsumer(client, 'test', topic, auto_offset_reset='smallest') outputs = map( codec.decode, map( operator.attrgetter('message.value'), list(consumer.get_messages(count=3)), ), ) assert outputs == inputs
class KafkaBroker(object): USER_PRODUCER = 0 FIXED_PRODUCER = 1 SIMPLE_PRODUCER = 2 NON_PRODUCER = 3 SIMPLE_CONSUMER = 0 NON_CONSUMER = 1 SOCKET_TIMEOUT = 60 #second def __init__(self, kafkaHost=None, kafkaGroup=None, kafkaTopic=None, consumerType=NON_CONSUMER, consumerPartitions=[], producerType=NON_PRODUCER, producerPartitions=[]): self.kafkaHost = kafkaHost self.kafkaGroup = kafkaGroup self.kafkaTopic = kafkaTopic self.consumerPartitions = consumerPartitions self.producerPartitions = producerPartitions self.connect(kafkaHost) try: if producerType == self.SIMPLE_PRODUCER: self.producer = SimpleProducer(self.kafkaClient, async=False, req_acks=KeyedProducer.ACK_NOT_REQUIRED) elif producerType == self.FIXED_PRODUCER: self.producer = FixedProducer(self.kafkaClient, producerPartitions[0], async=False, req_acks=KeyedProducer.ACK_NOT_REQUIRED) elif producerType == self.USER_PRODUCER: self.producer = UserProducer(self.kafkaClient, async=False, req_acks=KeyedProducer.ACK_NOT_REQUIRED) elif producerType == self.NON_PRODUCER: self.producer = None else: raise Exception("wrong producer type {}".format(producerType)) if consumerType == self.SIMPLE_CONSUMER: if not consumerPartitions: self.consumer = SimpleConsumer(self.kafkaClient, self.kafkaGroup, self.kafkaTopic) else: self.consumer = SimpleConsumer(self.kafkaClient, self.kafkaGroup, self.kafkaTopic, partitions=self.consumerPartitions) logger.debug('consumer is listening on {}@{}'.format(self.kafkaTopic, self.consumerPartitions)) elif consumerType == self.NON_CONSUMER: self.consumer = None else: raise Exception("wrong consumer type {}".format(consumerType)) except Exception as e: logger.warning('Exception {}'.format(e)) logger.debug(traceback.format_exc()) self.consumer = None self.producer = None self.kafkaClient = None def close(self): if self.consumer: self.consumer.commit() self.consumer.stop() self.consumer = None if self.producer: self.producer.stop() self.producer = None if self.kafkaClient: self.kafkaClient.close() self.kafkaClient = None logger.info('Kafka connection closed') def connect(self, kafkaHost, countdown=COUNT_DOWN): if countdown == 0: logger.error('kafka server can not be connected in {} times'.format(COUNT_DOWN)) return try: self.kafkaClient = KafkaClient(kafkaHost, timeout=self.SOCKET_TIMEOUT) except: logger.warning('try to connect kafka server again {}'.format(countdown)) self.connect(kafkaHost, countdown - 1) logger.info('Kafka client connected {}'.format(self.kafkaClient)) def reconnect(self, countdown=COUNT_DOWN): if countdown == 0: logger.error('kafka server can not be connected in {} times'.format(COUNT_DOWN)) return try: self.kafkaClient.reinit() except: self.reconnect(countdown - 1) def produce(self, op, name, **kwargs): # TODO: when name is None, the operation is propagated to all partitions if not op or not name: logger.warning('op or name must not be empty') return try: dictMessage = dict(kwargs) dictMessage['op'] = op dictMessage['name'] = name encodedMessage = simplejson.dumps(dictMessage) self.producer.send(self.kafkaTopic, name, encodedMessage) except KafkaError as e: logger.warning('Exception {}'.format(e)) logger.debug(traceback.format_exc()) self.reconnect() except Exception as e: logger.warning('Exception {}'.format(e)) logger.debug(traceback.format_exc()) def echo(self, message=''): self.produce('Echo', 'testing', message=message) def set_consumer_partition(self, consumerPartitions): if not consumerPartitions: logger.warning('consumer partitions can not be empty') return if self.consumer: self.consumer.commit() self.consumer.stop() self.consumer = None self.consumerPartitions = consumerPartitions try: self.consumer = SimpleConsumer(self.kafkaClient, self.kafkaGroup, self.kafkaTopic, partitions=self.consumerPartitions) except KafkaError as e: logger.warning('Exception {}'.format(e)) logger.debug(traceback.format_exc()) self.reconnect() except Exception as e: logger.warning('Exception {}'.format(e)) logger.debug(traceback.format_exc()) def is_consumer_ready(self): if not self.consumer: logger.warning('Consumer is not ready yet') return False return True def seek(self, skip): if self.is_consumer_ready(): if skip == -1: self.consumer.seek(0, 2) else: self.consumer.seek(skip, 1) def commit(self): if self.is_consumer_ready(): self.consumer.commit() def consume_one(self): if not self.is_consumer_ready(): return None try: message = self.consumer.get_message() if not message: return None logger.debug('received message {}'.format(message.message.value)) return message.message.value except Exception as e: logger.warning('Exception {}'.format(e)) logger.debug(traceback.format_exc()) self.reconnect() return None def consume(self, count=10): if not self.is_consumer_ready(): return [] try: messages = self.consumer.get_messages(count=count) return [message.message.value for message in messages] except Exception as e: logger.warning('Exception {}'.format(e)) logger.debug(traceback.format_exc()) self.reconnect() return []