1.1安装模块
            
              pip install pykafka
            
          
          1.2基本使用
            
              # -* coding:utf8 *-  
from pykafka import KafkaClient  
host = 'IP:9092, IP:9092, IP:9092'
client = KafkaClient(hosts = host)  
# 生产者  
topicdocu = client.topics['my-topic']  
producer = topicdocu.get_producer()  
for i in range(100):  
    print i  
    producer.produce('test message ' + str(i ** 2))  
producer.stop()
            
          
          1.3简单封装
            
              class KafkaProduct():
    def __init__(self,hosts,topic):
        """
        初始化实例
        :param hosts: 连接地址
        :param topic:
        """
        self.__client = KafkaClient(hosts=hosts)
        self.__topic = self.__client.topics[topic.encode()]
    def __set_topic(self, topic):
        self.__topic = self.__client.topics[topic.encode()]
    def set_topic(self, topic):
        """
        设置topic
        :param topic:
        :return:
        """
        self.__set_topic(topic)
    def get_topics(self):
        """
        获取当前所有topic
        :return:
        """
        return self.__client.topics
    def get_topic(self):
        """
        获取当前topic
        :return:
        """
        return self.__topic
    def Producer(self):
        """
        生产者对象
        :return:
        """
        with self.__topic.get_producer(delivery_reports=True) as producer:
            next_data = ''
            while True:
                if next_data:
                    producer.produce(str(next_data).encode())
                next_data = yield True
    def send_data(self,datas):
        """
        发送数据
        :param datas:需要传入的可迭代对象
        :return:
        """
        c = self.Producer()
        next(c)
        for i in datas:
            c.send(i)
if __name__ == '__main__':
hosts = "1.2.3.4:9999,2.3.4.5:9090" #连接hosts
topic = "test_523"
K = KafkaProduct(hosts=hosts, topic=topic)  #
#K.set_topic("test")  #切换设置新的topic
K.get_topic()  #获取当前设置的topic
#K.get_topics() #获取所有topic
data = range(10000)  #要发送的可迭代对象
K.send_data(data)
            
          
          1.4引用来源
博客园:Python测试Kafka集群(pykafka)
知乎:使用生成器把Kafka写入效率提高1000倍


 
					 
					