Python 操作ES(elasticsearch)

发布时间：2019-09-02 07:56:04 | 编辑：auto | 阅读（2645）

# -*- coding: utf-8 -*-

#http://www.cnblogs.com/letong/p/4749234.html
#http://elasticsearch-py.readthedocs.io/en/master/api.html#elasticsearch
#http://blog.csdn.net/xiaoxinwenziyao/article/details/49471977
#https://github.com/Parsely/pykafka

from datetime import datetime
from elasticsearch import Elasticsearch
from elasticsearch.helpers import bulk

# Kafka is the "official flow" path for writing data. In this listing the
# producer is only referenced by the commented-out save4Kafka below.
from pykafka import KafkaClient

topicName = ""
kafkaHosts = ""
client = KafkaClient(hosts=kafkaHosts)
topic = client.topics[topicName]
producer = topic.get_producer()

# `es` is the cluster that gets counted and searched (the source);
# `es_Test` is the cluster that receives the bulk writes (the target).
# Hosts are blank placeholders here and must be filled in before running.
es = Elasticsearch(
	[{"host": "", "port": 9200, "timeout": 15000}]
)
es_Test = Elasticsearch(
	[{"host": "", "port": 9200}]
)

#{"method":"save","data":[{},{}]}
# def save4Kafka(result):
# 	DATAS=[]
# 	for rdata in result["hits"]["hits"]:
# 		source = rdata["_source"]
# 		DATAS.append(source)

# 	producer.produce({"method":"save","data":DATAS}.toString)
#
def save4ES(result):
	"""Bulk-index every hit of one search response into the ``es_Test`` cluster.

	Each hit's ``_source`` document is wrapped in a bulk action targeting the
	module-level ``indexName`` / ``typeName`` and sent through ``bulk``.

	Args:
		result: A search response dict. Every entry of
			``result["hits"]["hits"]`` must contain a ``"_source"`` key.

	Note:
		The progress line reads the module-level globals ``x`` (current page)
		and ``page`` (total pages), which are set by the paging loop at the
		bottom of the file, so this function must only be called once they
		exist.

	Raises:
		KeyError: If the response or a hit lacks the expected keys.
		Any error raised by ``bulk``; ``raise_on_error=True`` asks the helper
		to raise on failed actions instead of only reporting them.
	"""
	actions = [
		{
			"_index": indexName,
			"_type": typeName,
			"_source": hit["_source"],
		}
		for hit in result["hits"]["hits"]
	]

	success = bulk(es_Test, actions, index=indexName, raise_on_error=True)

	# Formatted explicitly so the output is the same "success x page" line
	# under Python 2 and is also valid syntax under Python 3.
	print("%s %s %s" % (success, x, page))

# Index and document type to copy. Empty placeholders in this listing;
# fill them in before running.
indexName = ""
typeName = ""

# Total number of documents in the source index.
count = es.count(index=indexName)["count"]

# Number of documents fetched per page.
pageLine = 1000

# Number of pages, rounded up. Floor division keeps the result an int on
# Python 3 as well as Python 2 (plain "/" would produce a float there).
page = (count + pageLine - 1) // pageLine

# First page to copy.
# NOTE(review): presumably the resume point of an earlier, interrupted run --
# confirm, and set to 0 to copy the whole index.
startPage = 7233

# Fetch the data page by page and copy each page to the target cluster.
# NOTE(review): Elasticsearch rejects requests whose from + size exceeds the
# index's max_result_window setting (10000 by default), so offsets this deep
# only work if that limit was raised on the source index. Consider the scroll
# API / elasticsearch.helpers.scan for a full-index copy.
for x in range(startPage, page):
	result = es.search(index=indexName, from_=x * pageLine, size=pageLine)
	# save4Kafka(result)
	save4ES(result)


                        
                        
                            
关键字：
                                                                
                                
                                
                            
                        

                
                            上一篇：
                                                                    用Python实现一个简易的WebSoc                            
                            下一篇：
                                                                    Python 编写几个经典例子



        


    
    

    
    
    


    
    
        
             
            
                
                    
                        Run博客上线，欢迎访问
                        内容如有侵犯，请立即联系管理员删除
                        本站内容仅供学习和参阅，不做任何商业用途
                    
                
            
        
    

    
    
        
            标签云
        
        
            
                python3djangopython3爬虫python运维开发linuxpyspiderpython基础dockergitsvnpython练习requestsscrapy系统/运维python全栈人工智能bs4tkinterseleniumurllibphppythonrequests_htmlvue图像处理                
                
                
                
                
                
                
                
            
        
    

    



    
    
        
            搜索
        
        
            
                
                    
                        
                        
                    
                
            
        
    

    
    
        
            热门推荐
        
        
            
                 H3C基本命令大全
                                         53532 
                    

                    
                        
                            
                            
                        

                     H3C IRF原理及 配置                      40353 
                    

                    
                        
                            
                            
                        

                     Python exit()函数
                                         34757 
                    

                    
                        
                            
                            
                        

                     python全系列官方中文文档                     30515 
                    

                    
                        
                            
                            
                        

                     python 获取网卡实时流量
                                         25394 
                    

                    
                        
                            
                            
                        

                     1.常用turtle功能函数                     25183 
                    

                    
                        
                            
                            
                        

                     python 获取Linux和Windows硬件信息
                                         23597 
                    

                    
                        
                            
                            
                        

                     天天基金网数据接口                     18873 
                    

                    
                        
                            
                            
                        

                     Selenium使用代理IP&无头模式访问网站
                                         15175 
                    

                    
                        
                            
                            
                        

                     Selenium&Pytesseract模拟登录+验证码识别                     14688 
                    

                    
                        
                            
                            
                        

                    

            
        
    

    
    
        
            最新文章
        
        
            
                 LangGraph Studio可视化
                                         1151° 
                    
                    
                        
                        
                     LangSmith开发-应用入门                     1075° 
                    
                    
                        
                        
                     LangGraph开发-多轮对话问答机器人
                                         1145° 
                    
                    
                        
                        
                     LangGraph开发-条件分支/循环图实战                     1164° 
                    
                    
                        
                        
                     LangGraph开发-生态介绍，入门demo实战
                                         1199° 
                    
                    
                        
                        
                     LangChain-接入12306-HTTP MCP智能体                     1353° 
                    
                    
                        
                        
                     LangChain接入自定义爬虫-MCP工具
                                         1313° 
                    
                    
                        
                        
                     LangChain接入Filesystem-MCP工具                     1286° 
                    
                    
                        
                        
                     LangChain搭建MCP服务端和客户端流程
                                         1384° 
                    
                    
                        
                        
                     LangGraph与MCP技术概述                     1327° 
                    
                    
                        
                        
                                
        
    

    
    
        
            博主信息
        
        
            
                姓名：Run
                职业：谜
                邮箱：383697894@qq.com
                定位：上海 · 松江
            
        
    
    
    
        
            扫我打开
        
        
	    
        
    

    
    
        
            友情链接
        
        
            百度
            淘宝
            腾讯
            慕课网
            CSDN
            博客园
            51cto博客