es数据迁移脚本(python)

#!/usr/bin/python

# -*- coding: UTF-8 -*-

# 文件名：indiceCreate.py

import sys

import base64

import time

import httplib

import json

## 老集群host（ip+port）

oldClusterHost = "192.168.1.85:9200"

## 老集群用户名，可为空

oldClusterUserName = "elastic"

## 老集群密码，可为空

oldClusterPassword = "elastic"

## 新集群host（ip+port）

newClusterHost = "192.168.1.118:9200"

## 新集群用户名，可为空

newClusterUser = ""

## 新集群密码，可为空

newClusterPassword = ""

DEFAULT_REPLICAS = 0

def httpRequest(method, host, endpoint, params="", username="", password=""):

    conn = httplib.HTTPConnection(host)

    headers = {}

    if (username != "") :

        'Hello {name}, your age is {age} !'.format(name = 'Tom', age = '')

        base64string = base64.encodestring('{username}:{password}'.format(username = username, password = password)).replace('\n', '')

        headers["Authorization"] = "Basic %s" % base64string;

    if "GET" == method:

        headers["Content-Type"] = "application/x-www-form-urlencoded"

        conn.request(method=method, url=endpoint, headers=headers)

    else :

        headers["Content-Type"] = "application/json"

        conn.request(method=method, url=endpoint, body=params, headers=headers)

    response = conn.getresponse()

    res = response.read()

    return res

def httpGet(host, endpoint, username="", password=""):

    return httpRequest("GET", host, endpoint, "", username, password)

def httpPost(host, endpoint, params, username="", password=""):

    return httpRequest("POST", host, endpoint, params, username, password)

def httpPut(host, endpoint, params, username="", password=""):

    return httpRequest("PUT", host, endpoint, params, username, password)

def getIndices(host, username="", password=""):

    endpoint = "/_cat/indices"

    indicesResult = httpGet(oldClusterHost, endpoint, oldClusterUserName, oldClusterPassword)

    indicesList = indicesResult.split("\n")

    indexList = []

    for indices in indicesList:

        if (indices.find("open") > 0):

            indexList.append(indices.split()[2])

    return indexList

def getSettings(index, host, username="", password=""):

    endpoint = "/" + index + "/_settings"

    indexSettings = httpGet(host, endpoint, username, password)

    print index + " 原始settings如下：\n" + indexSettings

    settingsDict = json.loads(indexSettings)

    ## 分片数默认和老集群索引保持一致

    number_of_shards = settingsDict[index]["settings"]["index"]["number_of_shards"]

    ## 副本数默认为0

    number_of_replicas = DEFAULT_REPLICAS

    newSetting = "\"settings\": {\"number_of_shards\": %s, \"number_of_replicas\": %s}" % (number_of_shards, number_of_replicas)

    return newSetting

def getMapping(index, host, username="", password=""):

    endpoint = "/" + index + "/_mapping"

    indexMapping = httpGet(host, endpoint, username, password)

    print index + " 原始mapping如下：\n" + indexMapping

    mappingDict = json.loads(indexMapping)

    mappings = json.dumps(mappingDict[index]["mappings"])

    newMapping = "\"mappings\" : " + mappings

    return newMapping

def createIndexStatement(oldIndexName):

    settingStr = getSettings(oldIndexName, oldClusterHost, oldClusterUserName, oldClusterPassword)

    mappingStr = getMapping(oldIndexName, oldClusterHost, oldClusterUserName, oldClusterPassword)

    createstatement = "{\n" + str(settingStr) + ",\n" + str(mappingStr) + "\n}"

    return createstatement

def createIndex(oldIndexName, newIndexName=""):

    if (newIndexName == "") :

        newIndexName = oldIndexName

    createstatement = createIndexStatement(oldIndexName)

    print "新索引 " + newIndexName + " 的setting和mapping如下：\n" + createstatement

    endpoint = "/" + newIndexName

    createResult = httpPut(newClusterHost, endpoint, createstatement, newClusterUser, newClusterPassword)

    print "新索引 " + newIndexName + " 创建结果：" + createResult

## main

indexList = getIndices(oldClusterHost, oldClusterUserName, oldClusterPassword)

systemIndex = []

for index in indexList:

    if (index.startswith(".")):

        systemIndex.append(index)

    else :

        createIndex(index, index)

if (len(systemIndex) > 0) :

    for index in systemIndex:

        print index + " 或许是系统索引，不会重新创建，如有需要，请单独处理～"

以上同步的时候设置的副本数是0,目的是加快同步速度，同步完成后需要设置副本数，如下:
curl -H "Content-Type: application/json" -XPUT 'http://192.168.1.118:9200/db_customer/_settings' -d '{
"number_of_replicas" : 1
}'

es数据迁移脚本(python)的更多相关文章

运维脚本-elasticsearch数据迁移python3脚本
elasticsearch数据迁移python3脚本 #!/usr/bin/python3 #elsearch 数据迁移脚本 #迁移工具路径 import time,os #下面命令是用到了一个go语 ...
ELK数据迁移,ES快照备份迁移
通过curl命令或者kibana快照备份,恢复的方式进行数据迁移环境介绍之前创建的ELK 因为VPC环境的问题,需要对ELK从新部署,但是还需要保留现有的数据,于是便有了这篇文档. 10.0.20 ...
Entity Framework Code First Migrations--EF 的数据迁移
1. 为了演示方便,首先新建一个控制台项目,然后添加对entityframework的引用使用nuget控制台执行: Install-Package EntityFramework 2.新建一个实体 ...
Mycat 分片规则详解--数据迁移及节点扩容
使用的是 Mycat 提供的 dataMigrate 脚本进行对数据进行迁移和节点扩容,目前支持的 Mycat 是1.6 版本,由于 Mycat 是由 Java 编写的因此在做数据迁移及节点扩容时需要 ...
MySQL 到 ES 数据实时同步技术架构
MySQL 到 ES 数据实时同步技术架构我们已经讨论了数据去规范化的几种实现方式.MySQL 到 ES 数据同步本质上是数据去规范化多种实现方式中的一种,即通过"数据迁移同步" ...
使用rdb文件进行redis数据迁移--python脚本
查找了一些redis迁移的方法,一般做法就是 1. 从源数据库把rdb文件保存,然后传到新的主机上,启动新的redis即可 2. 把新的redis当做源数据库的slave,同步数据今天开发提了一个测 ...
【Python】Django删除数据迁移记录
find . -path "*migrations*" -name "*.py" -not -path "*__init__*" -exec ...
Python进行Redis数据迁移
Python进行Redis数据迁移由于开发时的误操作,导致redis数据损坏,所以需要进行redis的数据迁移,网上大佬的教程基本都是需要下载附加工具,亦或是需要一些复杂的操作,个人觉得麻烦还不如写 ...
elasticsearch-dump 迁移es数据（elasticdump）
elasticsearch 部分查询语句 # 获取集群的节点列表: curl 'localhost:9200/_cat/nodes?v' # 列出所有索引: curl 'localhost:9200/ ...

随机推荐

jQuery发布1.9正式版，最后支持IE 6/7/8
jQuery 于 2013/1/15 正式发布了 1.9 版本,这个版本最值得关注的,不是又增加了什么新功能,而是它去掉了哪些东西!jQuery 1.9 删除和改动了不少过时的 API,升级后可能会导 ...
Entity Framework学习初级篇2
Entity Framework 学习初级篇2--ObjectContext.ObjectQuery.ObjectStateEntry.ObjectStateManager类的介绍本节,简单的介绍E ...
Locust性能测试
https://www.cnblogs.com/yoyoketang/p/9638151.html https://www.cnblogs.com/yoyoketang/p/9642242.html ...
漏洞复现：Struts2 S2-032 漏洞环境
Struts2 S2-032 漏洞环境 http://vulapps.evalbug.com/s_struts2_s2-032/ POC: http://127.0.0.1/memoindex.act ...
javascript 面向对象之路.1 - 小蜜蜂
写这个系列文章是想通过几个案例来学习javascript html5 css3,其实这个小游戏谁都能做出来,但对于一个作为后端.net程序员的我来说还是有学习的必要,毕竟javascript的面向对象 ...
Android Studio -- 关联源码
1,昨天刚把SDK升级到25,然后准备开始新的一年码代码,结果发现查看源码的时候出现了一堆的“ throw new RuntimeException("Stub!");” 网上搜 ...
Rest概念学习
参考文章 http://www.cnblogs.com/shanyou/archive/2012/05/12/2496959.html http://www.cnblogs.com/loveis715 ...
<1>Cocos Creator安装和启动
学习之间需要了解JavaScritp基本语法和面向对象,详情参考https://blog.csdn.net/jadeshu/article/category/7476938 1.下载Cocos Cre ...
linux正则
正则表达式分两类: 基本正则表达式:BRE 扩展正则表达式:ERE :grep -E, egrep 正则表达式引擎: 采用不同算法,检查处理正则表达式的软件模块 PCRE(Perl ...
Yii2 Restful api搜索实现

es数据迁移脚本(python)

es数据迁移脚本(python)的更多相关文章

随机推荐

热门专题