elasticsearch-1.3.0

发送请求

创建

[root@centos ~]# curl -XPUT 172.16.136.159:9200/customer?pretty

{

  "acknowledged" : true

}

索引

[root@centos ~]# curl -XPUT 172.16.136.159:9200/customer/external/1?pretty '-d { "name":"JOhn Doe"}'

{

  "_index" : "customer",

  "_type" : "external",

  "_id" : "1",

  "_version" : 1,

  "created" : true

}

[root@centos ~]# curl -XPUT 172.16.136.159:9200/customer/external/1?pretty '-d { "name":"JOhn Doe"}'

{

  "_index" : "customer",

  "_type" : "external",

  "_id" : "1",

  "_version" : 2,

  "created" : false

}

这里先跟踪下索引的流程，netty的bootstrap暂且不管，从HttpRequestHandler的messageReceived说起

/**
 * Handles an incoming message event: casts its payload to an HTTP request, wraps the request
 * and the event's channel in the transport-level types, hands both to {@code serverTransport},
 * and finally delegates to the superclass implementation.
 */
public void messageReceived(ChannelHandlerContext ctx, MessageEvent e) throws Exception {
    final HttpRequest nettyRequest = (HttpRequest) e.getMessage();
    // Netty's HTTP handling always copies the payload into its own buffer, either inside
    // NioWorker while reading, or through a cumulation buffer.
    final NettyHttpRequest wrappedRequest = new NettyHttpRequest(nettyRequest, e.getChannel());
    final NettyHttpChannel responseChannel =
            new NettyHttpChannel(serverTransport, e.getChannel(), wrappedRequest);
    serverTransport.dispatchRequest(wrappedRequest, responseChannel);
    super.messageReceived(ctx, e);
}

这里的dispatchRequest其实就是NettyHttpServerTransport的dispatchRequest方法

NettyHttpServerTransport

/**
 * Hands the request and its response channel to the configured {@code httpServerAdapter}.
 *
 * @param request the HTTP request to dispatch
 * @param channel the channel on which the response is to be sent
 */
void dispatchRequest(HttpRequest request, HttpChannel channel) {

    httpServerAdapter.dispatchRequest(request, channel);

}

Dispatcher,static class Dispatcher implements HttpServerAdapter

/**
 * Adapter entry point: forwards the request and channel to {@code server.internalDispatchRequest}.
 *
 * @param request the HTTP request to dispatch
 * @param channel the channel on which the response is to be sent
 */
public void dispatchRequest(HttpRequest request, HttpChannel channel) {

    server.internalDispatchRequest(request, channel);

}

HttpServer

/**
 * Routes an HTTP request: raw paths starting with "/_plugin/" are run through a filter chain
 * built around {@code pluginSiteFilter}; every other request is dispatched directly by the
 * REST controller.
 *
 * @param request the incoming HTTP request
 * @param channel the channel on which the response is to be sent
 */
public void internalDispatchRequest(final HttpRequest request, final HttpChannel channel) {
    final boolean isPluginSiteRequest = request.rawPath().startsWith("/_plugin/");
    if (!isPluginSiteRequest) {
        restController.dispatchRequest(request, channel);
        return;
    }
    restController.filterChain(pluginSiteFilter).continueProcessing(request, channel);
}

RestController的dispatchRequest()主要是调用executeHandler()

try {

    executeHandler(request, channel);

} catch (Throwable e) {

executeHandler方法中由不同的handler处理请求，这里的handler是RestIndexAction，继承自BaseRestHandler

// Look up the handler for this request; the result is null-checked before use.
final RestHandler handler = getHandler(request);

if (handler != null) {

    // A handler was found: let it process the request and write to the channel.
    // (The no-handler path is not part of this excerpt.)
    handler.handleRequest(request, channel);

}

在BaseRestHandler中

/**
 * Entry point for REST handling: picks the client to use and delegates to the three-argument
 * {@code handleRequest}. When no useful headers are configured the handler's own client is
 * used as-is; otherwise it is wrapped in a {@code HeadersCopyClient} built from the client,
 * the request and the configured headers.
 */
public final void handleRequest(RestRequest request, RestChannel channel) throws Exception {
    final Client effectiveClient;
    if (usefulHeaders.length == 0) {
        effectiveClient = client;
    } else {
        effectiveClient = new HeadersCopyClient(client, request, usefulHeaders);
    }
    handleRequest(request, channel, effectiveClient);
}

/**
 * Handler-specific request processing, to be implemented by subclasses.
 *
 * @param request the REST request to handle
 * @param channel the channel on which the response is to be sent
 * @param client  the client the implementation should use for this request
 * @throws Exception if handling the request fails
 */
protected abstract void handleRequest(RestRequest request, RestChannel channel, Client client) throws Exception;

RestIndexAction实现了父类BaseRestHandler中的抽象handleRequest方法，最后调用NodeClient的index方法

client.index(indexRequest, new RestBuilderListener<IndexResponse>(channel) {

NodeClient的父类AbstractClient中index的实现

/**
 * Executes an index request by delegating to {@code execute} with {@code IndexAction.INSTANCE}.
 *
 * @param request  the index request to run
 * @param listener callback that receives the {@code IndexResponse} or the failure
 */
public void index(final IndexRequest request, final ActionListener<IndexResponse> listener) {

    execute(IndexAction.INSTANCE, request, listener);

}

NodeClient中的execute方法实现

/**
 * Looks up the transport action registered for the given client action and runs the request
 * on it, reporting the outcome to the listener.
 */
public <Request extends ActionRequest, Response extends ActionResponse, RequestBuilder extends ActionRequestBuilder<Request, Response, RequestBuilder, Client>> void execute(Action<Request, Response, RequestBuilder, Client> action, Request request, ActionListener<Response> listener) {
    final ClientAction registryKey = (ClientAction) action;
    // For an index request this resolves to TransportIndexAction
    // (which extends TransportShardReplicationOperationAction).
    TransportAction<Request, Response> target = actions.get(registryKey);
    target.execute(request, listener);
}

这里的transportAction是TransportIndexAction，

其中TransportShardReplicationOperationAction是TransportIndexAction的父类，TransportShardReplicationOperationAction又继承自TransportAction。TransportAction中execute的实现

/**
 * Validates the request and runs the action.
 *
 * <p>If the request asks for a threaded listener, the listener is wrapped in a
 * {@code ThreadedActionListener} first, so validation failures are reported through the
 * wrapper as well. A failed validation is delivered via {@code onFailure} and nothing is
 * executed. Any {@code Throwable} escaping {@code doExecute} is trace-logged and also
 * delivered via {@code onFailure}.
 */
public void execute(Request request, ActionListener<Response> listener) {
    ActionListener<Response> callback = listener;
    if (request.listenerThreaded()) {
        callback = new ThreadedActionListener<>(threadPool, listener, logger);
    }

    final ActionRequestValidationException invalid = request.validate();
    if (invalid == null) {
        try {
            doExecute(request, callback);
        } catch (Throwable failure) {
            logger.trace("Error during transport action execution.", failure);
            callback.onFailure(failure);
        }
    } else {
        callback.onFailure(invalid);
    }
}

直接调用TransportIndexAction的doExecute

 /**
  * Runs an index request, creating the target index first when auto-creation applies.
  *
  * <p>If auto-creation is not needed, the request goes straight to {@code innerExecute}.
  * Otherwise a create-index request is issued; on success, or when the failure unwraps to an
  * {@code IndexAlreadyExistsException}, the index request proceeds. Any other failure is
  * handed to the listener.
  */
 protected void doExecute(final IndexRequest request, final ActionListener<IndexResponse> listener) {
     // if we don't have a master, we don't have metadata, that's fine, let it find a master using create index API
     final boolean autoCreate = autoCreateIndex.shouldAutoCreate(request.index(), clusterService.state());
     if (!autoCreate) {
         innerExecute(request, listener);
         return;
     }

     request.beforeLocalFork(); // we fork on another thread...
     final CreateIndexRequest createRequest = new CreateIndexRequest(request.index())
             .cause("auto(index api)")
             .masterNodeTimeout(request.timeout());
     createIndexAction.execute(createRequest, new ActionListener<CreateIndexResponse>() {
         @Override
         public void onResponse(CreateIndexResponse result) {
             innerExecute(request, listener);
         }

         @Override
         public void onFailure(Throwable e) {
             final boolean indexAlreadyExists =
                     ExceptionsHelper.unwrapCause(e) instanceof IndexAlreadyExistsException;
             if (!indexAlreadyExists) {
                 listener.onFailure(e);
                 return;
             }
             // we have the index, do it
             try {
                 innerExecute(request, listener);
             } catch (Throwable e1) {
                 listener.onFailure(e1);
             }
         }
     });
 }

这里走 innerExecute(request, listener);

/**
 * Runs the index request through the superclass {@code doExecute}, bypassing the
 * auto-create handling of this class's own {@code doExecute}.
 */
private void innerExecute(final IndexRequest request, final ActionListener<IndexResponse> listener) {

    super.doExecute(request, listener);

}

这里的super就是TransportShardReplicationOperationAction了,TransportShardReplicationOperationAction中doExecute的实现

/**
 * Creates an {@code AsyncShardOperationAction} for the request and listener and starts it.
 */
protected void doExecute(Request request, ActionListener<Response> listener) {

    new AsyncShardOperationAction(request, listener).start();

}

主要两个方法，一个是获取shard,另一个是shardOperationOnPrimary;

其中shard后边再说,shardOperationOnPrimary在TransportIndexAction实现

/**
 * Performs the index (or create) operation on the primary shard.
 *
 * <p>Steps, in order: verify that a routing value is present when the type's mapping requires
 * one; resolve the index service and shard; build the source to parse; run either the index or
 * the create operation (notifying the master if the parsed document modified the mappings);
 * optionally refresh the shard; then stamp the resulting version onto the request so the
 * replicas use it.
 *
 * @param clusterState cluster state used to look up the index metadata and mapping
 * @param shardRequest wrapper carrying the index request and the target shard id
 * @return the primary response holding the request, the {@code IndexResponse} and the engine operation
 * @throws RoutingMissingException if the mapping requires routing and the request has none
 */
protected PrimaryResponse<IndexResponse, IndexRequest> shardOperationOnPrimary(ClusterState clusterState, PrimaryOperationRequest shardRequest) {

    final IndexRequest request = shardRequest.request;

    // validate, if routing is required, that we got routing

    IndexMetaData indexMetaData = clusterState.metaData().index(request.index());

    MappingMetaData mappingMd = indexMetaData.mappingOrDefault(request.type());

    if (mappingMd != null && mappingMd.routing().required()) {

        if (request.routing() == null) {

            throw new RoutingMissingException(request.index(), request.type(), request.id());

        }

    }

    IndexService indexService = indicesService.indexServiceSafe(shardRequest.request.index());

    IndexShard indexShard = indexService.shardSafe(shardRequest.shardId);

    // Describe the document to parse: raw source plus type, id, routing, parent, timestamp and ttl,
    // marked as originating on the primary.
    SourceToParse sourceToParse = SourceToParse.source(SourceToParse.Origin.PRIMARY, request.source()).type(request.type()).id(request.id())

            .routing(request.routing()).parent(request.parent()).timestamp(request.timestamp()).ttl(request.ttl());

    long version;

    boolean created;

    Engine.IndexingOperation op;

    if (request.opType() == IndexRequest.OpType.INDEX) {

        // INDEX op type: prepare the operation, index it, then read back version and created flag.
        Engine.Index index = indexShard.prepareIndex(sourceToParse, request.version(), request.versionType(), Engine.Operation.Origin.PRIMARY, request.canHaveDuplicates());

        if (index.parsedDoc().mappingsModified()) {

            // Parsing changed the mappings: send the updated mapper to the master.
            mappingUpdatedAction.updateMappingOnMaster(request.index(), index.docMapper(), indexService.indexUUID());

        }

        indexShard.index(index);

        version = index.version();

        op = index;

        created = index.created();

    } else {

        // Any other op type is handled as a create; "created" is always true on this path.
        Engine.Create create = indexShard.prepareCreate(sourceToParse,

                request.version(), request.versionType(), Engine.Operation.Origin.PRIMARY, request.canHaveDuplicates(), request.autoGeneratedId());

        if (create.parsedDoc().mappingsModified()) {

            mappingUpdatedAction.updateMappingOnMaster(request.index(), create.docMapper(), indexService.indexUUID());

        }

        indexShard.create(create);

        version = create.version();

        op = create;

        created = true;

    }

    if (request.refresh()) {

        // Refresh requested by the caller; a failing refresh is deliberately swallowed and does
        // not fail the operation.
        try {

            indexShard.refresh(new Engine.Refresh("refresh_flag_index").force(false));

        } catch (Throwable e) {

            // ignore

        }

    }

    // update the version on the request, so it will be used for the replicas

    request.version(version);

    request.versionType(request.versionType().versionTypeForReplicationAndRecovery());

    assert request.versionType().validateVersionForWrites(request.version());

    IndexResponse response = new IndexResponse(request.index(), request.type(), request.id(), version, created);

    return new PrimaryResponse<>(shardRequest.request, response, op);

}

这里走request.opType() == IndexRequest.OpType.INDEX分支，主要是indexShard.prepareIndex和indexShard.index(index)。这里的IndexShard是InternalIndexShard，其index方法的实现如下

/**
 * Indexes the given operation on this shard.
 *
 * <p>Checks that writes are allowed for the operation's origin, runs the pre-index hook (which
 * may replace the operation), delegates to the engine, and runs the post-index hook. If the
 * engine throws a {@code RuntimeException}, the failure hook is invoked and the exception is
 * rethrown unchanged.
 *
 * @param index the prepared index operation
 * @return the parsed document of the (possibly replaced) operation
 */
public ParsedDocument index(Engine.Index index) throws ElasticsearchException {

    writeAllowed(index.origin());

    // The pre-index hook returns the operation to continue with.
    index = indexingService.preIndex(index);

    try {

        if (logger.isTraceEnabled()) {

            logger.trace("index [{}][{}]{}", index.type(), index.id(), index.docs());

        }

        engine.index(index);

        // Record the end time only after the engine call returned normally.
        index.endTime(System.nanoTime());

    } catch (RuntimeException ex) {

        indexingService.failedIndex(index);

        throw ex;

    }

    indexingService.postIndex(index);

    return index.parsedDoc();

}

indexingService对应ShardIndexingService, engine是InternalEngine，InternalEngine的index()

/**
 * Indexes the operation through the current {@code IndexWriter}.
 *
 * <p>The work happens while holding the read lock, with {@code innerIndex} additionally
 * running inside the throttle. After a successful write the dirty, possible-merge and
 * flush-needed flags are set. {@code OutOfMemoryError}, {@code IllegalStateException} and
 * {@code IOException} are passed to {@code maybeFailEngine} and rethrown wrapped in an
 * {@code IndexFailedEngineException}.
 *
 * @param index the index operation to apply
 * @throws EngineException if the operation fails
 */
public void index(Index index) throws EngineException {

    final IndexWriter writer;

    try (InternalLock _ = readLock.acquire()) {

        writer = currentIndexWriter();

        // The throttle is released as soon as innerIndex returns; the read lock is held until
        // the flags below are set.
        try (Releasable r = throttle.acquireThrottle()) {

            innerIndex(index, writer);

        }

        dirty = true;

        possibleMergeNeeded = true;

        flushNeeded = true;

    } catch (OutOfMemoryError | IllegalStateException | IOException t) {

        maybeFailEngine(t, "index");

        throw new IndexFailedEngineException(shardId, index, t);

    }

    // Runs outside the read lock, only when the write succeeded.
    checkVersionMapRefresh();

}

最终在InternalEngine的innerIndex方法中调用Lucene的IndexWriter：依据文档当前是否已有版本（即currentVersion是否为Versions.NOT_FOUND），通过writer.addDocument(s)或者writer.updateDocument(s)方法添加或者更新索引

添加add索引

// Add path: use the single-document call unless the operation carries more than one document.
if (index.docs().size() <= 1) {
    writer.addDocument(index.docs().get(0), index.analyzer());
} else {
    writer.addDocuments(index.docs(), index.analyzer());
}

更新update索引

// Update path: replace by uid, using the single-document call unless the operation carries
// more than one document.
if (index.docs().size() <= 1) {
    writer.updateDocument(index.uid(), index.docs().get(0), index.analyzer());
} else {
    writer.updateDocuments(index.uid(), index.docs(), index.analyzer());
}

最后Translog

// Append the index operation to the translog and keep the location it returns.
Translog.Location translogLocation = translog.add(new Translog.Index(index));

具体代码

/**
 * Applies a single index operation to the writer, with version checking.
 *
 * <p>All work is done while synchronized on the lock object returned by
 * {@code dirtyLock(index.uid())}. The current version is resolved (from the version map, or
 * loaded from the index when the map has no entry), checked for a conflict against the
 * operation's version, and the new version is computed and stored on the operation. The
 * document is then added (no current version) or updated (existing version), the operation is
 * appended to the translog, and the version map is updated with the new version and translog
 * location.
 *
 * @param index  the index operation to apply
 * @param writer the writer that receives the document(s)
 * @throws IOException declared by this method; presumably raised by the writer calls (TODO confirm)
 * @throws VersionConflictEngineException on a version conflict, unless the operation's origin is RECOVERY
 */
private void innerIndex(Index index, IndexWriter writer) throws IOException {

    synchronized (dirtyLock(index.uid())) {

        final long currentVersion;

        VersionValue versionValue = versionMap.getUnderLock(index.uid().bytes());

        if (versionValue == null) {

            // Nothing in the version map for this uid: fall back to the index.
            currentVersion = loadCurrentVersionFromIndex(index.uid());

        } else {

            // A delete entry older than gcDeletesInMillis (with GC of deletes enabled) is treated
            // as if the document was never there.
            if (enableGcDeletes && versionValue.delete() && (threadPool.estimatedTimeInMillis() - versionValue.time()) > gcDeletesInMillis) {

                currentVersion = Versions.NOT_FOUND; // deleted, and GC

            } else {

                currentVersion = versionValue.version();

            }

        }

        long updatedVersion;

        long expectedVersion = index.version();

        if (index.versionType().isVersionConflictForWrites(currentVersion, expectedVersion)) {

            // On conflict, operations with RECOVERY origin are skipped silently; anything else fails.
            if (index.origin() == Operation.Origin.RECOVERY) {

                return;

            } else {

                throw new VersionConflictEngineException(shardId, index.type(), index.id(), currentVersion, expectedVersion);

            }

        }

        updatedVersion = index.versionType().updateVersion(currentVersion, expectedVersion);

        index.updateVersion(updatedVersion);

        if (currentVersion == Versions.NOT_FOUND) {

            // document does not exists, we can optimize for create

            index.created(true);

            if (index.docs().size() > 1) {

                writer.addDocuments(index.docs(), index.analyzer());

            } else {

                writer.addDocument(index.docs().get(0), index.analyzer());

            }

        } else {

            // A current version exists: "created" is only set when the version map entry is a
            // delete; with no map entry the flag is left untouched.
            if (versionValue != null) {

                index.created(versionValue.delete()); // we have a delete which is not GC'ed...

            }

            if (index.docs().size() > 1) {

                writer.updateDocuments(index.uid(), index.docs(), index.analyzer());

            } else {

                writer.updateDocument(index.uid(), index.docs().get(0), index.analyzer());

            }

        }

        // Record the operation in the translog, then publish the new version together with its
        // translog location in the version map.
        Translog.Location translogLocation = translog.add(new Translog.Index(index));

        versionMap.putUnderLock(index.uid().bytes(), new VersionValue(updatedVersion, translogLocation));

        indexingService.postIndexUnderLock(index);

    }

}

link

分布式搜索Elasticsearch源码分析之二------索引过程源码概要分析

elasticsearch-1.3.0 之索引代码粗略梳理的更多相关文章

Elasticsearch 7.4.0官方文档操作
官方文档地址 https://www.elastic.co/guide/en/elasticsearch/reference/current/index.html 1.0.0 设置Elasticsea ...
Linux下,非Docker启动Elasticsearch 6.3.0,安装ik分词器插件,以及使用Kibana测试Elasticsearch,
Linux下,非Docker启动Elasticsearch 6.3.0 查看java版本,需要1.8版本 java -version yum -y install java 创建用户,因为elasti ...
ElasticSearch基本操作（安装，索引的创建和删除，映射）
ElasticSearch基于Lucene的搜索服务器,支持分布式,提供REST接口,可用于云计算,可以实现实时搜索,开源免费.这时很官方的一句话,在使用之前,我们简单的介绍一下安装过程.在官网下载之 ...
Elasticsearch－基础介绍及索引原理分析（转载）
最近在参与一个基于Elasticsearch作为底层数据框架提供大数据量(亿级)的实时统计查询的方案设计工作,花了些时间学习Elasticsearch的基础理论知识,整理了一下,希望能对Elastic ...
Elasticsearch－基础介绍及索引原理分析
介绍 Elasticsearch 是一个分布式可扩展的实时搜索和分析引擎,一个建立在全文搜索引擎 Apache Lucene(TM) 基础上的搜索引擎.当然 Elasticsearch 并不仅仅是 L ...
elasticsearch简介和倒排序索引介绍
介绍我们为什么要用搜索引擎?我们的所有数据在数据库里面都有,而且 Oracle.SQL Server 等数据库里也能提供查询检索或者聚类分析功能,直接通过数据库查询不就可以了吗?确实,我们大部分的查 ...
lucene&solr学习——创建和查询索引(代码篇)
1. Lucene的下载 Lucene是开发全文检索功能的工具包,从官网下载Lucene4.10.3并解压. 官网:http://lucene.apache.org/ 版本:lucene7.7.0 ( ...
【拆分版】Docker-compose构建Elasticsearch 7.1.0集群
写在前边搞了两三天了,一直有个问题困扰着我,ES集群中配置怎么能正确映射到主机上,这边经常报ClusterFormationFailureHelper master not discovered o ...
elasticsearch——海量文档高性能索引系统
elasticsearch elasticsearch是一个高性能高扩展性的索引系统,底层基于apache lucene. 可结合kibana工具进行可视化. 概念: index 索引: 类似SQL中 ...

随机推荐

Stm32F107VCT6硬件资源
一直在用stm32系列的单片机,最近因为需要使用到以太网,所以采用了stm32f107vc这款芯片.对于存储资源一直不是非常清楚,今天专门到官网看了一下. 如下: RAM------>64kB ...
转载：Centos7 从零编译配置Memcached
序言 Memcached 是一个高性能的分布式内存对象缓存系统,用于动态Web应用以减轻数据库负载.它通过在内存中缓存数据和对象来减少读取数据库的次数,从而提高动态.数据库驱动网站的速度. Memca ...
jvm--3.内存管理
5.JVM内存管理 JAVA虚拟机在执行java程序的过程中,会把它管理的内存分成若干个不同的数据区域. ----------------------------------------------- ...
python爬虫小项目实战
[Python] from scipy import sparse 报 DLL load failed：找不到指定模块错误
依赖vc运行环境.需要安装 vc_redist Py3.5要安装2015版传送门: https://www.microsoft.com/zh-CN/download/details.aspx?id= ...
js array push 添加内容
向数组中添加内容: var array = new Array(); array.push('newItem');
ROW_NUMBER()与PARTITION BY 实例
环境:SQL Server 2008 R2 数据表结构 SELECT A.* FROM [tbiz_AssScoreWeidu] A SELECT A.* ,ROW_NUMBER() OVER ( P ...
Solr使用入门指南
本文转自http://chuanliang2007.spaces.live.com/blog/cns!E5B7AB2851A4C9D2!499.entry?wa=wsignin1.0 由于搜索引擎功能 ...
tomcat7 IP限制配置
server.xml </Host>前添加<Valve className="org.apache.catalina.valves.RemoteAddrValve&quo ...
Windows 网络通讯开发
Windows 网络通讯开发一.Windows网络开发API 由于C++标准库中没有网络库,所以进行网络开发的时候要调用系统API.Windows通讯开发API包括以下几个基本函数及成员类型: 1. ...

elasticsearch-1.3.0 之索引代码粗略梳理

elasticsearch-1.3.0

elasticsearch-1.3.0 之索引代码粗略梳理的更多相关文章

随机推荐

热门专题