mirror of
https://github.com/minio/minio.git
synced 2025-01-14 16:25:01 -05:00
573 lines
15 KiB
Go
573 lines
15 KiB
Go
|
// Copyright 2012-present Oliver Eilhard. All rights reserved.
|
||
|
// Use of this source code is governed by a MIT-license.
|
||
|
// See http://olivere.mit-license.org/license.txt for details.
|
||
|
|
||
|
package elastic
|
||
|
|
||
|
import (
|
||
|
"fmt"
|
||
|
"net/url"
|
||
|
)
|
||
|
|
||
|
// ReindexService is a method to copy documents from one index to another.
|
||
|
// It was introduced in Elasticsearch 2.3.0.
|
||
|
//
|
||
|
// Notice that Elastic already had a Reindexer service that pre-dated
|
||
|
// the Reindex API. Use that if you're on an earlier version of Elasticsearch.
|
||
|
//
|
||
|
// It is documented at https://www.elastic.co/guide/en/elasticsearch/plugins/master/plugins-reindex.html.
|
||
|
type ReindexService struct {
|
||
|
client *Client
|
||
|
pretty bool
|
||
|
consistency string
|
||
|
refresh *bool
|
||
|
timeout string
|
||
|
waitForCompletion *bool
|
||
|
bodyJson interface{}
|
||
|
bodyString string
|
||
|
source *ReindexSource
|
||
|
destination *ReindexDestination
|
||
|
conflicts string
|
||
|
size *int
|
||
|
script *Script
|
||
|
}
|
||
|
|
||
|
// NewReindexService creates a new ReindexService.
|
||
|
func NewReindexService(client *Client) *ReindexService {
|
||
|
return &ReindexService{
|
||
|
client: client,
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// Consistency specifies an explicit write consistency setting for the operation.
|
||
|
func (s *ReindexService) Consistency(consistency string) *ReindexService {
|
||
|
s.consistency = consistency
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// Refresh indicates whether Elasticsearch should refresh the effected indexes
|
||
|
// immediately.
|
||
|
func (s *ReindexService) Refresh(refresh bool) *ReindexService {
|
||
|
s.refresh = &refresh
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// Timeout is the time each individual bulk request should wait for shards
|
||
|
// that are unavailable.
|
||
|
func (s *ReindexService) Timeout(timeout string) *ReindexService {
|
||
|
s.timeout = timeout
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// WaitForCompletion indicates whether Elasticsearch should block until the
|
||
|
// reindex is complete.
|
||
|
func (s *ReindexService) WaitForCompletion(waitForCompletion bool) *ReindexService {
|
||
|
s.waitForCompletion = &waitForCompletion
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// Pretty indicates that the JSON response be indented and human readable.
|
||
|
func (s *ReindexService) Pretty(pretty bool) *ReindexService {
|
||
|
s.pretty = pretty
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// Source specifies the source of the reindexing process.
|
||
|
func (s *ReindexService) Source(source *ReindexSource) *ReindexService {
|
||
|
s.source = source
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// SourceIndex specifies the source index of the reindexing process.
|
||
|
func (s *ReindexService) SourceIndex(index string) *ReindexService {
|
||
|
if s.source == nil {
|
||
|
s.source = NewReindexSource()
|
||
|
}
|
||
|
s.source = s.source.Index(index)
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// Destination specifies the destination of the reindexing process.
|
||
|
func (s *ReindexService) Destination(destination *ReindexDestination) *ReindexService {
|
||
|
s.destination = destination
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// DestinationIndex specifies the destination index of the reindexing process.
|
||
|
func (s *ReindexService) DestinationIndex(index string) *ReindexService {
|
||
|
if s.destination == nil {
|
||
|
s.destination = NewReindexDestination()
|
||
|
}
|
||
|
s.destination = s.destination.Index(index)
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// DestinationIndexAndType specifies both the destination index and type
|
||
|
// of the reindexing process.
|
||
|
func (s *ReindexService) DestinationIndexAndType(index, typ string) *ReindexService {
|
||
|
if s.destination == nil {
|
||
|
s.destination = NewReindexDestination()
|
||
|
}
|
||
|
s.destination = s.destination.Index(index)
|
||
|
s.destination = s.destination.Type(typ)
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// Conflicts indicates what to do when the process detects version conflicts.
|
||
|
// Possible values are "proceed" and "abort".
|
||
|
func (s *ReindexService) Conflicts(conflicts string) *ReindexService {
|
||
|
s.conflicts = conflicts
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// AbortOnVersionConflict aborts the request on version conflicts.
|
||
|
// It is an alias to setting Conflicts("abort").
|
||
|
func (s *ReindexService) AbortOnVersionConflict() *ReindexService {
|
||
|
s.conflicts = "abort"
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// ProceedOnVersionConflict aborts the request on version conflicts.
|
||
|
// It is an alias to setting Conflicts("proceed").
|
||
|
func (s *ReindexService) ProceedOnVersionConflict() *ReindexService {
|
||
|
s.conflicts = "proceed"
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// Size sets an upper limit for the number of processed documents.
|
||
|
func (s *ReindexService) Size(size int) *ReindexService {
|
||
|
s.size = &size
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// Script allows for modification of the documents as they are reindexed
|
||
|
// from source to destination.
|
||
|
func (s *ReindexService) Script(script *Script) *ReindexService {
|
||
|
s.script = script
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// BodyJson specifies e.g. the query to restrict the results specified with the
|
||
|
// Query DSL (optional). The interface{} will be serialized to a JSON document,
|
||
|
// so use a map[string]interface{}.
|
||
|
func (s *ReindexService) BodyJson(body interface{}) *ReindexService {
|
||
|
s.bodyJson = body
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// Body specifies e.g. a query to restrict the results specified with
|
||
|
// the Query DSL (optional).
|
||
|
func (s *ReindexService) BodyString(body string) *ReindexService {
|
||
|
s.bodyString = body
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// buildURL builds the URL for the operation.
|
||
|
func (s *ReindexService) buildURL() (string, url.Values, error) {
|
||
|
// Build URL path
|
||
|
path := "/_reindex"
|
||
|
|
||
|
// Add query string parameters
|
||
|
params := url.Values{}
|
||
|
if s.pretty {
|
||
|
params.Set("pretty", "1")
|
||
|
}
|
||
|
if s.consistency != "" {
|
||
|
params.Set("consistency", s.consistency)
|
||
|
}
|
||
|
if s.refresh != nil {
|
||
|
params.Set("refresh", fmt.Sprintf("%v", *s.refresh))
|
||
|
}
|
||
|
if s.timeout != "" {
|
||
|
params.Set("timeout", s.timeout)
|
||
|
}
|
||
|
if s.waitForCompletion != nil {
|
||
|
params.Set("wait_for_completion", fmt.Sprintf("%v", *s.waitForCompletion))
|
||
|
}
|
||
|
return path, params, nil
|
||
|
}
|
||
|
|
||
|
// Validate checks if the operation is valid.
|
||
|
func (s *ReindexService) Validate() error {
|
||
|
var invalid []string
|
||
|
if s.source == nil {
|
||
|
invalid = append(invalid, "Source")
|
||
|
} else {
|
||
|
if len(s.source.indices) == 0 {
|
||
|
invalid = append(invalid, "Source.Index")
|
||
|
}
|
||
|
}
|
||
|
if s.destination == nil {
|
||
|
invalid = append(invalid, "Destination")
|
||
|
}
|
||
|
if len(invalid) > 0 {
|
||
|
return fmt.Errorf("missing required fields: %v", invalid)
|
||
|
}
|
||
|
return nil
|
||
|
}
|
||
|
|
||
|
// body returns the body part of the document request.
|
||
|
func (s *ReindexService) body() (interface{}, error) {
|
||
|
if s.bodyJson != nil {
|
||
|
return s.bodyJson, nil
|
||
|
}
|
||
|
if s.bodyString != "" {
|
||
|
return s.bodyString, nil
|
||
|
}
|
||
|
|
||
|
body := make(map[string]interface{})
|
||
|
|
||
|
if s.conflicts != "" {
|
||
|
body["conflicts"] = s.conflicts
|
||
|
}
|
||
|
if s.size != nil {
|
||
|
body["size"] = *s.size
|
||
|
}
|
||
|
if s.script != nil {
|
||
|
out, err := s.script.Source()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
body["script"] = out
|
||
|
}
|
||
|
|
||
|
src, err := s.source.Source()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
body["source"] = src
|
||
|
|
||
|
dst, err := s.destination.Source()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
body["dest"] = dst
|
||
|
|
||
|
return body, nil
|
||
|
}
|
||
|
|
||
|
// Do executes the operation.
|
||
|
func (s *ReindexService) Do() (*ReindexResponse, error) {
|
||
|
// Check pre-conditions
|
||
|
if err := s.Validate(); err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
|
||
|
// Get URL for request
|
||
|
path, params, err := s.buildURL()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
|
||
|
// Setup HTTP request body
|
||
|
body, err := s.body()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
|
||
|
// Get HTTP response
|
||
|
res, err := s.client.PerformRequest("POST", path, params, body)
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
|
||
|
// Return operation response
|
||
|
ret := new(ReindexResponse)
|
||
|
if err := s.client.decoder.Decode(res.Body, ret); err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
return ret, nil
|
||
|
}
|
||
|
|
||
|
// ReindexResponse is the response of ReindexService.Do.
|
||
|
type ReindexResponse struct {
|
||
|
Took interface{} `json:"took"` // 2.3.0 returns "37.7ms" while 2.2 returns 38 for took
|
||
|
TimedOut bool `json:"timed_out"`
|
||
|
Total int64 `json:"total"`
|
||
|
Updated int64 `json:"updated"`
|
||
|
Created int64 `json:"created"`
|
||
|
Deleted int64 `json:"deleted"`
|
||
|
Batches int64 `json:"batches"`
|
||
|
VersionConflicts int64 `json:"version_conflicts"`
|
||
|
Noops int64 `json:"noops"`
|
||
|
Retries int64 `json:"retries"`
|
||
|
Canceled string `json:"canceled"`
|
||
|
Failures []shardOperationFailure `json:"failures"`
|
||
|
}
|
||
|
|
||
|
// -- Source of Reindex --
|
||
|
|
||
|
// ReindexSource specifies the source of a Reindex process.
|
||
|
type ReindexSource struct {
|
||
|
searchType string // default in ES is "query_then_fetch"
|
||
|
indices []string
|
||
|
types []string
|
||
|
routing *string
|
||
|
preference *string
|
||
|
requestCache *bool
|
||
|
scroll string
|
||
|
query Query
|
||
|
sorts []SortInfo
|
||
|
sorters []Sorter
|
||
|
searchSource *SearchSource
|
||
|
}
|
||
|
|
||
|
// NewReindexSource creates a new ReindexSource.
|
||
|
func NewReindexSource() *ReindexSource {
|
||
|
return &ReindexSource{
|
||
|
indices: make([]string, 0),
|
||
|
types: make([]string, 0),
|
||
|
sorts: make([]SortInfo, 0),
|
||
|
sorters: make([]Sorter, 0),
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// SearchType is the search operation type. Possible values are
|
||
|
// "query_then_fetch" and "dfs_query_then_fetch".
|
||
|
func (r *ReindexSource) SearchType(searchType string) *ReindexSource {
|
||
|
r.searchType = searchType
|
||
|
return r
|
||
|
}
|
||
|
|
||
|
func (r *ReindexSource) SearchTypeDfsQueryThenFetch() *ReindexSource {
|
||
|
return r.SearchType("dfs_query_then_fetch")
|
||
|
}
|
||
|
|
||
|
func (r *ReindexSource) SearchTypeQueryThenFetch() *ReindexSource {
|
||
|
return r.SearchType("query_then_fetch")
|
||
|
}
|
||
|
|
||
|
func (r *ReindexSource) Index(indices ...string) *ReindexSource {
|
||
|
r.indices = append(r.indices, indices...)
|
||
|
return r
|
||
|
}
|
||
|
|
||
|
func (r *ReindexSource) Type(types ...string) *ReindexSource {
|
||
|
r.types = append(r.types, types...)
|
||
|
return r
|
||
|
}
|
||
|
|
||
|
func (r *ReindexSource) Preference(preference string) *ReindexSource {
|
||
|
r.preference = &preference
|
||
|
return r
|
||
|
}
|
||
|
|
||
|
func (r *ReindexSource) RequestCache(requestCache bool) *ReindexSource {
|
||
|
r.requestCache = &requestCache
|
||
|
return r
|
||
|
}
|
||
|
|
||
|
func (r *ReindexSource) Scroll(scroll string) *ReindexSource {
|
||
|
r.scroll = scroll
|
||
|
return r
|
||
|
}
|
||
|
|
||
|
func (r *ReindexSource) Query(query Query) *ReindexSource {
|
||
|
r.query = query
|
||
|
return r
|
||
|
}
|
||
|
|
||
|
// Sort adds a sort order.
|
||
|
func (s *ReindexSource) Sort(field string, ascending bool) *ReindexSource {
|
||
|
s.sorts = append(s.sorts, SortInfo{Field: field, Ascending: ascending})
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// SortWithInfo adds a sort order.
|
||
|
func (s *ReindexSource) SortWithInfo(info SortInfo) *ReindexSource {
|
||
|
s.sorts = append(s.sorts, info)
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// SortBy adds a sort order.
|
||
|
func (s *ReindexSource) SortBy(sorter ...Sorter) *ReindexSource {
|
||
|
s.sorters = append(s.sorters, sorter...)
|
||
|
return s
|
||
|
}
|
||
|
|
||
|
// Source returns a serializable JSON request for the request.
|
||
|
func (r *ReindexSource) Source() (interface{}, error) {
|
||
|
source := make(map[string]interface{})
|
||
|
|
||
|
if r.query != nil {
|
||
|
src, err := r.query.Source()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
source["query"] = src
|
||
|
} else if r.searchSource != nil {
|
||
|
src, err := r.searchSource.Source()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
source["source"] = src
|
||
|
}
|
||
|
|
||
|
if r.searchType != "" {
|
||
|
source["search_type"] = r.searchType
|
||
|
}
|
||
|
|
||
|
switch len(r.indices) {
|
||
|
case 0:
|
||
|
case 1:
|
||
|
source["index"] = r.indices[0]
|
||
|
default:
|
||
|
source["index"] = r.indices
|
||
|
}
|
||
|
|
||
|
switch len(r.types) {
|
||
|
case 0:
|
||
|
case 1:
|
||
|
source["type"] = r.types[0]
|
||
|
default:
|
||
|
source["type"] = r.types
|
||
|
}
|
||
|
|
||
|
if r.preference != nil && *r.preference != "" {
|
||
|
source["preference"] = *r.preference
|
||
|
}
|
||
|
|
||
|
if r.requestCache != nil {
|
||
|
source["request_cache"] = fmt.Sprintf("%v", *r.requestCache)
|
||
|
}
|
||
|
|
||
|
if r.scroll != "" {
|
||
|
source["scroll"] = r.scroll
|
||
|
}
|
||
|
|
||
|
if len(r.sorters) > 0 {
|
||
|
sortarr := make([]interface{}, 0)
|
||
|
for _, sorter := range r.sorters {
|
||
|
src, err := sorter.Source()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
sortarr = append(sortarr, src)
|
||
|
}
|
||
|
source["sort"] = sortarr
|
||
|
} else if len(r.sorts) > 0 {
|
||
|
sortarr := make([]interface{}, 0)
|
||
|
for _, sort := range r.sorts {
|
||
|
src, err := sort.Source()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
sortarr = append(sortarr, src)
|
||
|
}
|
||
|
source["sort"] = sortarr
|
||
|
}
|
||
|
|
||
|
return source, nil
|
||
|
}
|
||
|
|
||
|
// -- Destination of Reindex --
|
||
|
|
||
|
// ReindexDestination is the destination of a Reindex API call.
// It is basically the meta data of a BulkIndexRequest.
//
// See https://www.elastic.co/guide/en/elasticsearch/reference/2.3/docs-reindex.html
// for details.
type ReindexDestination struct {
	index   string
	typ     string
	routing string
	parent  string
	opType  string

	version     int64  // default is MATCH_ANY
	versionType string // default is "internal"
}

// NewReindexDestination returns a new ReindexDestination with no settings
// applied.
func NewReindexDestination() *ReindexDestination {
	return new(ReindexDestination)
}

// Index sets the name of the Elasticsearch index to use as the destination
// of a reindexing process.
func (r *ReindexDestination) Index(index string) *ReindexDestination {
	r.index = index
	return r
}

// Type sets the Elasticsearch type to use for reindexing.
func (r *ReindexDestination) Type(typ string) *ReindexDestination {
	r.typ = typ
	return r
}

// Routing sets a routing value for the reindexing request.
// It can be "keep", "discard", or start with "=". The latter specifies
// the routing on the bulk request.
func (r *ReindexDestination) Routing(routing string) *ReindexDestination {
	r.routing = routing
	return r
}

// Keep sets the routing on the bulk request sent for each match to the
// routing of the match (the default). It is shorthand for Routing("keep").
func (r *ReindexDestination) Keep() *ReindexDestination {
	return r.Routing("keep")
}

// Discard sets the routing on the bulk request sent for each match to
// null. It is shorthand for Routing("discard").
func (r *ReindexDestination) Discard() *ReindexDestination {
	return r.Routing("discard")
}

// Parent sets the identifier of the parent document (if available).
func (r *ReindexDestination) Parent(parent string) *ReindexDestination {
	r.parent = parent
	return r
}

// OpType sets whether this request should follow create-only or upsert
// behavior. This follows the OpType of the standard document index API.
// See https://www.elastic.co/guide/en/elasticsearch/reference/current/docs-index_.html#operation-type
// for details.
func (r *ReindexDestination) OpType(opType string) *ReindexDestination {
	r.opType = opType
	return r
}

// Version sets the version of the document as part of an optimistic
// concurrency model. Only values greater than zero are serialized.
func (r *ReindexDestination) Version(version int64) *ReindexDestination {
	r.version = version
	return r
}

// VersionType sets how versions are created.
func (r *ReindexDestination) VersionType(versionType string) *ReindexDestination {
	r.versionType = versionType
	return r
}

// Source returns a serializable JSON representation of the destination as
// a map[string]interface{}. String settings are written only when
// non-empty and the version only when greater than zero. The returned
// error is always nil.
func (r *ReindexDestination) Source() (interface{}, error) {
	out := make(map[string]interface{})

	// All string settings follow the same "omit when empty" rule.
	stringFields := []struct{ key, value string }{
		{"index", r.index},
		{"type", r.typ},
		{"routing", r.routing},
		{"op_type", r.opType},
		{"parent", r.parent},
		{"version_type", r.versionType},
	}
	for _, f := range stringFields {
		if f.value != "" {
			out[f.key] = f.value
		}
	}

	if r.version > 0 {
		out["version"] = r.version
	}
	return out, nil
}
|