feat: migration with bulk skip exit docs

This commit is contained in:
hardy 2024-01-31 14:13:26 +08:00 committed by hardy
parent dc562c0d74
commit 50f12de6a8
2 changed files with 15 additions and 12 deletions

View File

@ -129,11 +129,12 @@ func (p *processor) handleSplitSubTask(taskItem *task.Task) error {
Processor: []util.MapStr{
{
"es_scroll": util.MapStr{
"remove_type": docType == "",
"slice_size": cfg.Source.SliceSize,
"batch_size": cfg.Source.BatchSize,
"indices": indexName,
"elasticsearch": sourceClusterID,
"remove_type": docType == "",
"slice_size": cfg.Source.SliceSize,
"batch_size": cfg.Source.BatchSize,
"indices": indexName,
"elasticsearch": sourceClusterID,
"skip_exist_documents": cfg.Target.Bulk.SkipExistDocuments,
"queue": util.MapStr{
"name": scrollID,
"labels": util.MapStr{
@ -186,10 +187,11 @@ func (p *processor) handleSplitSubTask(taskItem *task.Task) error {
"bulk_indexing": util.MapStr{
"detect_active_queue": false,
"bulk": util.MapStr{
"batch_size_in_mb": cfg.Target.Bulk.BatchSizeInMB,
"batch_size_in_docs": cfg.Target.Bulk.BatchSizeInDocs,
"invalid_queue": "bulk_indexing_400",
"compress": cfg.Target.Bulk.Compress,
"batch_size_in_mb": cfg.Target.Bulk.BatchSizeInMB,
"batch_size_in_docs": cfg.Target.Bulk.BatchSizeInDocs,
"invalid_queue": "bulk_indexing_400",
"compress": cfg.Target.Bulk.Compress,
"skip_exist_documents": cfg.Target.Bulk.SkipExistDocuments,
},
"max_worker_size": cfg.Target.Bulk.MaxWorkerSize,
"num_of_slices": cfg.Target.Bulk.SliceSize,

View File

@ -9,8 +9,8 @@ import (
)
type ClusterMigrationTaskConfig struct {
Name string `json:"name"`
Tags []string `json:"tags"`
Name string `json:"name"`
Tags []string `json:"tags"`
Cluster struct {
Source ClusterInfo `json:"source"`
Target ClusterInfo `json:"target"`
@ -42,7 +42,7 @@ type ClusterMigrationIndexConfig struct {
Percent float64 `json:"percent,omitempty"`
ErrorPartitions int `json:"error_partitions,omitempty"`
RunningChildren int `json:"running_children,omitempty"`
ExportedPercent float64 `json:"exported_percent,omitempty"`
ExportedPercent float64 `json:"exported_percent,omitempty"`
}
type ClusterMigrationTaskState struct {
@ -92,6 +92,7 @@ type IndexMigrationBulkConfig struct {
IdleTimeoutInSeconds int `json:"idle_timeout_in_seconds"`
SliceSize int `json:"slice_size"`
Compress bool `json:"compress"`
SkipExistDocuments bool `json:"skip_exist_documents"`
}
type IndexMigrationTargetConfig struct {