我有一个包含6个数据节点和3个主节点的 Elasticsearch 集群。
执行快照时,我收到错误“process_cluster_event_timeout_exception”。
我在集群的“/_cat/pending_tasks”中查看,发现有69个优先级为 HIGH、来源(source)为 put-mapping 的任务。
我的集群用于集中式日志,并通过以下进程将数据写入集群:
logstash-从redis收集并放入elasticsearch
apm-server
filebeat
beats(其他 Beats 采集器)
我一直在从apm服务器上删除beats和一些应用程序
是否可以将创建快照任务的优先级从 NORMAL 更改为 HIGH 或 URGENT?
如果这不是一个可行的解决方案,那么该如何确定我的集群的合适规模?
- 通常我只在集群中保留7天的索引,因为有备份。但由于这个错误,我已经停用了删除旧数据的进程。
GET _cat/nodes?v&s=node.role:desc
ip heap.percent ram.percent cpu load_1m load_5m load_15m node.role master name
(注:此表在提取时严重损坏,ip / heap.percent / ram.percent / cpu 各列的数字已粘连,无法可靠拆分;以下仅按可辨认的边界保留原始片段。)
主节点(node.role 为 m,共3行,仅可辨认出一行的片段):10.0.2.8475000.00 0.00 0.00 m … prd-elasticsearch-…
数据节点(node.role 为 d):
… .89 d - prd-elasticsearch-i-0ff
10.0.0.66797258.97 10.45 10.47 d - prd-elasticsearch-i-01a
10.0.0.957983211.63 9.64 9.17 d - prd-elasticsearch-i-005
10.0.1.062961910.45 9.53 9.31 d - prd-elasticsearch-i-088
我的群集定义:
{
"_nodes": {
"total": 9,
"successful": 9,
"failed": 0
},
"cluster_name": "prd-elasticsearch",
"cluster_uuid": "xxxx",
"timestamp": 1607609607018,
"status": "green",
"indices": {
"count": 895,
"shards": {
"total": 14006,
"primaries": 4700,
"replication": 1.98,
"index": {
"shards": {
"min": 2,
"max": 18,
"avg": 15.649162011173184
},
"primaries": {
"min": 1,
"max": 6,
"avg": 5.251396648044692
},
"replication": {
"min": 1,
"max": 2,
"avg": 1.9787709497206705
}
}
},
"docs": {
"count": 14896803950,
"deleted": 843126
},
"store": {
"size_in_bytes": 16778620001453
},
"fielddata": {
"memory_size_in_bytes": 4790672272,
"evictions": 0
},
"query_cache": {
"memory_size_in_bytes": 7689832903,
"total_count": 2033762560,
"hit_count": 53751516,
"miss_count": 1980011044,
"cache_size": 4087727,
"cache_count": 11319866,
"evictions": 7232139
},
"completion": {
"size_in_bytes": 0
},
"segments": {
"count": 155344,
"memory_in_bytes": 39094918196,
"terms_memory_in_bytes": 31533157295,
"stored_fields_memory_in_bytes": 5574613712,
"term_vectors_memory_in_bytes": 0,
"norms_memory_in_bytes": 449973760,
"points_memory_in_bytes": 886771949,
"doc_values_memory_in_bytes": 650401480,
"index_writer_memory_in_bytes": 905283962,
"version_map_memory_in_bytes": 1173400,
"fixed_bit_set_memory_in_bytes": 12580800,
"max_unsafe_auto_id_timestamp": 1607606224903,
"file_sizes": {}
}
},
"nodes": {
"count": {
"total": 9,
"data": 6,
"coordinating_only": 0,
"master": 3,
"ingest": 3
},
"versions": [
"6.8.1"
],
"os": {
"available_processors": 108,
"allocated_processors": 108,
"names": [
{
"name": "Linux",
"count": 9
}
],
"pretty_names": [
{
"pretty_name": "CentOS Linux 7 (Core)",
"count": 9
}
],
"mem": {
"total_in_bytes": 821975162880,
"free_in_bytes": 50684043264,
"used_in_bytes": 771291119616,
"free_percent": 6,
"used_percent": 94
}
},
"process": {
"cpu": {
"percent": 349
},
"open_file_descriptors": {
"min": 429,
"max": 9996,
"avg": 6607
}
},
"jvm": {
"max_uptime_in_millis": 43603531934,
"versions": [
{
"version": "1.8.0_222",
"vm_name": "OpenJDK 64-Bit Server VM",
"vm_version": "25.222-b10",
"vm_vendor": "Oracle Corporation",
"count": 9
}
],
"mem": {
"heap_used_in_bytes": 137629451248,
"heap_max_in_bytes": 205373571072
},
"threads": 1941
},
"fs": {
"total_in_bytes": 45245361229824,
"free_in_bytes": 28231010959360,
"available_in_bytes": 28231011147776
},
"plugins": [
{
"name": "repository-s3",
"version": "6.8.1",
"elasticsearch_version": "6.8.1",
"java_version": "1.8",
"description": "The S3 repository plugin adds S3 repositories",
"classname": "org.elasticsearch.repositories.s3.S3RepositoryPlugin",
"extended_plugins": [],
"has_native_controller": false
}
],
"network_types": {
"transport_types": {
"security4": 9
},
"http_types": {
"security4": 9
}
}
}
}
数据节点:6个 r4.4xlarge 实例
主节点:3个 m5.large 实例
1条答案
按热度按时间moiiocjp1#
不,无法更改任务创建快照的优先级。
由于您有69个挂起的任务,看起来您正在进行过多的映射(mapping)更新。
关于集群的正确大小,我建议您浏览以下博文:
https://www.elastic.co/blog/found-sizing-elasticsearch
https://docs.aws.amazon.com/elasticsearch-service/latest/developerguide/sizing-domains.html