Related
Currently I'm running into a disk space issue on my server, and I seem to have found the culprit:
Supposedly, according to some people, the size of this index is ~40 GB, which sounds ridiculous because the average list of coordinates that I save has only about 5 elements.
This index has 11k documents.
What I have tried:
Deleted the index and filled it up again. This resulted in a MUCH, MUCH smaller index on Elasticsearch (40GB -> 14MB?!), which is why I'm very skeptical as to whether this will work at all.
Tried to research this through Google, without finding any concrete solutions.
I really hope someone has some insight into why it could possibly be this big.
My Elasticsearch version is: 5.6.11
my settings:
{
"my_polygons_1": {
"settings": {
"index": {
"number_of_shards": "5",
"provided_name": "my_polygons_1",
"creation_date": "1514988794703",
"analysis": {
"filter": {
"addresstranslation": {
"type": "synonym",
"synonyms": [
"1e,eerste",
"2e,tweede",
"3e,derde",
"1ste,eerste",
"2de,tweede",
"3de,derde"
]
},
"translation": {
"token_chars": [
"letter",
"digit",
"whitespace"
],
"min_gram": "3",
"type": "nGram",
"max_gram": "50"
}
},
"analyzer": {
"translation_index_analyzer": {
"filter": "standard,lowercase,asciifolding,translation",
"type": "custom",
"tokenizer": "standard"
},
"address_search_analyzer": {
"filter": "standard,lowercase,asciifolding,addresstranslation",
"type": "custom",
"tokenizer": "standard"
},
"address_index_analyzer": {
"filter": "standard,lowercase,asciifolding,addresstranslation,translation",
"type": "custom",
"tokenizer": "standard"
},
"translation_search_analyzer": {
"filter": "standard,lowercase,asciifolding",
"type": "custom",
"tokenizer": "standard"
}
}
},
"number_of_replicas": "1",
"uuid": "lQPnGOZ6TdKx9xZwNPfs2g",
"version": {
"created": "5060399"
}
}
}
}
}
my _stats:
{
"_shards": {
"total": 10,
"successful": 10,
"failed": 0
},
"_all": {
"primaries": {
"docs": {
"count": 11331,
"deleted": 646
},
"store": {
"size_in_bytes": 22095974914,
"throttle_time_in_millis": 0
},
"indexing": {
"index_total": 1184,
"index_time_in_millis": 1166437,
"index_current": 0,
"index_failed": 0,
"delete_total": 0,
"delete_time_in_millis": 0,
"delete_current": 0,
"noop_update_total": 0,
"is_throttled": false,
"throttle_time_in_millis": 0
},
"get": {
"total": 368507,
"time_in_millis": 159070,
"exists_total": 354156,
"exists_time_in_millis": 157586,
"missing_total": 14351,
"missing_time_in_millis": 1484,
"current": 0
},
"search": {
"open_contexts": 0,
"query_total": 185,
"query_time_in_millis": 46,
"query_current": 0,
"fetch_total": 30,
"fetch_time_in_millis": 89,
"fetch_current": 0,
"scroll_total": 2,
"scroll_time_in_millis": 2444,
"scroll_current": 0,
"suggest_total": 0,
"suggest_time_in_millis": 0,
"suggest_current": 0
},
"merges": {
"current": 0,
"current_docs": 0,
"current_size_in_bytes": 0,
"total": 132,
"total_time_in_millis": 714437,
"total_docs": 6268,
"total_size_in_bytes": 9036940847,
"total_stopped_time_in_millis": 0,
"total_throttled_time_in_millis": 88138,
"total_auto_throttle_in_bytes": 73181749
},
"refresh": {
"total": 3971,
"total_time_in_millis": 1052798,
"listeners": 0
},
"flush": {
"total": 1063,
"total_time_in_millis": 10994
},
"warmer": {
"current": 0,
"total": 3474,
"total_time_in_millis": 55
},
"query_cache": {
"memory_size_in_bytes": 0,
"total_count": 0,
"hit_count": 0,
"miss_count": 0,
"cache_size": 0,
"cache_count": 0,
"evictions": 0
},
"fielddata": {
"memory_size_in_bytes": 0,
"evictions": 0
},
"completion": {
"size_in_bytes": 0
},
"segments": {
"count": 123,
"memory_in_bytes": 597667360,
"terms_memory_in_bytes": 597553396,
"stored_fields_memory_in_bytes": 38640,
"term_vectors_memory_in_bytes": 0,
"norms_memory_in_bytes": 7872,
"points_memory_in_bytes": 368,
"doc_values_memory_in_bytes": 67084,
"index_writer_memory_in_bytes": 0,
"version_map_memory_in_bytes": 0,
"fixed_bit_set_memory_in_bytes": 0,
"max_unsafe_auto_id_timestamp": -1,
"file_sizes": {}
},
"translog": {
"operations": 0,
"size_in_bytes": 215
},
"request_cache": {
"memory_size_in_bytes": 0,
"evictions": 8,
"hit_count": 0,
"miss_count": 100
},
"recovery": {
"current_as_source": 0,
"current_as_target": 0,
"throttle_time_in_millis": 0
}
},
"total": {
"docs": {
"count": 22662,
"deleted": 2356
},
"store": {
"size_in_bytes": 46187867347,
"throttle_time_in_millis": 0
},
"indexing": {
"index_total": 2263,
"index_time_in_millis": 2216831,
"index_current": 0,
"index_failed": 0,
"delete_total": 0,
"delete_time_in_millis": 0,
"delete_current": 0,
"noop_update_total": 0,
"is_throttled": false,
"throttle_time_in_millis": 0
},
"get": {
"total": 657621,
"time_in_millis": 250947,
"exists_total": 628867,
"exists_time_in_millis": 247657,
"missing_total": 28754,
"missing_time_in_millis": 3290,
"current": 0
},
"search": {
"open_contexts": 0,
"query_total": 375,
"query_time_in_millis": 128,
"query_current": 0,
"fetch_total": 73,
"fetch_time_in_millis": 219,
"fetch_current": 0,
"scroll_total": 5,
"scroll_time_in_millis": 6110,
"scroll_current": 0,
"suggest_total": 0,
"suggest_time_in_millis": 0,
"suggest_current": 0
},
"merges": {
"current": 0,
"current_docs": 0,
"current_size_in_bytes": 0,
"total": 252,
"total_time_in_millis": 1134358,
"total_docs": 10222,
"total_size_in_bytes": 13797985517,
"total_stopped_time_in_millis": 0,
"total_throttled_time_in_millis": 160514,
"total_auto_throttle_in_bytes": 155271619
},
"refresh": {
"total": 7539,
"total_time_in_millis": 1978415,
"listeners": 0
},
"flush": {
"total": 2030,
"total_time_in_millis": 21846
},
"warmer": {
"current": 0,
"total": 6641,
"total_time_in_millis": 105
},
"query_cache": {
"memory_size_in_bytes": 0,
"total_count": 0,
"hit_count": 0,
"miss_count": 0,
"cache_size": 0,
"cache_count": 0,
"evictions": 0
},
"fielddata": {
"memory_size_in_bytes": 0,
"evictions": 0
},
"completion": {
"size_in_bytes": 0
},
"segments": {
"count": 261,
"memory_in_bytes": 1246021155,
"terms_memory_in_bytes": 1245778862,
"stored_fields_memory_in_bytes": 81992,
"term_vectors_memory_in_bytes": 0,
"norms_memory_in_bytes": 16704,
"points_memory_in_bytes": 769,
"doc_values_memory_in_bytes": 142828,
"index_writer_memory_in_bytes": 0,
"version_map_memory_in_bytes": 0,
"fixed_bit_set_memory_in_bytes": 0,
"max_unsafe_auto_id_timestamp": -1,
"file_sizes": {}
},
"translog": {
"operations": 0,
"size_in_bytes": 430
},
"request_cache": {
"memory_size_in_bytes": 0,
"evictions": 16,
"hit_count": 0,
"miss_count": 200
},
"recovery": {
"current_as_source": 0,
"current_as_target": 0,
"throttle_time_in_millis": 0
}
}
},
"indices": {
"my_polygons_1": {
"primaries": {
"docs": {
"count": 11331,
"deleted": 646
},
"store": {
"size_in_bytes": 22095974914,
"throttle_time_in_millis": 0
},
"indexing": {
"index_total": 1184,
"index_time_in_millis": 1166437,
"index_current": 0,
"index_failed": 0,
"delete_total": 0,
"delete_time_in_millis": 0,
"delete_current": 0,
"noop_update_total": 0,
"is_throttled": false,
"throttle_time_in_millis": 0
},
"get": {
"total": 368507,
"time_in_millis": 159070,
"exists_total": 354156,
"exists_time_in_millis": 157586,
"missing_total": 14351,
"missing_time_in_millis": 1484,
"current": 0
},
"search": {
"open_contexts": 0,
"query_total": 185,
"query_time_in_millis": 46,
"query_current": 0,
"fetch_total": 30,
"fetch_time_in_millis": 89,
"fetch_current": 0,
"scroll_total": 2,
"scroll_time_in_millis": 2444,
"scroll_current": 0,
"suggest_total": 0,
"suggest_time_in_millis": 0,
"suggest_current": 0
},
"merges": {
"current": 0,
"current_docs": 0,
"current_size_in_bytes": 0,
"total": 132,
"total_time_in_millis": 714437,
"total_docs": 6268,
"total_size_in_bytes": 9036940847,
"total_stopped_time_in_millis": 0,
"total_throttled_time_in_millis": 88138,
"total_auto_throttle_in_bytes": 73181749
},
"refresh": {
"total": 3971,
"total_time_in_millis": 1052798,
"listeners": 0
},
"flush": {
"total": 1063,
"total_time_in_millis": 10994
},
"warmer": {
"current": 0,
"total": 3474,
"total_time_in_millis": 55
},
"query_cache": {
"memory_size_in_bytes": 0,
"total_count": 0,
"hit_count": 0,
"miss_count": 0,
"cache_size": 0,
"cache_count": 0,
"evictions": 0
},
"fielddata": {
"memory_size_in_bytes": 0,
"evictions": 0
},
"completion": {
"size_in_bytes": 0
},
"segments": {
"count": 123,
"memory_in_bytes": 597667360,
"terms_memory_in_bytes": 597553396,
"stored_fields_memory_in_bytes": 38640,
"term_vectors_memory_in_bytes": 0,
"norms_memory_in_bytes": 7872,
"points_memory_in_bytes": 368,
"doc_values_memory_in_bytes": 67084,
"index_writer_memory_in_bytes": 0,
"version_map_memory_in_bytes": 0,
"fixed_bit_set_memory_in_bytes": 0,
"max_unsafe_auto_id_timestamp": -1,
"file_sizes": {}
},
"translog": {
"operations": 0,
"size_in_bytes": 215
},
"request_cache": {
"memory_size_in_bytes": 0,
"evictions": 8,
"hit_count": 0,
"miss_count": 100
},
"recovery": {
"current_as_source": 0,
"current_as_target": 0,
"throttle_time_in_millis": 0
}
},
"total": {
"docs": {
"count": 22662,
"deleted": 2356
},
"store": {
"size_in_bytes": 46187867347,
"throttle_time_in_millis": 0
},
"indexing": {
"index_total": 2263,
"index_time_in_millis": 2216831,
"index_current": 0,
"index_failed": 0,
"delete_total": 0,
"delete_time_in_millis": 0,
"delete_current": 0,
"noop_update_total": 0,
"is_throttled": false,
"throttle_time_in_millis": 0
},
"get": {
"total": 657621,
"time_in_millis": 250947,
"exists_total": 628867,
"exists_time_in_millis": 247657,
"missing_total": 28754,
"missing_time_in_millis": 3290,
"current": 0
},
"search": {
"open_contexts": 0,
"query_total": 375,
"query_time_in_millis": 128,
"query_current": 0,
"fetch_total": 73,
"fetch_time_in_millis": 219,
"fetch_current": 0,
"scroll_total": 5,
"scroll_time_in_millis": 6110,
"scroll_current": 0,
"suggest_total": 0,
"suggest_time_in_millis": 0,
"suggest_current": 0
},
"merges": {
"current": 0,
"current_docs": 0,
"current_size_in_bytes": 0,
"total": 252,
"total_time_in_millis": 1134358,
"total_docs": 10222,
"total_size_in_bytes": 13797985517,
"total_stopped_time_in_millis": 0,
"total_throttled_time_in_millis": 160514,
"total_auto_throttle_in_bytes": 155271619
},
"refresh": {
"total": 7539,
"total_time_in_millis": 1978415,
"listeners": 0
},
"flush": {
"total": 2030,
"total_time_in_millis": 21846
},
"warmer": {
"current": 0,
"total": 6641,
"total_time_in_millis": 105
},
"query_cache": {
"memory_size_in_bytes": 0,
"total_count": 0,
"hit_count": 0,
"miss_count": 0,
"cache_size": 0,
"cache_count": 0,
"evictions": 0
},
"fielddata": {
"memory_size_in_bytes": 0,
"evictions": 0
},
"completion": {
"size_in_bytes": 0
},
"segments": {
"count": 261,
"memory_in_bytes": 1246021155,
"terms_memory_in_bytes": 1245778862,
"stored_fields_memory_in_bytes": 81992,
"term_vectors_memory_in_bytes": 0,
"norms_memory_in_bytes": 16704,
"points_memory_in_bytes": 769,
"doc_values_memory_in_bytes": 142828,
"index_writer_memory_in_bytes": 0,
"version_map_memory_in_bytes": 0,
"fixed_bit_set_memory_in_bytes": 0,
"max_unsafe_auto_id_timestamp": -1,
"file_sizes": {}
},
"translog": {
"operations": 0,
"size_in_bytes": 430
},
"request_cache": {
"memory_size_in_bytes": 0,
"evictions": 16,
"hit_count": 0,
"miss_count": 200
},
"recovery": {
"current_as_source": 0,
"current_as_target": 0,
"throttle_time_in_millis": 0
}
}
}
}
}
and my mapping:
{
"my_polygons_1": {
"aliases": {},
"mappings": {
"my_polygons_1": {
"properties": {
"client_id": {
"type": "integer"
},
"id": {
"type": "integer"
},
"name": {
"type": "keyword"
},
"polygon": {
"type": "geo_shape",
"tree": "quadtree",
"precision": "1.0m"
}
}
}
},
"settings": {
"index": {
"number_of_shards": "5",
"provided_name": "my_polygons_1",
"creation_date": "1514988794703",
"analysis": {
"filter": {
"addresstranslation": {
"type": "synonym",
"synonyms": [
"1e,eerste",
"2e,tweede",
"3e,derde",
"1ste,eerste",
"2de,tweede",
"3de,derde"
]
},
"translation": {
"token_chars": [
"letter",
"digit",
"whitespace"
],
"min_gram": "3",
"type": "nGram",
"max_gram": "50"
}
},
"analyzer": {
"translation_index_analyzer": {
"filter": "standard,lowercase,asciifolding,translation",
"type": "custom",
"tokenizer": "standard"
},
"address_search_analyzer": {
"filter": "standard,lowercase,asciifolding,addresstranslation",
"type": "custom",
"tokenizer": "standard"
},
"address_index_analyzer": {
"filter": "standard,lowercase,asciifolding,addresstranslation,translation",
"type": "custom",
"tokenizer": "standard"
},
"translation_search_analyzer": {
"filter": "standard,lowercase,asciifolding",
"type": "custom",
"tokenizer": "standard"
}
}
},
"number_of_replicas": "1",
"uuid": "lQPnGOZ6TdKx9xZwNPfs2g",
"version": {
"created": "5060399"
}
}
}
}
}
I am trying to create and restore snapshots to make a huge data set for my testing purposes. Initially, I created a few snapshots and restored them successfully. But suddenly I can't restore newly created indices. I haven't made any changes to the system, and the only difference is that the data volume is bigger now.
Elasticsearch version: 6.3.0, single node setup
Snapshot Created
PUT /_snapshot/nuwan-backup2/snapshot_transactions-cl2-2018.11.27-reindexed-x3?wait_for_completion=true
{
"indices": "transactions-2018.11.27-reindexed-1543757375.64",
"ignore_unavailable": true,
"include_global_state": false
}
Output
{
"snapshot": {
"snapshot": "snapshot_transactions-cl2-2018.11.27-reindexed-x3",
"uuid": "JhsmFXmVR12OR-65fCtFXw",
"version_id": 6030099,
"version": "6.3.0",
"indices": [
"transactions-2018.11.27-reindexed-1543757375.64"
],
"include_global_state": false,
"state": "SUCCESS",
"start_time": "2018-12-12T12:32:26.645Z",
"start_time_in_millis": 1544617946645,
"end_time": "2018-12-12T12:32:26.750Z",
"end_time_in_millis": 1544617946750,
"duration_in_millis": 105,
"failures": [],
"shards": {
"total": 5,
"failed": 0,
"successful": 5
}
}
}
Snapshot status
GET /_snapshot/nuwan-backup2/snapshot_transactions-cl2-2018.11.27-reindexed-x3/_status
Output
{
"snapshots": [
{
"snapshot": "snapshot_transactions-cl2-2018.11.27-reindexed-x3",
"repository": "nuwan-backup2",
"uuid": "JhsmFXmVR12OR-65fCtFXw",
"state": "SUCCESS",
"include_global_state": false,
"shards_stats": {
"initializing": 0,
"started": 0,
"finalizing": 0,
"done": 5,
"failed": 0,
"total": 5
},
"stats": {
"number_of_files": 0,
"processed_files": 0,
"total_size_in_bytes": 0,
"processed_size_in_bytes": 0,
"start_time_in_millis": 1544617946662,
"time_in_millis": 78
},
"indices": {
"transactions-2018.11.27-reindexed-1543757375.64": {
"shards_stats": {
"initializing": 0,
"started": 0,
"finalizing": 0,
"done": 5,
"failed": 0,
"total": 5
},
"stats": {
"number_of_files": 0,
"processed_files": 0,
"total_size_in_bytes": 0,
"processed_size_in_bytes": 0,
"start_time_in_millis": 1544617946662,
"time_in_millis": 78
},
"shards": {
"0": {
"stage": "DONE",
"stats": {
"number_of_files": 0,
"processed_files": 0,
"total_size_in_bytes": 0,
"processed_size_in_bytes": 0,
"start_time_in_millis": 1544617946696,
"time_in_millis": 17
}
},
"1": {
"stage": "DONE",
"stats": {
"number_of_files": 0,
"processed_files": 0,
"total_size_in_bytes": 0,
"processed_size_in_bytes": 0,
"start_time_in_millis": 1544617946722,
"time_in_millis": 18
}
},
"2": {
"stage": "DONE",
"stats": {
"number_of_files": 0,
"processed_files": 0,
"total_size_in_bytes": 0,
"processed_size_in_bytes": 0,
"start_time_in_millis": 1544617946662,
"time_in_millis": 18
}
},
"3": {
"stage": "DONE",
"stats": {
"number_of_files": 0,
"processed_files": 0,
"total_size_in_bytes": 0,
"processed_size_in_bytes": 0,
"start_time_in_millis": 1544617946662,
"time_in_millis": 18
}
},
"4": {
"stage": "DONE",
"stats": {
"number_of_files": 0,
"processed_files": 0,
"total_size_in_bytes": 0,
"processed_size_in_bytes": 0,
"start_time_in_millis": 1544617946696,
"time_in_millis": 20
}
}
}
}
}
}
]
}
Snapshot Restore
POST /_snapshot/nuwan-backup2/snapshot_transactions-cl2-2018.11.27-reindexed-x3/_restore
{
"indices": "snapshot-x2",
"ignore_unavailable": true,
"include_global_state": true,
"rename_pattern": "s(.+)",
"rename_replacement": "s$1"
}
Output
{
"snapshot": {
"snapshot": "snapshot_transactions-cl2-2018.11.27-reindexed-x3",
"indices": [],
"shards": {
"total": 0,
"failed": 0,
"successful": 0
}
}
}
Result
No new index generated!
I had incorrectly configured the restore request; it should be:
POST /_snapshot/nuwan-backup2/snapshot_transactions-cl2-2018.11.27-reindexed-x3/_restore
{
"indices": "transactions-2018.11.27-reindexed-1543757375.64",
"ignore_unavailable": true,
"include_global_state": true,
"rename_pattern": "transactions-2018.11.27-reindexed-1543757375.64",
"rename_replacement": "snapshot-x2"
}
I am using the AWS Elasticsearch Service, with each node having 16GB RAM, 4 cores and 160GB EBS. While looking at the output of
GET _nodes/stats
I found that I have only 0.27GB of memory left in my node. I understand the fact that approximately the following amount of memory is dedicated for these processes:
Heap : 8GB
Swap: 2GB
Fielddata + Segments: 1GB
I don't understand what happens with the rest of the 4-5GB of memory, which process is consuming this memory?
The following is the stat of one node which I got from the api mentioned above:
{
"timestamp": 1536212516381,
"name": "",
"roles": [
"master",
"data",
"ingest"
],
"indices": {
"docs": {
"count": 40811869,
"deleted": 12313549
},
"store": {
"size_in_bytes": 21211684802
},
"indexing": {
"index_total": 17141254,
"index_time_in_millis": 23271050,
"index_current": 0,
"index_failed": 0,
"delete_total": 0,
"delete_time_in_millis": 0,
"delete_current": 0,
"noop_update_total": 0,
"is_throttled": false,
"throttle_time_in_millis": 0
},
"get": {
"total": 11,
"time_in_millis": 4,
"exists_total": 10,
"exists_time_in_millis": 4,
"missing_total": 1,
"missing_time_in_millis": 0,
"current": 0
},
"search": {
"open_contexts": 0,
"query_total": 60495650,
"query_time_in_millis": 164996296,
"query_current": 0,
"fetch_total": 1338,
"fetch_time_in_millis": 3947,
"fetch_current": 0,
"scroll_total": 1541,
"scroll_time_in_millis": 147381782,
"scroll_current": 0,
"suggest_total": 0,
"suggest_time_in_millis": 0,
"suggest_current": 0
},
"merges": {
"current": 0,
"current_docs": 0,
"current_size_in_bytes": 0,
"total": 752561,
"total_time_in_millis": 156448427,
"total_docs": 6278661063,
"total_size_in_bytes": 2061451815435,
"total_stopped_time_in_millis": 0,
"total_throttled_time_in_millis": 64499,
"total_auto_throttle_in_bytes": 231968018126
},
"refresh": {
"total": 9621793,
"total_time_in_millis": 126038098,
"listeners": 0
},
"flush": {
"total": 135925,
"total_time_in_millis": 2306674
},
"warmer": {
"current": 0,
"total": 8576200,
"total_time_in_millis": 3784313
},
"query_cache": {
"memory_size_in_bytes": 47531137,
"total_count": 315917952,
"hit_count": 69088483,
"miss_count": 246829469,
"cache_size": 16561,
"cache_count": 740755,
"evictions": 724194
},
"fielddata": {
"memory_size_in_bytes": 19006048,
"evictions": 0
},
"completion": {
"size_in_bytes": 0
},
"segments": {
"count": 2256,
"memory_in_bytes": 62556325,
"terms_memory_in_bytes": 50154620,
"stored_fields_memory_in_bytes": 6587256,
"term_vectors_memory_in_bytes": 0,
"norms_memory_in_bytes": 557504,
"points_memory_in_bytes": 2812593,
"doc_values_memory_in_bytes": 2444352,
"index_writer_memory_in_bytes": 0,
"version_map_memory_in_bytes": 0,
"fixed_bit_set_memory_in_bytes": 6743824,
"max_unsafe_auto_id_timestamp": -1,
"file_sizes": {}
},
"translog": {
"operations": 322600,
"size_in_bytes": 511751430,
"uncommitted_operations": 22528,
"uncommitted_size_in_bytes": 35107521
},
"request_cache": {
"memory_size_in_bytes": 84792534,
"evictions": 13922143,
"hit_count": 7667542,
"miss_count": 35693456
},
"recovery": {
"current_as_source": 0,
"current_as_target": 0,
"throttle_time_in_millis": 952628
}
},
"os": {
"timestamp": 1536212516872,
"cpu": {
"percent": 23,
"load_average": {
"1m": 1.29,
"5m": 1.19,
"15m": 1.16
}
},
"mem": {
"total_in_bytes": 16823488512,
"free_in_bytes": 297766912,
"used_in_bytes": 16525721600,
"free_percent": 2,
"used_percent": 98
},
"swap": {
"total_in_bytes": 2147479552,
"free_in_bytes": 2143141888,
"used_in_bytes": 4337664
}
},
"process": {
"timestamp": 1536212516872,
"open_file_descriptors": 2573,
"max_file_descriptors": 128000,
"cpu": {
"percent": 19,
"total_in_millis": 4177826450
},
"mem": {
"total_virtual_in_bytes": 34029547520
}
},
"jvm": {
"timestamp": 1536212516874,
"uptime_in_millis": 6132906547,
"mem": {
"heap_used_in_bytes": 5277036968,
"heap_used_percent": 61,
"heap_committed_in_bytes": 8555069440,
"heap_max_in_bytes": 8555069440,
"non_heap_used_in_bytes": 278172640,
"non_heap_committed_in_bytes": 304259072,
"pools": {
"young": {
"used_in_bytes": 246875928,
"max_in_bytes": 279183360,
"peak_used_in_bytes": 279183360,
"peak_max_in_bytes": 279183360
},
"survivor": {
"used_in_bytes": 6813256,
"max_in_bytes": 34865152,
"peak_used_in_bytes": 34865152,
"peak_max_in_bytes": 34865152
},
"old": {
"used_in_bytes": 5023347784,
"max_in_bytes": 8241020928,
"peak_used_in_bytes": 6966292552,
"peak_max_in_bytes": 8241020928
}
}
},
"threads": {
"count": 234,
"peak_count": 250
},
"gc": {
"collectors": {
"young": {
"collection_count": 4474572,
"collection_time_in_millis": 127468649
},
"old": {
"collection_count": 920,
"collection_time_in_millis": 325448
}
}
},
"buffer_pools": {
"direct": {
"count": 463,
"used_in_bytes": 154976141,
"total_capacity_in_bytes": 154976139
},
"mapped": {
"count": 4914,
"used_in_bytes": 21027708516,
"total_capacity_in_bytes": 21027708516
}
},
"classes": {
"current_loaded_count": 26154,
"total_loaded_count": 26712,
"total_unloaded_count": 558
}
},
"thread_pool": {
"bulk": {
"threads": 4,
"queue": 0,
"active": 0,
"rejected": 0,
"largest": 4,
"completed": 17141525
},
"fetch_shard_started": {
"threads": 0,
"queue": 0,
"active": 0,
"rejected": 0,
"largest": 0,
"completed": 0
},
"fetch_shard_store": {
"threads": 0,
"queue": 0,
"active": 0,
"rejected": 0,
"largest": 0,
"completed": 0
},
"flush": {
"threads": 2,
"queue": 0,
"active": 0,
"rejected": 0,
"largest": 2,
"completed": 271881
},
"force_merge": {
"threads": 0,
"queue": 0,
"active": 0,
"rejected": 0,
"largest": 0,
"completed": 0
},
"generic": {
"threads": 32,
"queue": 0,
"active": 0,
"rejected": 0,
"largest": 128,
"completed": 43205055
},
"get": {
"threads": 4,
"queue": 0,
"active": 0,
"rejected": 0,
"largest": 4,
"completed": 8
},
"index": {
"threads": 3,
"queue": 0,
"active": 0,
"rejected": 0,
"largest": 3,
"completed": 3
},
"listener": {
"threads": 2,
"queue": 0,
"active": 0,
"rejected": 0,
"largest": 2,
"completed": 4
},
"management": {
"threads": 5,
"queue": 0,
"active": 1,
"rejected": 0,
"largest": 5,
"completed": 28115022
},
"refresh": {
"threads": 2,
"queue": 0,
"active": 0,
"rejected": 0,
"largest": 2,
"completed": 1023804661
},
"search": {
"threads": 7,
"queue": 0,
"active": 0,
"rejected": 0,
"largest": 7,
"completed": 161702240
},
"snapshot": {
"threads": 1,
"queue": 0,
"active": 0,
"rejected": 0,
"largest": 2,
"completed": 21133
},
"warmer": {
"threads": 2,
"queue": 0,
"active": 0,
"rejected": 0,
"largest": 2,
"completed": 95146934
}
},
"fs": {
"timestamp": 1536212516874,
"total": {
"total_in_bytes": 168968957952,
"free_in_bytes": 147126472704,
"available_in_bytes": 138519760896
},
"data": [
{
"type": "ext4",
"total_in_bytes": 168968957952,
"free_in_bytes": 147126472704,
"available_in_bytes": 138519760896
}
],
"io_stats": {
"devices": [
{
"device_name": "xvdf",
"operations": 133367878,
"read_operations": 1456763,
"write_operations": 131911115,
"read_kilobytes": 104740824,
"write_kilobytes": 3178855500
}
],
"total": {
"operations": 133367878,
"read_operations": 1456763,
"write_operations": 131911115,
"read_kilobytes": 104740824,
"write_kilobytes": 3178855500
}
}
},
"breakers": {
"request": {
"limit_size_in_bytes": 5133041664,
"limit_size": "4.7gb",
"estimated_size_in_bytes": 0,
"estimated_size": "0b",
"overhead": 1,
"tripped": 0
},
"fielddata": {
"limit_size_in_bytes": 5133041664,
"limit_size": "4.7gb",
"estimated_size_in_bytes": 19006048,
"estimated_size": "18.1mb",
"overhead": 1.03,
"tripped": 0
},
"in_flight_requests": {
"limit_size_in_bytes": 8555069440,
"limit_size": "7.9gb",
"estimated_size_in_bytes": 1657,
"estimated_size": "1.6kb",
"overhead": 1,
"tripped": 0
},
"accounting": {
"limit_size_in_bytes": 8555069440,
"limit_size": "7.9gb",
"estimated_size_in_bytes": 62556325,
"estimated_size": "59.6mb",
"overhead": 1,
"tripped": 0
},
"parent": {
"limit_size_in_bytes": 5988548608,
"limit_size": "5.5gb",
"estimated_size_in_bytes": 81564030,
"estimated_size": "77.7mb",
"overhead": 1,
"tripped": 0
}
},
"script": {
"compilations": 5,
"cache_evictions": 0
},
"discovery": {
"cluster_state_queue": {
"total": 0,
"pending": 0,
"committed": 0
},
"published_cluster_states": {
"full_states": 1,
"incompatible_diffs": 0,
"compatible_diffs": 70303
}
},
"ingest": {
"total": {
"count": 0,
"time_in_millis": 0,
"current": 0,
"failed": 0
},
"pipelines": {}
},
"adaptive_selection": {
"qhqf-YADRF2gS1Vu6EV_8Q": {
"outgoing_searches": 0,
"avg_queue_size": 0,
"avg_service_time_ns": 6520537,
"avg_response_time_ns": 15403676,
"rank": "15.4"
},
"I21NiLksQqCNV3-vP3uCNA": {
"outgoing_searches": 0,
"avg_queue_size": 0,
"avg_service_time_ns": 3079216,
"avg_response_time_ns": 1115616,
"rank": "1.1"
},
"T2_cLfzrQBKd7WTR0p6jWQ": {
"outgoing_searches": 0,
"avg_queue_size": 0,
"avg_service_time_ns": 12493125,
"avg_response_time_ns": 1141514,
"rank": "1.1"
},
"ZZYgl3WARsKE-80HXhRbVw": {
"outgoing_searches": 0,
"avg_queue_size": 0,
"avg_service_time_ns": 3919880,
"avg_response_time_ns": 6063593,
"rank": "6.1"
}
}
}
Can anyone please help explain the memory distribution in this node? Is it okay to have only 0.27GB free memory space or what should I do to make more free memory available in the node?
I'm new to Elasticsearch and have recently set up a flow that stores JMX data, polled every 10 seconds, into an Elasticsearch index that looks like this:
{
"jmxmetrics": {
"mappings": {
"kafkajmx": {
"properties": {
"#timestamp": {
"type": "date"
},
"#version": {
"type": "keyword"
},
"attr_type": {
"type": "keyword"
},
"host": {
"type": "keyword"
},
"kafka_broker_id": {
"type": "keyword"
},
"kafka_clientId": {
"type": "keyword"
},
"kafka_fetcher_id": {
"type": "keyword"
},
"kafka_metric_group": {
"type": "keyword"
},
"kafka_metric_name": {
"type": "keyword"
},
"kafka_metric_type": {
"type": "keyword"
},
"kafka_topic": {
"type": "keyword"
},
"metric_path": {
"type": "text"
},
"metric_value_number": {
"type": "long"
},
"metric_value_string": {
"type": "keyword"
},
"path": {
"type": "text"
},
"topic_partition": {
"type": "keyword"
}
}
}
}
}
}
I'm then using a web portal built in ReactJS to hit the API endpoints in Elasticsearch so that I can populate things like the hosts in a drop-down, or the topics on the host that was selected.
For example, if I run this query:
POST /jmxmetrics/kafkajmx/_search
{
"size": 0,
"aggs" : {
"topics": {
"filter": {
"range": {
"#timestamp": {
"from": "now-60s"
}
}
},
"aggs": {
"topics":{
"terms": {
"field": "kafka_topic",
"size": 500
}
}
}
}
},
"query": {
"match": {
"host": "host_A"
}
}
}
it takes about 25 seconds to return:
{
"took": 24709,
"timed_out": false,
"_shards": {
"total": 3,
"successful": 3,
"failed": 0
},
"hits": {
"total": 1053380207,
"max_score": 0,
"hits": []
},
"aggregations": {
"topics": {
"doc_count": 54915,
"topics": {
"doc_count_error_upper_bound": 189,
"sum_other_doc_count": 45098,
"buckets": [
{
"key": "__consumer_offsets",
"doc_count": 503
},
{
"key": "topic 1",
"doc_count": 196
},
{
"key": "topic 2",
"doc_count": 193
},
{
"key": "topic 3",
"doc_count": 142
},
...
]
}
}
}
}
Any Elasticsearch aggregation query seems to take 10+ seconds to run. My cluster topology looks like this (running on AWS EC2):
3 master/data nodes c4.2xlarge (8 cores and 15GB RAM)
1 client node t2.large (2 cores and 8GB RAM)
Any idea on what I could be improving here? I know this is a fairly broad question but any pointers will be helpful.
-------EDIT--------
Here are my settings:
{
"jmxmetrics": {
"settings": {
"index": {
"creation_date": "1489771989403",
"number_of_shards": "3",
"number_of_replicas": "2",
"uuid": "DeLP9MrQT6S_kILMmXorew",
"version": {
"created": "5020199"
},
"provided_name": "sdpjmx"
}
}
}
}
also, here are my stats:
{
"_shards": {
"total": 9,
"successful": 9,
"failed": 0
},
"_all": {
"primaries": {
"docs": {
"count": 1402484967,
"deleted": 0
},
"store": {
"size_in_bytes": 261239372859,
"throttle_time_in_millis": 0
},
"indexing": {
"index_total": 1402487151,
"index_time_in_millis": 108231827,
"index_current": 0,
"index_failed": 0,
"delete_total": 0,
"delete_time_in_millis": 0,
"delete_current": 0,
"noop_update_total": 0,
"is_throttled": false,
"throttle_time_in_millis": 0
},
"get": {
"total": 1,
"time_in_millis": 13,
"exists_total": 0,
"exists_time_in_millis": 0,
"missing_total": 1,
"missing_time_in_millis": 13,
"current": 0
},
"search": {
"open_contexts": 0,
"query_total": 692,
"query_time_in_millis": 1390846,
"query_current": 0,
"fetch_total": 76,
"fetch_time_in_millis": 15444,
"fetch_current": 0,
"scroll_total": 0,
"scroll_time_in_millis": 0,
"scroll_current": 0,
"suggest_total": 0,
"suggest_time_in_millis": 0,
"suggest_current": 0
},
"merges": {
"current": 4,
"current_docs": 57546764,
"current_size_in_bytes": 10961768409,
"total": 359830,
"total_time_in_millis": 298632418,
"total_docs": 8639051262,
"total_size_in_bytes": 1733171768674,
"total_stopped_time_in_millis": 0,
"total_throttled_time_in_millis": 208268389,
"total_auto_throttle_in_bytes": 15728640
},
"refresh": {
"total": 2290338,
"total_time_in_millis": 27698495,
"listeners": 0
},
"flush": {
"total": 1398,
"total_time_in_millis": 512144
},
"warmer": {
"current": 0,
"total": 2291685,
"total_time_in_millis": 365893
},
"query_cache": {
"memory_size_in_bytes": 131229184,
"total_count": 13019,
"hit_count": 905,
"miss_count": 12114,
"cache_size": 118,
"cache_count": 139,
"evictions": 21
},
"fielddata": {
"memory_size_in_bytes": 0,
"evictions": 0
},
"completion": {
"size_in_bytes": 0
},
"segments": {
"count": 167,
"memory_in_bytes": 868415719,
"terms_memory_in_bytes": 731359089,
"stored_fields_memory_in_bytes": 125593776,
"term_vectors_memory_in_bytes": 0,
"norms_memory_in_bytes": 32064,
"points_memory_in_bytes": 11138810,
"doc_values_memory_in_bytes": 291980,
"index_writer_memory_in_bytes": 9788964,
"version_map_memory_in_bytes": 290304,
"fixed_bit_set_memory_in_bytes": 0,
"max_unsafe_auto_id_timestamp": -1,
"file_sizes": {}
},
"translog": {
"operations": 529724,
"size_in_bytes": 275528684
},
"request_cache": {
"memory_size_in_bytes": 0,
"evictions": 0,
"hit_count": 0,
"miss_count": 84
},
"recovery": {
"current_as_source": 0,
"current_as_target": 0,
"throttle_time_in_millis": 0
}
},
"total": {
"docs": {
"count": 4207454779,
"deleted": 0
},
"store": {
"size_in_bytes": 776849456528,
"throttle_time_in_millis": 0
},
"indexing": {
"index_total": 4207461365,
"index_time_in_millis": 333522565,
"index_current": 0,
"index_failed": 0,
"delete_total": 0,
"delete_time_in_millis": 0,
"delete_current": 0,
"noop_update_total": 0,
"is_throttled": false,
"throttle_time_in_millis": 0
},
"get": {
"total": 2,
"time_in_millis": 13,
"exists_total": 0,
"exists_time_in_millis": 0,
"missing_total": 2,
"missing_time_in_millis": 13,
"current": 0
},
"search": {
"open_contexts": 0,
"query_total": 2046,
"query_time_in_millis": 4439867,
"query_current": 0,
"fetch_total": 204,
"fetch_time_in_millis": 61910,
"fetch_current": 0,
"scroll_total": 0,
"scroll_time_in_millis": 0,
"scroll_current": 0,
"suggest_total": 0,
"suggest_time_in_millis": 0,
"suggest_current": 0
},
"merges": {
"current": 9,
"current_docs": 90922106,
"current_size_in_bytes": 17436129588,
"total": 993305,
"total_time_in_millis": 889392309,
"total_docs": 25596362951,
"total_size_in_bytes": 5109527514241,
"total_stopped_time_in_millis": 0,
"total_throttled_time_in_millis": 622031369,
"total_auto_throttle_in_bytes": 47185920
},
"refresh": {
"total": 6870703,
"total_time_in_millis": 80442220,
"listeners": 0
},
"flush": {
"total": 4194,
"total_time_in_millis": 1542414
},
"warmer": {
"current": 0,
"total": 6874724,
"total_time_in_millis": 1048456
},
"query_cache": {
"memory_size_in_bytes": 428618904,
"total_count": 38315,
"hit_count": 3196,
"miss_count": 35119,
"cache_size": 371,
"cache_count": 438,
"evictions": 67
},
"fielddata": {
"memory_size_in_bytes": 0,
"evictions": 0
},
"completion": {
"size_in_bytes": 0
},
"segments": {
"count": 492,
"memory_in_bytes": 2604314152,
"terms_memory_in_bytes": 2194198429,
"stored_fields_memory_in_bytes": 375756256,
"term_vectors_memory_in_bytes": 0,
"norms_memory_in_bytes": 94464,
"points_memory_in_bytes": 33422427,
"doc_values_memory_in_bytes": 842576,
"index_writer_memory_in_bytes": 22793264,
"version_map_memory_in_bytes": 853888,
"fixed_bit_set_memory_in_bytes": 0,
"max_unsafe_auto_id_timestamp": -1,
"file_sizes": {}
},
"translog": {
"operations": 1591047,
"size_in_bytes": 827579505
},
"request_cache": {
"memory_size_in_bytes": 0,
"evictions": 0,
"hit_count": 0,
"miss_count": 345
},
"recovery": {
"current_as_source": 0,
"current_as_target": 0,
"throttle_time_in_millis": 0
}
}
},
"indices": {
"jmxmetrics": {
"primaries": {
"docs": {
"count": 1402484967,
"deleted": 0
},
"store": {
"size_in_bytes": 261239372859,
"throttle_time_in_millis": 0
},
"indexing": {
"index_total": 1402487151,
"index_time_in_millis": 108231827,
"index_current": 0,
"index_failed": 0,
"delete_total": 0,
"delete_time_in_millis": 0,
"delete_current": 0,
"noop_update_total": 0,
"is_throttled": false,
"throttle_time_in_millis": 0
},
"get": {
"total": 1,
"time_in_millis": 13,
"exists_total": 0,
"exists_time_in_millis": 0,
"missing_total": 1,
"missing_time_in_millis": 13,
"current": 0
},
"search": {
"open_contexts": 0,
"query_total": 692,
"query_time_in_millis": 1390846,
"query_current": 0,
"fetch_total": 76,
"fetch_time_in_millis": 15444,
"fetch_current": 0,
"scroll_total": 0,
"scroll_time_in_millis": 0,
"scroll_current": 0,
"suggest_total": 0,
"suggest_time_in_millis": 0,
"suggest_current": 0
},
"merges": {
"current": 4,
"current_docs": 57546764,
"current_size_in_bytes": 10961768409,
"total": 359830,
"total_time_in_millis": 298632418,
"total_docs": 8639051262,
"total_size_in_bytes": 1733171768674,
"total_stopped_time_in_millis": 0,
"total_throttled_time_in_millis": 208268389,
"total_auto_throttle_in_bytes": 15728640
},
"refresh": {
"total": 2290338,
"total_time_in_millis": 27698495,
"listeners": 0
},
"flush": {
"total": 1398,
"total_time_in_millis": 512144
},
"warmer": {
"current": 0,
"total": 2291685,
"total_time_in_millis": 365893
},
"query_cache": {
"memory_size_in_bytes": 131229184,
"total_count": 13019,
"hit_count": 905,
"miss_count": 12114,
"cache_size": 118,
"cache_count": 139,
"evictions": 21
},
"fielddata": {
"memory_size_in_bytes": 0,
"evictions": 0
},
"completion": {
"size_in_bytes": 0
},
"segments": {
"count": 167,
"memory_in_bytes": 868415719,
"terms_memory_in_bytes": 731359089,
"stored_fields_memory_in_bytes": 125593776,
"term_vectors_memory_in_bytes": 0,
"norms_memory_in_bytes": 32064,
"points_memory_in_bytes": 11138810,
"doc_values_memory_in_bytes": 291980,
"index_writer_memory_in_bytes": 9788964,
"version_map_memory_in_bytes": 290304,
"fixed_bit_set_memory_in_bytes": 0,
"max_unsafe_auto_id_timestamp": -1,
"file_sizes": {}
},
"translog": {
"operations": 529724,
"size_in_bytes": 275528684
},
"request_cache": {
"memory_size_in_bytes": 0,
"evictions": 0,
"hit_count": 0,
"miss_count": 84
},
"recovery": {
"current_as_source": 0,
"current_as_target": 0,
"throttle_time_in_millis": 0
}
},
"total": {
"docs": {
"count": 4207454779,
"deleted": 0
},
"store": {
"size_in_bytes": 776849456528,
"throttle_time_in_millis": 0
},
"indexing": {
"index_total": 4207461365,
"index_time_in_millis": 333522565,
"index_current": 0,
"index_failed": 0,
"delete_total": 0,
"delete_time_in_millis": 0,
"delete_current": 0,
"noop_update_total": 0,
"is_throttled": false,
"throttle_time_in_millis": 0
},
"get": {
"total": 2,
"time_in_millis": 13,
"exists_total": 0,
"exists_time_in_millis": 0,
"missing_total": 2,
"missing_time_in_millis": 13,
"current": 0
},
"search": {
"open_contexts": 0,
"query_total": 2046,
"query_time_in_millis": 4439867,
"query_current": 0,
"fetch_total": 204,
"fetch_time_in_millis": 61910,
"fetch_current": 0,
"scroll_total": 0,
"scroll_time_in_millis": 0,
"scroll_current": 0,
"suggest_total": 0,
"suggest_time_in_millis": 0,
"suggest_current": 0
},
"merges": {
"current": 9,
"current_docs": 90922106,
"current_size_in_bytes": 17436129588,
"total": 993305,
"total_time_in_millis": 889392309,
"total_docs": 25596362951,
"total_size_in_bytes": 5109527514241,
"total_stopped_time_in_millis": 0,
"total_throttled_time_in_millis": 622031369,
"total_auto_throttle_in_bytes": 47185920
},
"refresh": {
"total": 6870703,
"total_time_in_millis": 80442220,
"listeners": 0
},
"flush": {
"total": 4194,
"total_time_in_millis": 1542414
},
"warmer": {
"current": 0,
"total": 6874724,
"total_time_in_millis": 1048456
},
"query_cache": {
"memory_size_in_bytes": 428618904,
"total_count": 38315,
"hit_count": 3196,
"miss_count": 35119,
"cache_size": 371,
"cache_count": 438,
"evictions": 67
},
"fielddata": {
"memory_size_in_bytes": 0,
"evictions": 0
},
"completion": {
"size_in_bytes": 0
},
"segments": {
"count": 492,
"memory_in_bytes": 2604314152,
"terms_memory_in_bytes": 2194198429,
"stored_fields_memory_in_bytes": 375756256,
"term_vectors_memory_in_bytes": 0,
"norms_memory_in_bytes": 94464,
"points_memory_in_bytes": 33422427,
"doc_values_memory_in_bytes": 842576,
"index_writer_memory_in_bytes": 22793264,
"version_map_memory_in_bytes": 853888,
"fixed_bit_set_memory_in_bytes": 0,
"max_unsafe_auto_id_timestamp": -1,
"file_sizes": {}
},
"translog": {
"operations": 1591047,
"size_in_bytes": 827579505
},
"request_cache": {
"memory_size_in_bytes": 0,
"evictions": 0,
"hit_count": 0,
"miss_count": 345
},
"recovery": {
"current_as_source": 0,
"current_as_target": 0,
"throttle_time_in_millis": 0
}
}
}
}
}
Note: This is cross-posted on the elasticsearch forum (https://discuss.elastic.co/t/store-size-1-000-times-the-document-byte-size/74258/4).
I am experiencing a roughly 1,000x increase in store.size over the document byte size. I've got a very simple mapping with very small documents (less than 1kb) and I've compared my mapping to Elasticsearch's internal mapping and they are the same, so it does not appear that there is any dynamic mapping going on.
So far, I have ingested 60,437 documents and have a store.size of 19.6 GB (an average of roughly 300 KB per document), but the average byte size (String.getBytes().length) of the JSON is only 300-400 bytes per document. In another run, the documents were averaging about 1 MB to 3 MB each.
I'm using Elasticsearch 5.2 on an M4.2xlarge EC2 instance. Elasticsearch was installed with almost all defaults, except for what I needed to change in order to pass the bootstrap checks and bind to a non-local IP. I've allocated 16GB (half of my physical memory) to Elasticsearch.
I used to run Elasticsearch 2.x, where I was ingesting FAR more fields and much larger documents than just this handful of fields, and I was only seeing about 20 KB per document, which was still substantial, though manageable.
If anyone can point out anything that would fix this, I would appreciate it. Or is there an ES 5.x configuration I haven't seen that will resolve this?
Below is my mapping.
{
"settings": {
"index.query.default_field": "tweetText"
},
"mappings": {
"tweet": {
"_all": {
"enabled": false
},
"properties": {
"tweetDate": {
"type": "date",
"format": "EEE MMM dd HH:mm:ss Z YYYY||strict_date_optional_time||epoch_millis"
},
"userId": {
"type": "text",
"index": "not_analyzed"
},
"screenName": {
"type": "text",
"index": "not_analyzed"
},
"tweetText": {
"type": "text"
},
"cleanedText": {
"type": "text"
},
"tweetId": {
"type": "text",
"index": "not_analyzed"
},
"location": {
"type": "geo_point",
"ignore_malformed": true
},
"placeName": {
"type": "keyword",
"doc_values": true,
"eager_global_ordinals": false
},
"placeCountry": {
"type": "keyword",
"doc_values": true,
"eager_global_ordinals": true
},
"placeCountryCode": {
"type": "keyword",
"doc_values": false,
"eager_global_ordinals": false,
"index": false
},
"placeBoundingBox": {
"type": "geo_shape",
"tree": "quadtree",
"precision": "1m"
},
"resolvedUrls": {
"type": "text",
"index": "not_analyzed"
},
"hashtags": {
"type": "text"
},
"mentions": {
"type": "text"
},
"geoInferences": {
"properties": {
"matchedName": {
"type": "text"
},
"asciiName": {
"type": "keyword",
"doc_values": true,
"eager_global_ordinals": false
},
"country": {
"type": "keyword",
"doc_values": true,
"eager_global_ordinals": true
},
"county": {
"type": "text"
},
"countryCode": {
"type": "keyword",
"doc_values": false,
"eager_global_ordinals": false,
"index": false
},
"city": {
"type": "text"
},
"admin1Code": {
"type": "keyword",
"doc_values": false,
"eager_global_ordinals": false,
"index": false
},
"admin2Code": {
"type": "keyword",
"doc_values": false,
"eager_global_ordinals": false,
"index": false
},
"admin3Code": {
"type": "keyword",
"doc_values": false,
"eager_global_ordinals": false,
"index": false
},
"admin4Code": {
"type": "keyword",
"doc_values": false,
"eager_global_ordinals": false,
"index": false
},
"confidence": {
"type": "float",
"doc_values": false,
"ignore_malformed": false,
"index": false
},
"coordinates": {
"type": "geo_point",
"ignore_malformed": true
}
}
},
"temporalInferences": {
"type": "date",
"ignore_malformed": true
}
}
}
}
}
A sample document:
{
"_index": "twitter",
"_type": "tweet",
"_id": "AVoZivLca9LOhnR10_ll",
"_score": null,
"_source": {
"tweetDate": 1486487211000,
"userId": "123456789",
"screenName": "removed",
"tweetText": "RT #wef: America’s dominance is over. By 2030, we'll have a handful of global powers https://www.weforum.org/agenda/2016/11/america-s-dominance-is-over/?utm_content=buffer73cd5&utm_medium=social&utm_source=twitter.com&utm_campaign=buffer #wef17 https://twitter.com/wef/status/828994745200435200/photo/1",
"cleanedText": "RT #wef: America s dominance is over. By 2030, we'll have a handful of global powers https://www.weforum.org/agenda/2016/11/america-s-dominance-is-over/?utm_content=buffer73cd5&utm_medium=social&utm_source=twitter.com&utm_campaign=buffer #wef17 https://twitter.com/wef/status/828994745200435200/photo/1",
"tweetId": "829013568288796672",
"resolvedUrls": [
"https://www.weforum.org/agenda/2016/11/america-s-dominance-is-over/?utm_content=buffer73cd5&utm_medium=social&utm_source=twitter.com&utm_campaign=buffer"
],
"hashtags": [
"wef17"
],
"mentions": [
"wef"
],
"geoInferences": [
{
"matchedName": "America",
"asciiName": "United States",
"country": "United States",
"countryCode": "US",
"coordinates": [
-98.5,
39.76
],
"admin1Code": "00",
"admin2Code": "",
"admin3Code": "",
"admin4Code": "",
"confidence": 1
}
],
"temporalInferences": [
1893474000000
]
},
"fields": {
"temporalInferences": [
1893474000000
],
"tweetDate": [
1486487211000
]
},
"sort": [
1486487211000
]
}
The output from
GET /_cat/indices/twitter?pri&v&h=health,index,pri,rep,docs.count,mt,pri,rep,docs.count,store.size,pri.store.size
health | index | pri | rep | docs.count | mt | pri.mt | store.size | pri.store.size | pri.store.size
yellow | twitter | 5 | 1 | 26860 | 74 | 74 | 10.1gb | 10.1gb | 10.1gb
The output from:
GET /twitter/_stats
{
"_shards": {
"total": 10,
"successful": 5,
"failed": 0
},
"_all": {
"primaries": {
"docs": {
"count": 26860,
"deleted": 0
},
"store": {
"size_in_bytes": 11027965678,
"throttle_time_in_millis": 0
},
"indexing": {
"index_total": 27397,
"index_time_in_millis": 3568991,
"index_current": 1,
"index_failed": 0,
"delete_total": 0,
"delete_time_in_millis": 0,
"delete_current": 0,
"noop_update_total": 0,
"is_throttled": false,
"throttle_time_in_millis": 195961
},
"get": {
"total": 0,
"time_in_millis": 0,
"exists_total": 0,
"exists_time_in_millis": 0,
"missing_total": 0,
"missing_time_in_millis": 0,
"current": 0
},
"search": {
"open_contexts": 0,
"query_total": 55,
"query_time_in_millis": 294,
"query_current": 0,
"fetch_total": 36,
"fetch_time_in_millis": 3209,
"fetch_current": 0,
"scroll_total": 0,
"scroll_time_in_millis": 0,
"scroll_current": 0,
"suggest_total": 0,
"suggest_time_in_millis": 0,
"suggest_current": 0
},
"merges": {
"current": 0,
"current_docs": 0,
"current_size_in_bytes": 0,
"total": 76,
"total_time_in_millis": 350987,
"total_docs": 45409,
"total_size_in_bytes": 4027595474,
"total_stopped_time_in_millis": 0,
"total_throttled_time_in_millis": 48633,
"total_auto_throttle_in_bytes": 82233108
},
"refresh": {
"total": 857,
"total_time_in_millis": 2994887,
"listeners": 0
},
"flush": {
"total": 15,
"total_time_in_millis": 291939
},
"warmer": {
"current": 0,
"total": 876,
"total_time_in_millis": 534
},
"query_cache": {
"memory_size_in_bytes": 0,
"total_count": 0,
"hit_count": 0,
"miss_count": 0,
"cache_size": 0,
"cache_count": 0,
"evictions": 0
},
"fielddata": {
"memory_size_in_bytes": 24808,
"evictions": 0
},
"completion": {
"size_in_bytes": 0
},
"segments": {
"count": 139,
"memory_in_bytes": 186032131,
"terms_memory_in_bytes": 185758725,
"stored_fields_memory_in_bytes": 43976,
"term_vectors_memory_in_bytes": 0,
"norms_memory_in_bytes": 77888,
"points_memory_in_bytes": 714,
"doc_values_memory_in_bytes": 150828,
"index_writer_memory_in_bytes": 1316180948,
"version_map_memory_in_bytes": 42250,
"fixed_bit_set_memory_in_bytes": 0,
"max_unsafe_auto_id_timestamp": -1,
"file_sizes": {
}
},
"translog": {
"operations": 11997,
"size_in_bytes": 5555179
},
"request_cache": {
"memory_size_in_bytes": 0,
"evictions": 0,
"hit_count": 195,
"miss_count": 195
},
"recovery": {
"current_as_source": 0,
"current_as_target": 0,
"throttle_time_in_millis": 0
}
},
"total": {
"docs": {
"count": 26860,
"deleted": 0
},
"store": {
"size_in_bytes": 11027965678,
"throttle_time_in_millis": 0
},
"indexing": {
"index_total": 27397,
"index_time_in_millis": 3568991,
"index_current": 1,
"index_failed": 0,
"delete_total": 0,
"delete_time_in_millis": 0,
"delete_current": 0,
"noop_update_total": 0,
"is_throttled": false,
"throttle_time_in_millis": 195961
},
"get": {
"total": 0,
"time_in_millis": 0,
"exists_total": 0,
"exists_time_in_millis": 0,
"missing_total": 0,
"missing_time_in_millis": 0,
"current": 0
},
"search": {
"open_contexts": 0,
"query_total": 55,
"query_time_in_millis": 294,
"query_current": 0,
"fetch_total": 36,
"fetch_time_in_millis": 3209,
"fetch_current": 0,
"scroll_total": 0,
"scroll_time_in_millis": 0,
"scroll_current": 0,
"suggest_total": 0,
"suggest_time_in_millis": 0,
"suggest_current": 0
},
"merges": {
"current": 0,
"current_docs": 0,
"current_size_in_bytes": 0,
"total": 76,
"total_time_in_millis": 350987,
"total_docs": 45409,
"total_size_in_bytes": 4027595474,
"total_stopped_time_in_millis": 0,
"total_throttled_time_in_millis": 48633,
"total_auto_throttle_in_bytes": 82233108
},
"refresh": {
"total": 857,
"total_time_in_millis": 2994887,
"listeners": 0
},
"flush": {
"total": 15,
"total_time_in_millis": 291939
},
"warmer": {
"current": 0,
"total": 876,
"total_time_in_millis": 534
},
"query_cache": {
"memory_size_in_bytes": 0,
"total_count": 0,
"hit_count": 0,
"miss_count": 0,
"cache_size": 0,
"cache_count": 0,
"evictions": 0
},
"fielddata": {
"memory_size_in_bytes": 24808,
"evictions": 0
},
"completion": {
"size_in_bytes": 0
},
"segments": {
"count": 139,
"memory_in_bytes": 186032131,
"terms_memory_in_bytes": 185758725,
"stored_fields_memory_in_bytes": 43976,
"term_vectors_memory_in_bytes": 0,
"norms_memory_in_bytes": 77888,
"points_memory_in_bytes": 714,
"doc_values_memory_in_bytes": 150828,
"index_writer_memory_in_bytes": 1316180948,
"version_map_memory_in_bytes": 42250,
"fixed_bit_set_memory_in_bytes": 0,
"max_unsafe_auto_id_timestamp": -1,
"file_sizes": {
}
},
"translog": {
"operations": 11997,
"size_in_bytes": 5555179
},
"request_cache": {
"memory_size_in_bytes": 0,
"evictions": 0,
"hit_count": 195,
"miss_count": 195
},
"recovery": {
"current_as_source": 0,
"current_as_target": 0,
"throttle_time_in_millis": 0
}
}
},
"indices": {
"twitter": {
"primaries": {
"docs": {
"count": 26860,
"deleted": 0
},
"store": {
"size_in_bytes": 11027965678,
"throttle_time_in_millis": 0
},
"indexing": {
"index_total": 27397,
"index_time_in_millis": 3568991,
"index_current": 1,
"index_failed": 0,
"delete_total": 0,
"delete_time_in_millis": 0,
"delete_current": 0,
"noop_update_total": 0,
"is_throttled": false,
"throttle_time_in_millis": 195961
},
"get": {
"total": 0,
"time_in_millis": 0,
"exists_total": 0,
"exists_time_in_millis": 0,
"missing_total": 0,
"missing_time_in_millis": 0,
"current": 0
},
"search": {
"open_contexts": 0,
"query_total": 55,
"query_time_in_millis": 294,
"query_current": 0,
"fetch_total": 36,
"fetch_time_in_millis": 3209,
"fetch_current": 0,
"scroll_total": 0,
"scroll_time_in_millis": 0,
"scroll_current": 0,
"suggest_total": 0,
"suggest_time_in_millis": 0,
"suggest_current": 0
},
"merges": {
"current": 0,
"current_docs": 0,
"current_size_in_bytes": 0,
"total": 76,
"total_time_in_millis": 350987,
"total_docs": 45409,
"total_size_in_bytes": 4027595474,
"total_stopped_time_in_millis": 0,
"total_throttled_time_in_millis": 48633,
"total_auto_throttle_in_bytes": 82233108
},
"refresh": {
"total": 857,
"total_time_in_millis": 2994887,
"listeners": 0
},
"flush": {
"total": 15,
"total_time_in_millis": 291939
},
"warmer": {
"current": 0,
"total": 876,
"total_time_in_millis": 534
},
"query_cache": {
"memory_size_in_bytes": 0,
"total_count": 0,
"hit_count": 0,
"miss_count": 0,
"cache_size": 0,
"cache_count": 0,
"evictions": 0
},
"fielddata": {
"memory_size_in_bytes": 24808,
"evictions": 0
},
"completion": {
"size_in_bytes": 0
},
"segments": {
"count": 139,
"memory_in_bytes": 186032131,
"terms_memory_in_bytes": 185758725,
"stored_fields_memory_in_bytes": 43976,
"term_vectors_memory_in_bytes": 0,
"norms_memory_in_bytes": 77888,
"points_memory_in_bytes": 714,
"doc_values_memory_in_bytes": 150828,
"index_writer_memory_in_bytes": 1316180948,
"version_map_memory_in_bytes": 42250,
"fixed_bit_set_memory_in_bytes": 0,
"max_unsafe_auto_id_timestamp": -1,
"file_sizes": {
}
},
"translog": {
"operations": 11997,
"size_in_bytes": 5555179
},
"request_cache": {
"memory_size_in_bytes": 0,
"evictions": 0,
"hit_count": 195,
"miss_count": 195
},
"recovery": {
"current_as_source": 0,
"current_as_target": 0,
"throttle_time_in_millis": 0
}
},
"total": {
"docs": {
"count": 26860,
"deleted": 0
},
"store": {
"size_in_bytes": 11027965678,
"throttle_time_in_millis": 0
},
"indexing": {
"index_total": 27397,
"index_time_in_millis": 3568991,
"index_current": 1,
"index_failed": 0,
"delete_total": 0,
"delete_time_in_millis": 0,
"delete_current": 0,
"noop_update_total": 0,
"is_throttled": false,
"throttle_time_in_millis": 195961
},
"get": {
"total": 0,
"time_in_millis": 0,
"exists_total": 0,
"exists_time_in_millis": 0,
"missing_total": 0,
"missing_time_in_millis": 0,
"current": 0
},
"search": {
"open_contexts": 0,
"query_total": 55,
"query_time_in_millis": 294,
"query_current": 0,
"fetch_total": 36,
"fetch_time_in_millis": 3209,
"fetch_current": 0,
"scroll_total": 0,
"scroll_time_in_millis": 0,
"scroll_current": 0,
"suggest_total": 0,
"suggest_time_in_millis": 0,
"suggest_current": 0
},
"merges": {
"current": 0,
"current_docs": 0,
"current_size_in_bytes": 0,
"total": 76,
"total_time_in_millis": 350987,
"total_docs": 45409,
"total_size_in_bytes": 4027595474,
"total_stopped_time_in_millis": 0,
"total_throttled_time_in_millis": 48633,
"total_auto_throttle_in_bytes": 82233108
},
"refresh": {
"total": 857,
"total_time_in_millis": 2994887,
"listeners": 0
},
"flush": {
"total": 15,
"total_time_in_millis": 291939
},
"warmer": {
"current": 0,
"total": 876,
"total_time_in_millis": 534
},
"query_cache": {
"memory_size_in_bytes": 0,
"total_count": 0,
"hit_count": 0,
"miss_count": 0,
"cache_size": 0,
"cache_count": 0,
"evictions": 0
},
"fielddata": {
"memory_size_in_bytes": 24808,
"evictions": 0
},
"completion": {
"size_in_bytes": 0
},
"segments": {
"count": 139,
"memory_in_bytes": 186032131,
"terms_memory_in_bytes": 185758725,
"stored_fields_memory_in_bytes": 43976,
"term_vectors_memory_in_bytes": 0,
"norms_memory_in_bytes": 77888,
"points_memory_in_bytes": 714,
"doc_values_memory_in_bytes": 150828,
"index_writer_memory_in_bytes": 1316180948,
"version_map_memory_in_bytes": 42250,
"fixed_bit_set_memory_in_bytes": 0,
"max_unsafe_auto_id_timestamp": -1,
"file_sizes": {
}
},
"translog": {
"operations": 11997,
"size_in_bytes": 5555179
},
"request_cache": {
"memory_size_in_bytes": 0,
"evictions": 0,
"hit_count": 195,
"miss_count": 195
},
"recovery": {
"current_as_source": 0,
"current_as_target": 0,
"throttle_time_in_millis": 0
}
}
}
}
}
EDIT 1
I've discovered the source of this issue. It seems that it's the bounding box that is at fault, though I've no idea why.
Once I remove the bounding box from the data being ingested, the index is a normal size (600 documents --> 550kb), but as soon as I add the bounding box back in (with a brand new index), the size skyrockets (3,593 documents --> 1.6GB) with only 84 documents containing a bounding box.
Below is the JSON of the bounding box:
"placeBoundingBox": {
"type": "polygon",
"coordinates": [
[
[
-71.191421,
42.227797
],
[
-71.191421,
42.399542
],
[
-70.986004,
42.399542
],
[
-70.986004,
42.227797
],
[
-71.191421,
42.227797
]
]
]
}
The mapping associated with the bounding box (from calling GET /INDEX_NAME):
"placeBoundingBox": {
"type": "geo_shape",
"tree": "quadtree",
"precision": "1.0m"
}
To demonstrate that the mapping does in fact work and is creating a proper geo_shape (even though Kibana doesn't recognize it as a geo_shape), I ran the following query and got back a successful hit:
GET /_search
{
"query": {
"bool": {
"must": {
"match_all": {
}
},
"filter": {
"geo_shape": {
"placeBoundingBox": {
"shape": {
"type": "polygon",
"coordinates": [
[
[
-71.191421,
42.227797
],
[
-71.191421,
42.399542
],
[
-70.986004,
42.399542
],
[
-70.986004,
42.227797
],
[
-71.191421,
42.227797
]
]
]
},
"relation": "within"
}
}
}
}
}
}
I'd like to keep the bounding box in. Is there something wrong with either the mapping or the data? Is 1.0m too fine-grained?
The problem was the precision in the mapping, which was simply a typo (our index for Elasticsearch 2.x had the precision as 1km). One tiny letter made all the difference...
A 1 meter ("1m") precision creates an extremely bloated index.
Removing the "precision" field from the mapping altogether makes it default to 50m, which results in a well-sized index.