elasticsearch,faceted-search,Lucene,Full Text Search,elasticsearch,Faceted Search

Lucene index.cache.field.max_size无法限制elasticsearch中的字段数据缓存

Lucene index.cache.field.max_size无法限制elasticsearch中的字段数据缓存,lucene,full-text-search,elasticsearch,faceted-search,Lucene,Full Text Search,elasticsearch,Faceted Search,我试图通过在config/elasticsearch.yml文件中设置index.cache.field.max_size: NUMBER来限制字段缓存(resident类型)。我有大约100万条记录,并在7个字段(所有字段都包含大量文本数据)上执行分面(facet)操作,以构建一个“词云”。 无论为index.cache.field.max_size指定什么值(1000或100000),堆内存(已分配15 GB)都会被不断消耗。我做错了什么? 另外,有没有比对如此大量的文本数据执行分面更好的方法来构建词云? 映射: cur

我试图通过在
config/elasticsearch.yml
文件中设置
index.cache.field.max_size:NUMBER
来限制字段缓存(resident 类型)。我有大约100万条记录,并在7个字段(所有字段都包含大量文本数据)上执行分面(facet)操作,以构建一个“词云”。

无论为 index.cache.field.max_size 指定什么值(1000 或 100000),堆内存(已分配 15 GB)都会被不断消耗。我做错了什么? 另外,有没有比对如此大量的文本数据执行分面(facet)更好的方法来构建词云?

映射:

 curl -XPOST http://localhost:9200/monitoring/ -d '
{
  "settings":{
    "index":{
      "number_of_shards":5,
      "number_of_replicas":1
    },
    "analysis":{
      "filter":{
        "myCustomShingle":{
          "type":"shingle",
          "max_shingle_size":3,
          "output_unigrams":true
        },
        "myCustomStop":{
          "type":"stop",
          "stopwords":["a","about","abov ... ]
        }
      },
      "analyzer":{
        "myAnalyzer":{
          "type":"custom",
          "tokenizer":"standard",
          "filter":[
            "lowercase",
            "myCustomShingle",
            "stop",
            "myCustomStop"
          ]
        }
      }
    }
  },
  "mappings":{
    "mention_reports":{
      "_source":{
        "enabled":true
      },
      "_all":{
        "enabled":false
      },
      "index.query.default_field":"post_message",
      "properties":{
      "id":{
        "type":"string",
        "index":"not_analyzed",
        "include_in_all" : "false",
        "null_value" : "null"
      },
      "creation_time":{
        "type":"date"
      },
      "field1":{
        "type":"string",
        "analyzer":"standard",
        "include_in_all":"false",
        "null_value":0
      },
      "field2":{
        "type":"string",
        "index":"not_analyzed",
        "include_in_all":"false",
        "null_value":"null"
      },

            . . .


        "field7":{
          "type":"string",
          "analyzer":"myAnalyzer",
          "term_vector":"with_positions_offsets",
          "null_value" : "null"
        }                                           

      }
    }
  }
}
'

你使用的 Elasticsearch 版本是什么?
 curl -XPOST http://localhost:9200/monitoring/ -d '
{
  "settings":{
    "index":{
      "number_of_shards":5,
      "number_of_replicas":1
    },
    "analysis":{
      "filter":{
        "myCustomShingle":{
          "type":"shingle",
          "max_shingle_size":3,
          "output_unigrams":true
        },
        "myCustomStop":{
          "type":"stop",
          "stopwords":["a","about","abov ... ]
        }
      },
      "analyzer":{
        "myAnalyzer":{
          "type":"custom",
          "tokenizer":"standard",
          "filter":[
            "lowercase",
            "myCustomShingle",
            "stop",
            "myCustomStop"
          ]
        }
      }
    }
  },
  "mappings":{
    "mention_reports":{
      "_source":{
        "enabled":true
      },
      "_all":{
        "enabled":false
      },
      "index.query.default_field":"post_message",
      "properties":{
      "id":{
        "type":"string",
        "index":"not_analyzed",
        "include_in_all" : "false",
        "null_value" : "null"
      },
      "creation_time":{
        "type":"date"
      },
      "field1":{
        "type":"string",
        "analyzer":"standard",
        "include_in_all":"false",
        "null_value":0
      },
      "field2":{
        "type":"string",
        "index":"not_analyzed",
        "include_in_all":"false",
        "null_value":"null"
      },

            . . .


        "field7":{
          "type":"string",
          "analyzer":"myAnalyzer",
          "term_vector":"with_positions_offsets",
          "null_value" : "null"
        }                                           

      }
    }
  }
}
'