PUT explorasim
{
  "settings": {
    "analysis": {
      "char_filter": {
        "numeros": {
          "type": "pattern_replace",
          "pattern": "(\\d+)[\\.\\-\\/\\:](?=\\d)",
          "replacement": "$1_"
        }
      },
      "filter": {
        "sinonimos": {
          "type": "synonym",
          "lenient": false,
          "expand": true,
          "synonyms": [
            "art, artig, artigos, artigo => art, artig, artigos, artigo",
            "home, apartamento, moradia, casa => home, apartamento, moradia, casa",
            "lei, norma, normativo, projeto de lei, regulamento => lei, norma, normativo, projeto de lei, regulamento"
          ]
        }
      },
      "analyzer": {
        "simple_analyzer": {
          "tokenizer": "uax_url_email",
          "char_filter": [
            "numeros"
          ],
          "filter": [
            "lowercase",
            "asciifolding",
            "sinonimos"
          ]
        },
        "raw_analyzer": {
          "tokenizer": "uax_url_email",
          "char_filter": [
            "numeros"
          ],
          "filter": [
            "lowercase",
            "asciifolding"
          ]
        },
        "stemmed_analyzer": {
          "tokenizer": "uax_url_email",
          "char_filter": [
            "numeros"
          ],
          "filter": [
            "lowercase",
            "asciifolding",
            "keyword_repeat",
            "brazilian_stem",
            "remove_duplicates"
          ]
        }
      }
    }
  },
  "mappings": {
    "properties": {
      "pasta": {
        "type": "keyword"
      },
      "arquivo": {
        "type": "keyword"
      },
      "grupo": {
        "type": "keyword"
      },
      "grupo_sim": {
        "type": "integer"
      },
      "vetor": {
        "type": "dense_vector",
        "dims": 300
      },
      "texto": {
        "type": "text",
        "analyzer": "simple_analyzer",
        "term_vector": "with_positions_offsets",
        "fields": {
          "stemmed": {
            "type": "text",
            "analyzer": "stemmed_analyzer",
            "term_vector": "with_positions_offsets"
          },
          "raw": {
            "type": "text",
            "analyzer": "raw_analyzer",
            "term_vector": "with_positions_offsets"
          }
        }
      },
      "dthr_vetor": {
        "type": "date",
        "format": "yyyy-MM-dd HH:mm:ss||yyyy-MM-dd||epoch_millis"
      }
    }
  }
}