拼音分词插件(elasticsearch-analysis-pinyin)Git 地址:https://github.com/medcl/elasticsearch-analysis-pinyin
# Create the `doctor` index (one primary shard) and register `pinyin_analyzer`,
# an analyzer backed by the `my_pinyin` tokenizer of type `pinyin`.
# Option values use native JSON booleans/numbers instead of quoted strings.
PUT /doctor
{
  "settings": {
    "number_of_shards": 1,
    "analysis": {
      "analyzer": {
        "pinyin_analyzer": {
          "tokenizer": "my_pinyin"
        }
      },
      "tokenizer": {
        "my_pinyin": {
          "type": "pinyin",
          "lowercase": true,
          "keep_original": false,
          "keep_first_letter": true,
          "keep_separate_first_letter": true,
          "limit_first_letter_length": 16,
          "keep_full_pinyin": true,
          "keep_none_chinese_in_joined_full_pinyin": true,
          "keep_joined_full_pinyin": true
        }
      }
    }
  }
}
# Run the sample text through `pinyin_analyzer` on the `doctor` index
# and return the tokens it produces.
POST /doctor/_analyze
{
  "analyzer": "pinyin_analyzer",
  "text": "刘德华2019"
}
结果:
{
  "tokens": [
    {
      "token": "l",
      "start_offset": 0,
      "end_offset": 0,
      "type": "word",
      "position": 0
    },
    {
      "token": "liu",
      "start_offset": 0,
      "end_offset": 0,
      "type": "word",
      "position": 0
    },
    {
      "token": "d",
      "start_offset": 0,
      "end_offset": 0,
      "type": "word",
      "position": 1
    },
    {
      "token": "de",
      "start_offset": 0,
      "end_offset": 0,
      "type": "word",
      "position": 1
    },
    {
      "token": "h",
      "start_offset": 0,
      "end_offset": 0,
      "type": "word",
      "position": 2
    },
    {
      "token": "hua",
      "start_offset": 0,
      "end_offset": 0,
      "type": "word",
      "position": 2
    },
    {
      "token": "2019",
      "start_offset": 0,
      "end_offset": 0,
      "type": "word",
      "position": 3
    },
    {
      "token": "liudehua2019",
      "start_offset": 0,
      "end_offset": 0,
      "type": "word",
      "position": 3
    },
    {
      "token": "ldh2019",
      "start_offset": 0,
      "end_offset": 0,
      "type": "word",
      "position": 3
    }
  ]
}
原创声明:本文系作者授权腾讯云开发者社区发表,未经许可,不得转载。
如有侵权,请联系 cloudcommunity@tencent.com 删除。