Skip to content

Instantly share code, notes, and snippets.

@quoeamaster
Created April 14, 2022 11:16
Show Gist options
  • Save quoeamaster/8bc3f943ea47f8103776474c8873cfe6 to your computer and use it in GitHub Desktop.
Save quoeamaster/8bc3f943ea47f8103776474c8873cfe6 to your computer and use it in GitHub Desktop.
/* Create the courses-03 index with custom analysis settings and field mappings. */
/* email_dot_replacer rewrites "." to "-" before tokenization (used by ana_email_fixer). */
/* The comments field is analyzed with email_extractor; its email sub-field uses ana_email_fixer. */
PUT courses-03/
{
  "settings": {
    "analysis": {
      "char_filter": {
        "email_dot_replacer": {
          "type": "mapping",
          "mappings": [
            ". => -"
          ]
        }
      },
      "analyzer": {
        "ana_email_fixer": {
          "type": "custom",
          "char_filter": [ "email_dot_replacer" ],
          "tokenizer": "standard",
          "filter": [ "lowercase" ]
        },
        "email_extractor": {
          "tokenizer": "uax_url_email",
          "filter": [ "lowercase" ]
        }
      }
    }
  },
  "mappings": {
    "properties": {
      "comments": {
        "type": "text",
        "analyzer": "email_extractor",
        "fields": {
          "email": {
            "type": "text",
            "analyzer": "ana_email_fixer"
          }
        }
      }
    }
  }
}
/* test: run the email_extractor analyzer on a sample sentence containing two email addresses */
POST courses-03/_analyze
{
  "analyzer": "email_extractor",
  "text": [
    "if you think the course is nice and wanna comment, please send an email to -> donna.karen@uni.gov or jojo.star.crusade@uni.gov . Thx~"
  ]
}
...
/* result (abridged: each "..." line stands for omitted tokens) */
{
  "tokens" : [
    {
      "token" : "if",
      "start_offset" : 0,
      "end_offset" : 2,
      "type" : "<ALPHANUM>",
      "position" : 0
    },
    ...
    {
      "token" : "donna.karen@uni.gov",
      "start_offset" : 78,
      "end_offset" : 97,
      "type" : "<EMAIL>",
      "position" : 15
    },
    ...
    {
      "token" : "jojo.star.crusade@uni.gov",
      "start_offset" : 101,
      "end_offset" : 126,
      "type" : "<EMAIL>",
      "position" : 17
    }
    ...
  ]
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment