Skip to content

Instantly share code, notes, and snippets.

@cawoodm
Last active August 26, 2019 11:46
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save cawoodm/d2139ee00c8d31d392ef58e8eb08639d to your computer and use it in GitHub Desktop.
Save cawoodm/d2139ee00c8d31d392ef58e8eb08639d to your computer and use it in GitHub Desktop.
Explanation of Rankings
The explanation of "UVV 00155 099" (scoring 15.364279) is:
{
"_shard": "[myindex][0]",
"_node": "6tgOP8JVSmai0c0uR_Co7g",
"_index": "myindex",
"_type": "_doc",
"_id": "UVV -00155-099",
"_score": 15.364279,
"_source": {
"sparepart": false,
"stackable": false,
"text_en": "UVV 00155 099 x",
"part": "UVV -00155-099",
"matnr": "UVV 00155099",
"typ": "part",
"matnrT": "UVV 00155 099",
"text_de": "UVV 00155 099 NORD-Stirnradgetr.Motor 0,55kW"
},
"_explanation": {
"value": 15.364279,
"description": "sum of:",
"details": [
{
"value": 3.7968116,
"description": "weight(text_en:uvv in 15981) [PerFieldSimilarity], result of:",
"details": [
{
"value": 3.7968116,
"description": "score(freq=1.0), product of:",
"details": [
{
"value": 2.2,
"description": "boost",
"details": []
},
{
"value": 2.7486653,
"description": "idf, computed as log(1 + (N - n + 0.5) / (n + 0.5)) from:",
"details": [
{
"value": 64497,
"description": "n, number of documents containing term",
"details": []
},
{
"value": 1007564,
"description": "N, total number of documents with field",
"details": []
}
]
},
{
"value": 0.6278769,
"description": "tf, computed as freq / (freq + k1 * (1 - b + b * dl / avgdl)) from:",
"details": [
{
"value": 1.0,
"description": "freq, occurrences of term within document",
"details": []
},
{
"value": 1.2,
"description": "k1, term saturation parameter",
"details": []
},
{
"value": 0.75,
"description": "b, length normalization parameter",
"details": []
},
{
"value": 5.0,
"description": "dl, length of field",
"details": []
},
{
"value": 15.375735,
"description": "avgdl, average length of field",
"details": []
}
]
}
]
}
]
},
{
"value": 11.567467,
"description": "weight(text_en:099 in 15981) [PerFieldSimilarity], result of:",
"details": [
{
"value": 11.567467,
"description": "score(freq=1.0), product of:",
"details": [
{
"value": 2.2,
"description": "boost",
"details": []
},
{
"value": 8.374157,
"description": "idf, computed as log(1 + (N - n + 0.5) / (n + 0.5)) from:",
"details": [
{
"value": 232,
"description": "n, number of documents containing term",
"details": []
},
{
"value": 1007564,
"description": "N, total number of documents with field",
"details": []
}
]
},
{
"value": 0.6278769,
"description": "tf, computed as freq / (freq + k1 * (1 - b + b * dl / avgdl)) from:",
"details": [
{
"value": 1.0,
"description": "freq, occurrences of term within document",
"details": []
},
{
"value": 1.2,
"description": "k1, term saturation parameter",
"details": []
},
{
"value": 0.75,
"description": "b, length normalization parameter",
"details": []
},
{
"value": 5.0,
"description": "dl, length of field",
"details": []
},
{
"value": 15.375735,
"description": "avgdl, average length of field",
"details": []
}
]
}
]
}
]
}
]
}
}
The explanation of "UVV 00031 099" (scoring 13.41111) is:
{
"_shard": "[myindex][0]",
"_node": "6tgOP8JVSmai0c0uR_Co7g",
"_index": "myindex",
"_type": "_doc",
"_id": "UVV -00031-099",
"_score": 13.41111,
"_source": {
"sparepart": false,
"stackable": false,
"text_en": "UVV 00031 099 Filterschlauch L=1800MM Nadelfilz Acryl",
"part": "UVV -00031-099",
"matnr": "UVV 00031099",
"typ": "part",
"matnrT": "UVV 00031 099",
"text_de": "UVV 00031 099 Filterschlauch L=1800MM Nadelfilz Acryl"
},
"_explanation": {
"value": 13.41111,
"description": "sum of:",
"details": [
{
"value": 1.9415544,
"description": "weight(text_en:uvv in 71582) [PerFieldSimilarity], result of:",
"details": [
{
"value": 1.9415544,
"description": "score(freq=1.0), product of:",
"details": [
{
"value": 2.2,
"description": "boost",
"details": []
},
{
"value": 2.7486653,
"description": "idf, computed as log(1 + (N - n + 0.5) / (n + 0.5)) from:",
"details": [
{
"value": 64497,
"description": "n, number of documents containing term",
"details": []
},
{
"value": 1007564,
"description": "N, total number of documents with field",
"details": []
}
]
},
{
"value": 0.32107392,
"description": "tf, computed as freq / (freq + k1 * (1 - b + b * dl / avgdl)) from:",
"details": [
{
"value": 1.0,
"description": "freq, occurrences of term within document",
"details": []
},
{
"value": 1.2,
"description": "k1, term saturation parameter",
"details": []
},
{
"value": 0.75,
"description": "b, length normalization parameter",
"details": []
},
{
"value": 31.0,
"description": "dl, length of field",
"details": []
},
{
"value": 15.375735,
"description": "avgdl, average length of field",
"details": []
}
]
}
]
}
]
},
{
"value": 5.5543637,
"description": "weight(text_en:00031 in 71582) [PerFieldSimilarity], result of:",
"details": [
{
"value": 5.5543637,
"description": "score(freq=1.0), product of:",
"details": [
{
"value": 2.2,
"description": "boost",
"details": []
},
{
"value": 7.8633313,
"description": "idf, computed as log(1 + (N - n + 0.5) / (n + 0.5)) from:",
"details": [
{
"value": 387,
"description": "n, number of documents containing term",
"details": []
},
{
"value": 1007564,
"description": "N, total number of documents with field",
"details": []
}
]
},
{
"value": 0.32107392,
"description": "tf, computed as freq / (freq + k1 * (1 - b + b * dl / avgdl)) from:",
"details": [
{
"value": 1.0,
"description": "freq, occurrences of term within document",
"details": []
},
{
"value": 1.2,
"description": "k1, term saturation parameter",
"details": []
},
{
"value": 0.75,
"description": "b, length normalization parameter",
"details": []
},
{
"value": 31.0,
"description": "dl, length of field",
"details": []
},
{
"value": 15.375735,
"description": "avgdl, average length of field",
"details": []
}
]
}
]
}
]
},
{
"value": 5.9151917,
"description": "weight(text_en:099 in 71582) [PerFieldSimilarity], result of:",
"details": [
{
"value": 5.9151917,
"description": "score(freq=1.0), product of:",
"details": [
{
"value": 2.2,
"description": "boost",
"details": []
},
{
"value": 8.374157,
"description": "idf, computed as log(1 + (N - n + 0.5) / (n + 0.5)) from:",
"details": [
{
"value": 232,
"description": "n, number of documents containing term",
"details": []
},
{
"value": 1007564,
"description": "N, total number of documents with field",
"details": []
}
]
},
{
"value": 0.32107392,
"description": "tf, computed as freq / (freq + k1 * (1 - b + b * dl / avgdl)) from:",
"details": [
{
"value": 1.0,
"description": "freq, occurrences of term within document",
"details": []
},
{
"value": 1.2,
"description": "k1, term saturation parameter",
"details": []
},
{
"value": 0.75,
"description": "b, length normalization parameter",
"details": []
},
{
"value": 31.0,
"description": "dl, length of field",
"details": []
},
{
"value": 15.375735,
"description": "avgdl, average length of field",
"details": []
}
]
}
]
}
]
}
]
}
}
Analysis of query "UVV 00031 099":
POST /myindex/_analyze
{
"field": "text_en",
"text": "UVV 00031 099"
}
{
"tokens": [
{
"token": "uvv",
"start_offset": 0,
"end_offset": 3,
"type": "word",
"position": 0
},
{
"token": "000",
"start_offset": 5,
"end_offset": 8,
"type": "word",
"position": 1
},
{
"token": "0003",
"start_offset": 5,
"end_offset": 9,
"type": "word",
"position": 2
},
{
"token": "00031",
"start_offset": 5,
"end_offset": 10,
"type": "word",
"position": 3
},
{
"token": "099",
"start_offset": 11,
"end_offset": 14,
"type": "word",
"position": 4
}
]
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment