Details
Description
Search results with highlighting and snippets are incorrect for some documents: the searched-for words do not appear in the snippet, and the highlighting is applied to other words instead.
Documents that show wrong highlighting for a search for "subway/rapid": 1217245.json and 2514575.json
Documents that show wrong highlighting for a search for "stole": 609868.json and 109479.json
I suspected that the files were not UTF-8 encoded, but "file -I" reports them as us-ascii, which is a strict subset of UTF-8, so encoding should not be the cause.
Wills-MacBook-Pro:fts will$ file -I ~/datasets/json/1217245.json
/Users/will/datasets/json/1217245.json: text/plain; charset=us-ascii
Wills-MacBook-Pro:fts will$ file -I ~/datasets/json/2514575.json
/Users/will/datasets/json/2514575.json: text/plain; charset=us-ascii
Wills-MacBook-Pro:fts will$ file -I ~/datasets/json/609868.json
/Users/will/datasets/json/609868.json: text/plain; charset=us-ascii
Wills-MacBook-Pro:fts will$ file -I ~/datasets/json/109479.json
/Users/will/datasets/json/109479.json: text/plain; charset=us-ascii
Index definition:
{
  "type": "fulltext-index",
  "name": "reviews",
  "uuid": "7f584d644ac8a7c7",
  "sourceType": "couchbase",
  "sourceName": "reviews",
  "sourceUUID": "7b00f8b84c36de0ba10a44ff5ce5301b",
  "planParams": {
    "maxPartitionsPerPIndex": 32,
    "numReplicas": 0,
    "hierarchyRules": null,
    "nodePlanParams": null,
    "pindexWeights": null,
    "planFrozen": false
  },
  "params": {
    "mapping": {
      "analysis": {
        "analyzers": {},
        "char_filters": {},
        "token_filters": {},
        "token_maps": {},
        "tokenizers": {}
      },
      "byte_array_converter": "json",
      "default_analyzer": "standard",
      "default_datetime_parser": "dateTimeOptional",
      "default_field": "_all",
      "default_mapping": {
        "display_order": "0",
        "dynamic": true,
        "enabled": true,
        "fields": [],
        "properties": {
          "Reviews": {
            "display_order": "0",
            "dynamic": false,
            "enabled": true,
            "fields": [],
            "properties": {
              "Content": {
                "dynamic": false,
                "enabled": true,
                "fields": [
                  {
                    "analyzer": "",
                    "date_format": null,
                    "display_order": "0",
                    "include_in_all": true,
                    "include_term_vectors": true,
                    "index": true,
                    "name": "Content",
                    "store": true,
                    "type": "text"
                  }
                ],
                "properties": {}
              }
            }
          }
        }
      },
      "default_type": "_default",
      "type_field": "type",
      "types": {}
    },
    "store": {
      "kvStoreName": "forestdb"
    }
  },
  "sourceParams": {
    "authPassword": "",
    "authSaslPassword": "",
    "authSaslUser": "",
    "authUser": "reviews",
    "clusterManagerBackoffFactor": 0,
    "clusterManagerSleepInitMS": 0,
    "clusterManagerSleepMaxMS": 2000,
    "dataManagerBackoffFactor": 0,
    "dataManagerSleepInitMS": 0,
    "dataManagerSleepMaxMS": 2000,
    "feedBufferAckThreshold": 0,
    "feedBufferSizeBytes": 0
  }
}
Attachments
Issue Links
- depends on
-
MB-18712 unexpected forestdb iterator behavior
- Resolved
For Gerrit Dashboard: MB-18219 | ||||||
---|---|---|---|---|---|---|
# | Subject | Branch | Project | Status | CR | V |
60446,2 | bump bleve SHA as part of MB-18219 | master | manifest | Status: MERGED | +2 | +1 |