"Snippets much better"
This commit is contained in:
parent
ac74c809eb
commit
fd032a7d12
|
@ -413,7 +413,7 @@ export default Archivist;
|
||||||
const flatDoc = await send("DOMSnapshot.captureSnapshot", {
|
const flatDoc = await send("DOMSnapshot.captureSnapshot", {
|
||||||
computedStyles: [],
|
computedStyles: [],
|
||||||
}, sessionId);
|
}, sessionId);
|
||||||
const pageText = processDoc(flatDoc);
|
const pageText = processDoc(flatDoc).replace(/\t\n/g, ' ');
|
||||||
|
|
||||||
const {title, url} = Targets.get(sessionId);
|
const {title, url} = Targets.get(sessionId);
|
||||||
let id, ndx_id;
|
let id, ndx_id;
|
||||||
|
|
|
@ -2,9 +2,9 @@ import ukkonen from 'ukkonen';
|
||||||
import {DEBUG} from './common.js';
|
import {DEBUG} from './common.js';
|
||||||
|
|
||||||
const MAX_ACCEPT_SCORE = 0.5;
|
const MAX_ACCEPT_SCORE = 0.5;
|
||||||
const CHUNK_SIZE = 24;
|
const CHUNK_SIZE = 12;
|
||||||
|
|
||||||
//testHighlighter();
|
testHighlighter();
|
||||||
|
|
||||||
function params(qLength, chunkSize) {
|
function params(qLength, chunkSize) {
|
||||||
const MaxDist = CHUNK_SIZE;
|
const MaxDist = CHUNK_SIZE;
|
||||||
|
@ -216,5 +216,5 @@ function testHighlighter() {
|
||||||
46 points by helsinkiandrew 8 hours ago | hide | 17 comments
|
46 points by helsinkiandrew 8 hours ago | hide | 17 comments
|
||||||
More
|
More
|
||||||
`
|
`
|
||||||
), null, 2));
|
).map(({fragment:{text,offset}}) => offset + ':' + text), null, 2));
|
||||||
}
|
}
|
||||||
|
|
|
@ -65,6 +65,7 @@ function addHandlers() {
|
||||||
} else {
|
} else {
|
||||||
results.forEach(r => {
|
results.forEach(r => {
|
||||||
r.snippet = highlight(query, r.content, {maxLength:MAX_HIGHLIGHTABLE_LENGTH})
|
r.snippet = highlight(query, r.content, {maxLength:MAX_HIGHLIGHTABLE_LENGTH})
|
||||||
|
.sort(({fragment:{offset:a}}, {fragment:{offset:b}}) => a-b)
|
||||||
.map(hl => Archivist.findOffsets(query, hl.fragment.text))
|
.map(hl => Archivist.findOffsets(query, hl.fragment.text))
|
||||||
.join(' ... ');
|
.join(' ... ');
|
||||||
});
|
});
|
||||||
|
|
1
todo
1
todo
|
@ -1,3 +1,4 @@
|
||||||
|
- get snippets earlier (before rendering in lib server) and use to add to signal
|
||||||
- implement trigram index
|
- implement trigram index
|
||||||
- try an exact match on the query term if possible for highlight. first one.
|
- try an exact match on the query term if possible for highlight. first one.
|
||||||
- we could also add signal from the highlighting to just in time alter the order (e.g. 'hell wiki' search brings google search to top rank, but the Hell wikipedia page has more highlight visible)
|
- we could also add signal from the highlighting to just in time alter the order (e.g. 'hell wiki' search brings google search to top rank, but the Hell wikipedia page has more highlight visible)
|
||||||
|
|
Loading…
Reference in New Issue