hugo-theme-relearn/static/js/orama-adapter.js
Sören Weber f986a7dc40
Some checks failed
docs-build-deployment / Run deploy (push) Has been cancelled
docs-build / Run build (push) Has been cancelled
orama: test different parameter #407
for now PT15 seems to generate the best results for the exampleSite
2024-10-27 12:38:35 +01:00

99 lines
3 KiB
JavaScript

import { create, search as oramaSearch, insertMultiple } from "https://cdn.jsdelivr.net/npm/@orama/orama@latest/+esm";
import { pluginQPS } from 'https://cdn.jsdelivr.net/npm/@orama/plugin-qps@latest/+esm'
import { pluginPT15 } from 'https://cdn.jsdelivr.net/npm/@orama/plugin-pt15@latest/+esm'
//import { pluginEmbeddings } from 'https://cdn.jsdelivr.net/npm/@orama/plugin-embeddings@latest/+esm'
//import * as tf from 'https://cdn.jsdelivr.net/npm/@tensorflow/tfjs-core';
//import 'https://cdn.jsdelivr.net/npm/@tensorflow/tfjs-backend-webgl';
//import { createTokenizer } from '@orama/tokenizers/japanese'
//import { stopwords as japaneseStopwords } from "@orama/stopwords/japanese";
let searchEngine = null;
async function init() {
async function initIndex( index ){
/*
const embeddings = await pluginEmbeddings({
embeddings: {
// Property used to store generated embeddings. Must be defined in the schema.
defaultProperty: 'embeddings',
onInsert: {
// Generate embeddings at insert-time.
// Turn off if you're inserting documents with embeddings already generated.
generate: true,
// Properties to use for generating embeddings at insert time.
// These properties will be concatenated and used to generate embeddings.
properties: ['description'],
verbose: true,
}
}
});
*/
searchEngine = await create({
schema: {
title: 'string',
content: 'string',
uri: 'string',
breadcrumb: 'string',
description: 'string',
tags: 'string[]',
// embeddings: 'vector[1]'
},
plugins: [
// embeddings,
// pluginQPS()
pluginPT15()
],
/*
defaultLanguage: 'french',
components: {
tokenizer: {
stemmingFn: stemmer,
},
},
*/
});
await insertMultiple(searchEngine, index);
window.relearn.isSearchEngineReady = true;
window.relearn.executeInitialSearch();
}
if( window.index_js_url ){
var js = document.createElement("script");
js.src = index_js_url;
js.setAttribute("async", "");
js.onload = function(){
initIndex(relearn_searchindex);
};
js.onerror = function(e){
console.error('Error getting Hugo index file');
};
document.head.appendChild(js);
}
}
async function search( term ){
const searchResponse = await oramaSearch(searchEngine, {
// mode: 'hybrid', // vector search seems not to work
term: term,
properties: '*',
threshold: 0, // only show results where all keywords were found
limit: 99,
boost: { // doesn't seem to make a difference in score
tags: 1.8,
title: 1.5,
descriptoin: 1.3,
breadcrumb: 1.2,
},
// distinctOn: 'title', // just to filter out changelog/releasenotes if having the same title
// exact: true, // not for PT15
// tolerance: 1, // not for PT15
});
console.log( "new term", term )
searchResponse.hits.forEach( hit => console.log(hit.score, hit.document.uri) );
return searchResponse.hits.map( hit => ({ matches: [ term, ...term.split(' ') ], page: hit.document }) );
}
export { init, search };