2019-03-09 23:43:32 +00:00
const tsquery = require ( 'pg-tsquery' ) ( )
2019-03-24 04:27:42 +00:00
const stream = require ( 'stream' )
const Promise = require ( 'bluebird' )
const pipeline = Promise . promisify ( stream . pipeline )
/* global WIKI */
2019-03-09 05:51:02 +00:00
module . exports = {
2019-03-09 23:43:32 +00:00
async activate ( ) {
2019-03-11 04:47:27 +00:00
if ( WIKI . config . db . type !== 'postgres' ) {
throw new WIKI . Error . SearchActivationFailed ( 'Must use PostgreSQL database to activate this engine!' )
}
2019-03-09 05:51:02 +00:00
} ,
2019-03-09 23:43:32 +00:00
async deactivate ( ) {
2019-03-24 04:27:42 +00:00
WIKI . logger . info ( ` (SEARCH/POSTGRES) Dropping index tables... ` )
await WIKI . models . knex . schema . dropTable ( 'pagesWords' )
await WIKI . models . knex . schema . dropTable ( 'pagesVector' )
WIKI . logger . info ( ` (SEARCH/POSTGRES) Index tables have been dropped. ` )
2019-03-09 05:51:02 +00:00
} ,
/ * *
* INIT
* /
2019-03-09 23:43:32 +00:00
async init ( ) {
2019-03-13 06:52:08 +00:00
WIKI . logger . info ( ` (SEARCH/POSTGRES) Initializing... ` )
2019-03-10 06:28:58 +00:00
// -> Create Search Index
2019-03-09 23:43:32 +00:00
const indexExists = await WIKI . models . knex . schema . hasTable ( 'pagesVector' )
if ( ! indexExists ) {
2019-03-13 06:52:08 +00:00
WIKI . logger . info ( ` (SEARCH/POSTGRES) Creating Pages Vector table... ` )
2019-03-09 23:43:32 +00:00
await WIKI . models . knex . schema . createTable ( 'pagesVector' , table => {
table . increments ( )
table . string ( 'path' )
table . string ( 'locale' )
table . string ( 'title' )
table . string ( 'description' )
2019-03-10 06:28:58 +00:00
table . specificType ( 'tokens' , 'TSVECTOR' )
2019-03-24 04:27:42 +00:00
table . text ( 'content' )
2019-03-09 23:43:32 +00:00
} )
}
2019-03-10 06:28:58 +00:00
// -> Create Words Index
const wordsExists = await WIKI . models . knex . schema . hasTable ( 'pagesWords' )
if ( ! wordsExists ) {
2019-03-13 06:52:08 +00:00
WIKI . logger . info ( ` (SEARCH/POSTGRES) Creating Words Suggestion Index... ` )
2019-03-10 06:28:58 +00:00
await WIKI . models . knex . raw ( `
CREATE TABLE "pagesWords" AS SELECT word FROM ts _stat (
2019-03-24 16:51:52 +00:00
'SELECT to_tsvector(' 'simple' ', "title") || to_tsvector(' 'simple' ', "description") || to_tsvector(' 'simple' ', "content") FROM "pagesVector"'
2019-03-10 06:28:58 +00:00
) ` )
await WIKI . models . knex . raw ( 'CREATE EXTENSION IF NOT EXISTS pg_trgm' )
await WIKI . models . knex . raw ( ` CREATE INDEX "pageWords_idx" ON "pagesWords" USING GIN (word gin_trgm_ops) ` )
}
2019-03-13 06:52:08 +00:00
WIKI . logger . info ( ` (SEARCH/POSTGRES) Initialization completed. ` )
2019-03-09 05:51:02 +00:00
} ,
/ * *
* QUERY
*
* @ param { String } q Query
* @ param { Object } opts Additional options
* /
async query ( q , opts ) {
2019-03-09 23:43:32 +00:00
try {
2019-03-10 06:28:58 +00:00
let suggestions = [ ]
2019-03-09 23:43:32 +00:00
const results = await WIKI . models . knex . raw ( `
SELECT id , path , locale , title , description
FROM "pagesVector" , to _tsquery ( ? ) query
2019-03-10 06:28:58 +00:00
WHERE query @ @ "tokens"
ORDER BY ts _rank ( tokens , query ) DESC
2019-03-09 23:43:32 +00:00
` , [tsquery(q)])
2019-03-10 06:28:58 +00:00
if ( results . rows . length < 5 ) {
const suggestResults = await WIKI . models . knex . raw ( ` SELECT word, word <-> ? AS rank FROM "pagesWords" WHERE similarity(word, ?) > 0.2 ORDER BY rank LIMIT 5; ` , [ q , q ] )
suggestions = suggestResults . rows . map ( r => r . word )
}
2019-03-09 23:43:32 +00:00
return {
results : results . rows ,
2019-03-10 06:28:58 +00:00
suggestions ,
2019-03-09 23:43:32 +00:00
totalHits : results . rows . length
}
} catch ( err ) {
WIKI . logger . warn ( 'Search Engine Error:' )
WIKI . logger . warn ( err )
}
2019-03-09 05:51:02 +00:00
} ,
/ * *
* CREATE
*
* @ param { Object } page Page to create
* /
async created ( page ) {
2019-03-09 23:43:32 +00:00
await WIKI . models . knex . raw ( `
2019-03-24 04:27:42 +00:00
INSERT INTO "pagesVector" ( path , locale , title , description , "tokens" ) VALUES (
? , ? , ? , ? , ( setweight ( to _tsvector ( '${this.config.dictLanguage}' , ? ) , 'A' ) || setweight ( to _tsvector ( '${this.config.dictLanguage}' , ? ) , 'B' ) || setweight ( to _tsvector ( '${this.config.dictLanguage}' , ? ) , 'C' ) )
2019-03-09 23:43:32 +00:00
)
2019-03-24 04:27:42 +00:00
` , [page.path, page.localeCode, page.title, page.description, page.title, page.description, page.safeContent])
2019-03-09 05:51:02 +00:00
} ,
/ * *
* UPDATE
*
* @ param { Object } page Page to update
* /
async updated ( page ) {
2019-03-09 23:43:32 +00:00
await WIKI . models . knex . raw ( `
UPDATE "pagesVector" SET
2019-03-11 04:47:27 +00:00
title = ? ,
description = ? ,
tokens = ( setweight ( to _tsvector ( '${this.config.dictLanguage}' , ? ) , 'A' ) ||
setweight ( to _tsvector ( '${this.config.dictLanguage}' , ? ) , 'B' ) ||
setweight ( to _tsvector ( '${this.config.dictLanguage}' , ? ) , 'C' ) )
WHERE path = ? AND locale = ?
2019-03-24 04:27:42 +00:00
` , [page.title, page.description, page.title, page.description, page.safeContent, page.path, page.localeCode])
2019-03-09 05:51:02 +00:00
} ,
/ * *
* DELETE
*
* @ param { Object } page Page to delete
* /
async deleted ( page ) {
2019-03-09 23:43:32 +00:00
await WIKI . models . knex ( 'pagesVector' ) . where ( {
2019-03-11 04:47:27 +00:00
locale : page . localeCode ,
2019-03-09 23:43:32 +00:00
path : page . path
} ) . del ( ) . limit ( 1 )
2019-03-09 05:51:02 +00:00
} ,
/ * *
* RENAME
*
* @ param { Object } page Page to rename
* /
async renamed ( page ) {
2019-03-09 23:43:32 +00:00
await WIKI . models . knex ( 'pagesVector' ) . where ( {
2019-03-11 04:47:27 +00:00
locale : page . localeCode ,
2019-03-09 23:43:32 +00:00
path : page . sourcePath
} ) . update ( {
2019-10-13 23:59:50 +00:00
locale : page . destinationLocaleCode ,
2019-03-09 23:43:32 +00:00
path : page . destinationPath
2019-03-11 04:47:27 +00:00
} )
2019-03-09 05:51:02 +00:00
} ,
/ * *
* REBUILD INDEX
* /
async rebuild ( ) {
2019-03-13 06:52:08 +00:00
WIKI . logger . info ( ` (SEARCH/POSTGRES) Rebuilding Index... ` )
2019-03-09 23:43:32 +00:00
await WIKI . models . knex ( 'pagesVector' ) . truncate ( )
2019-03-24 04:27:42 +00:00
await WIKI . models . knex ( 'pagesWords' ) . truncate ( )
await pipeline (
WIKI . models . knex . column ( 'path' , 'localeCode' , 'title' , 'description' , 'render' ) . select ( ) . from ( 'pages' ) . where ( {
isPublished : true ,
isPrivate : false
} ) . stream ( ) ,
new stream . Transform ( {
objectMode : true ,
transform : async ( page , enc , cb ) => {
const content = WIKI . models . pages . cleanHTML ( page . render )
await WIKI . models . knex . raw ( `
INSERT INTO "pagesVector" ( path , locale , title , description , "tokens" , content ) VALUES (
? , ? , ? , ? , ( setweight ( to _tsvector ( '${this.config.dictLanguage}' , ? ) , 'A' ) || setweight ( to _tsvector ( '${this.config.dictLanguage}' , ? ) , 'B' ) || setweight ( to _tsvector ( '${this.config.dictLanguage}' , ? ) , 'C' ) ) , ?
)
` , [page.path, page.localeCode, page.title, page.description, page.title, page.description, content, content])
cb ( )
}
} )
)
2019-03-09 23:43:32 +00:00
await WIKI . models . knex . raw ( `
2019-03-24 04:27:42 +00:00
INSERT INTO "pagesWords" ( word )
SELECT word FROM ts _stat (
'SELECT to_tsvector(' 'simple' ', "title") || to_tsvector(' 'simple' ', "description") || to_tsvector(' 'simple' ', "content") FROM "pagesVector"'
)
` )
2019-03-13 06:52:08 +00:00
WIKI . logger . info ( ` (SEARCH/POSTGRES) Index rebuilt successfully. ` )
2019-03-09 05:51:02 +00:00
}
}