2023-05-29 05:34:18 +02:00
import { Health , MeiliSearch , Stats } from "meilisearch" ;
import { dbLogger } from "./logger.js" ;
2023-05-25 00:55:33 +02:00
import config from "@/config/index.js" ;
2023-05-29 05:34:18 +02:00
import { Note } from "@/models/entities/note.js" ;
2023-05-26 00:33:02 +02:00
import * as url from "url" ;
2023-05-29 05:34:18 +02:00
import { ILocalUser , User } from "@/models/entities/user.js" ;
import { Followings , Users } from "@/models/index.js" ;
2023-05-26 02:07:34 +02:00
2023-05-25 00:55:33 +02:00
const logger = dbLogger . createSubLogger ( "meilisearch" , "gray" , false ) ;
logger . info ( "Connecting to MeiliSearch" ) ;
const hasConfig =
2023-05-26 03:06:41 +02:00
config . meilisearch &&
( config . meilisearch . host ||
config . meilisearch . port ||
config . meilisearch . apiKey ) ;
2023-05-25 00:55:33 +02:00
const host = hasConfig ? config . meilisearch . host ? ? "localhost" : "" ;
const port = hasConfig ? config . meilisearch . port ? ? 7700 : 0 ;
const auth = hasConfig ? config . meilisearch . apiKey ? ? "" : "" ;
2023-05-26 10:12:52 +02:00
const ssl = hasConfig ? config . meilisearch . ssl ? ? false : false ;
2023-05-25 00:55:33 +02:00
2023-05-25 14:15:13 +02:00
const client : MeiliSearch = new MeiliSearch ( {
2023-05-26 10:12:52 +02:00
host : ` ${ ssl ? "https" : "http" } :// ${ host } : ${ port } ` ,
2023-05-25 02:19:42 +02:00
apiKey : auth ,
2023-05-26 03:06:41 +02:00
} ) ;
const posts = client . index ( "posts" ) ;
posts
. updateSearchableAttributes ( [ "text" ] )
. catch ( ( e ) = >
logger . error ( ` Setting searchable attr failed, searches won't work: ${ e } ` ) ,
) ;
posts
. updateFilterableAttributes ( [
"userName" ,
"userHost" ,
"mediaAttachment" ,
"createdAt" ,
2023-05-28 02:15:13 +02:00
"userId" ,
2023-05-26 03:06:41 +02:00
] )
. catch ( ( e ) = >
logger . error (
` Setting filterable attr failed, advanced searches won't work: ${ e } ` ,
) ,
) ;
2023-05-25 14:15:13 +02:00
2023-05-28 02:15:13 +02:00
posts
. updateSortableAttributes ( [ "createdAt" ] )
. catch ( ( e ) = >
logger . error (
` Setting sortable attr failed, placeholder searches won't sort properly: ${ e } ` ,
) ,
) ;
2023-05-25 00:55:33 +02:00
logger . info ( "Connected to MeiliSearch" ) ;
export type MeilisearchNote = {
id : string ;
text : string ;
userId : string ;
userHost : string ;
2023-05-25 22:29:47 +02:00
userName : string ;
2023-05-25 00:55:33 +02:00
channelId : string ;
2023-05-25 14:15:13 +02:00
mediaAttachment : string ;
2023-05-26 03:06:41 +02:00
createdAt : number ;
} ;
export default hasConfig
? {
2023-05-29 05:34:18 +02:00
search : async (
query : string ,
limit : number ,
offset : number ,
userCtx : ILocalUser | null ,
) = > {
/// Advanced search syntax
/// from:user => filter by user + optional domain
/// has:image/video/audio/text/file => filter by attachment types
/// domain:domain.com => filter by domain
/// before:Date => show posts made before Date
/// after: Date => show posts made after Date
/// "text" => get posts with exact text between quotes
/// filter:following => show results only from users you follow
/// filter:followers => show results only from followers
let constructedFilters : string [ ] = [ ] ;
let splitSearch = query . split ( " " ) ;
// Detect search operators and remove them from the actual query
let filteredSearchTerms = (
await Promise . all (
splitSearch . map ( async ( term ) = > {
if ( term . startsWith ( "has:" ) ) {
let fileType = term . slice ( 4 ) ;
constructedFilters . push ( ` mediaAttachment = " ${ fileType } " ` ) ;
return null ;
} else if ( term . startsWith ( "from:" ) ) {
let user = term . slice ( 5 ) ;
constructedFilters . push ( ` userName = ${ user } ` ) ;
return null ;
} else if ( term . startsWith ( "domain:" ) ) {
let domain = term . slice ( 7 ) ;
constructedFilters . push ( ` userHost = ${ domain } ` ) ;
return null ;
} else if ( term . startsWith ( "after:" ) ) {
let timestamp = term . slice ( 6 ) ;
// Try to parse the timestamp as JavaScript Date
let date = Date . parse ( timestamp ) ;
if ( isNaN ( date ) ) return null ;
constructedFilters . push ( ` createdAt > ${ date / 1000 } ` ) ;
return null ;
} else if ( term . startsWith ( "before:" ) ) {
let timestamp = term . slice ( 7 ) ;
// Try to parse the timestamp as JavaScript Date
let date = Date . parse ( timestamp ) ;
if ( isNaN ( date ) ) return null ;
constructedFilters . push ( ` createdAt < ${ date / 1000 } ` ) ;
return null ;
} else if ( term . startsWith ( "filter:following" ) ) {
// Check if we got a context user
if ( userCtx ) {
// Fetch user follows from DB
let followedUsers = await Followings . find ( {
where : {
followerId : userCtx.id ,
} ,
select : {
followeeId : true ,
} ,
} ) ;
let followIDs = followedUsers . map ( ( user ) = > user . followeeId ) ;
if ( followIDs . length === 0 ) return null ;
constructedFilters . push ( ` userId IN [ ${ followIDs . join ( "," ) } ] ` ) ;
} else {
logger . warn (
"search filtered to follows called without user context" ,
) ;
}
return null ;
} else if ( term . startsWith ( "filter:followers" ) ) {
// Check if we got a context user
if ( userCtx ) {
// Fetch users follows from DB
let followedUsers = await Followings . find ( {
where : {
followeeId : userCtx.id ,
} ,
select : {
followerId : true ,
} ,
} ) ;
let followIDs = followedUsers . map ( ( user ) = > user . followerId ) ;
if ( followIDs . length === 0 ) return null ;
constructedFilters . push ( ` userId IN [ ${ followIDs . join ( "," ) } ] ` ) ;
} else {
logger . warn (
"search filtered to followers called without user context" ,
) ;
}
return null ;
2023-05-28 02:15:13 +02:00
}
2023-05-29 05:34:18 +02:00
return term ;
} ) ,
)
) . filter ( ( term ) = > term !== null ) ;
2023-05-28 02:15:13 +02:00
2023-05-29 05:34:18 +02:00
let sortRules = [ ] ;
2023-05-28 02:15:13 +02:00
2023-05-29 05:34:18 +02:00
// An empty search term with defined filters means we have a placeholder search => https://www.meilisearch.com/docs/reference/api/search#placeholder-search
// These have to be ordered manually, otherwise the *oldest* posts are returned first, which we don't want
if ( filteredSearchTerms . length === 0 && constructedFilters . length > 0 ) {
sortRules . push ( "createdAt:desc" ) ;
2023-05-26 03:06:41 +02:00
}
2023-05-29 05:34:18 +02:00
logger . info ( ` Searching for ${ filteredSearchTerms . join ( " " ) } ` ) ;
logger . info ( ` Limit: ${ limit } ` ) ;
logger . info ( ` Offset: ${ offset } ` ) ;
logger . info ( ` Filters: ${ constructedFilters } ` ) ;
logger . info ( ` Ordering: ${ sortRules } ` ) ;
return posts . search ( filteredSearchTerms . join ( " " ) , {
limit : limit ,
offset : offset ,
filter : constructedFilters ,
sort : sortRules ,
} ) ;
} ,
ingestNote : async ( ingestNotes : Note | Note [ ] ) = > {
if ( ingestNotes instanceof Note ) {
ingestNotes = [ ingestNotes ] ;
}
let indexingBatch : MeilisearchNote [ ] = [ ] ;
for ( let note of ingestNotes ) {
if ( note . user === undefined ) {
note . user = await Users . findOne ( {
where : {
id : note.userId ,
} ,
} ) ;
2023-05-26 03:06:41 +02:00
}
2023-05-29 05:34:18 +02:00
let attachmentType = "" ;
if ( note . attachedFileTypes . length > 0 ) {
attachmentType = note . attachedFileTypes [ 0 ] . split ( "/" ) [ 0 ] ;
switch ( attachmentType ) {
case "image" :
case "video" :
case "audio" :
case "text" :
break ;
default :
attachmentType = "file" ;
break ;
}
}
indexingBatch . push ( < MeilisearchNote > {
id : note.id.toString ( ) ,
text : note.text ? note . text : "" ,
userId : note.userId ,
userHost :
note . userHost !== ""
? note . userHost
: url . parse ( config . host ) . host ,
channelId : note.channelId ? note . channelId : "" ,
mediaAttachment : attachmentType ,
userName : note.user?.username ? ? "UNKNOWN" ,
createdAt : note.createdAt.getTime ( ) / 1000 , // division by 1000 is necessary because Node returns in ms-accuracy
} ) ;
2023-05-25 23:49:52 +02:00
}
2023-05-29 05:34:18 +02:00
return posts
. addDocuments ( indexingBatch , {
primaryKey : "id" ,
} )
. then ( ( ) = >
console . log ( ` sent ${ indexingBatch . length } posts for indexing ` ) ,
) ;
} ,
serverStats : async ( ) = > {
let health : Health = await client . health ( ) ;
let stats : Stats = await client . getStats ( ) ;
return {
health : health.status ,
size : stats.databaseSize ,
indexed_count : stats.indexes [ "posts" ] . numberOfDocuments ,
} ;
} ,
}
2023-05-26 03:06:41 +02:00
: null ;