// stacker.news/worker/search.js
//
// 135 lines
// 3.1 KiB
// JavaScript

import { gql } from 'graphql-tag'
import search from '../api/search/index.js'
import removeMd from 'remove-markdown'
// GraphQL fragment naming the Item fields fetched for every item that gets
// indexed. It is interpolated into the queries built by indexItem and
// indexAllItems below; the resulting object (after a few tweaks in
// _indexItem) becomes the body of the search document.
const ITEM_SEARCH_FIELDS = gql`
fragment ItemSearchFields on Item {
id
parentId
createdAt
updatedAt
title
text
url
userId
user {
name
}
sub {
name
}
root {
subName
}
status
maxBid
company
location
remote
upvotes
sats
boost
lastCommentAt
commentSats
path
ncomments
}`
/**
 * Build the search document for one item and write it to the `item` index.
 *
 * The document is a shallow copy of `item` with some derived fields:
 * company/location/remote are appended to the title, `sub` falls back to the
 * root's sub name, markdown is stripped from `text`, and `wvotes` is set to
 * weighted votes minus weighted down votes as read from the database.
 *
 * @param {object} item - item shaped like the ItemSearchFields fragment
 * @param {object} ctx
 * @param {object} ctx.models - db client exposing `item.findUnique`
 * @returns {Promise<void>} resolves once indexed, or once a version conflict
 *   has been ignored
 * @throws rethrows any indexing error other than a 409 version conflict
 */
async function _indexItem (item, { models }) {
  console.log('indexing item', item.id)

  // never touch the caller's object, only this copy is sent to search
  const doc = { ...item }

  // HACK: modify the title for jobs so that company/location are searchable
  // and highlighted without further modification
  if (item.company) {
    doc.title += ` \\ ${item.company}`
  }
  const places = [item.location, item.remote && 'Remote'].filter(Boolean)
  if (places.length > 0) {
    doc.title += ` \\ ${places.join(' or ')}`
  }

  // items without a sub name of their own take the root's
  if (!item.sub?.name && item.root?.subName) {
    doc.sub = { name: item.root.subName }
  }

  // index plain text rather than raw markdown
  if (item.text) {
    doc.text = removeMd(item.text)
  }

  // the weighted vote columns are read straight from the db row
  const votes = await models.item.findUnique({
    where: { id: Number(item.id) },
    select: { weightedVotes: true, weightedDownVotes: true }
  })
  doc.wvotes = votes.weightedVotes - votes.weightedDownVotes

  try {
    // external versioning keyed on updatedAt
    const request = {
      id: item.id,
      index: 'item',
      version: new Date(item.updatedAt).getTime(),
      versionType: 'external_gte',
      body: doc
    }
    await search.index(request)
  } catch (e) {
    const isVersionConflict = e?.meta?.statusCode === 409
    if (!isVersionConflict) {
      console.log(e)
      throw e
    }
    // ignore version conflict ...
    console.log('version conflict ignoring', item.id)
    return
  }

  console.log('done indexing item', item.id)
}
/**
 * Create the handler that (re)indexes a single item.
 *
 * @param {object} deps
 * @param {object} deps.apollo - GraphQL client exposing `query`
 * @param {object} deps.models - db client handed through to `_indexItem`
 * @returns {function({ data: { id: (number|string) } }): Promise<void>}
 *   handler that fetches the item with the given id and indexes it
 */
export function indexItem ({ apollo, models }) {
  // One static document shared by every call. The id is passed as a variable
  // rather than interpolated into the query text, so graphql-tag does not
  // parse and cache a new document for every distinct id, and the id can
  // never alter the shape of the query.
  // NOTE(review): assumes the schema declares `item(id: ID!)` — confirm.
  const itemQuery = gql`
    ${ITEM_SEARCH_FIELDS}
    query Item($id: ID!) {
      item(id: $id) {
        ...ItemSearchFields
      }
    }`

  return async function ({ data: { id } }) {
    console.log('indexing item, fetching ...', id)

    // 1. grab the item through the GraphQL API rather than straight from the
    // db, to avoid duping logic when grabbing sats and user name, etc
    const { data: { item } } = await apollo.query({
      query: itemQuery,
      variables: { id }
    })

    // 2. index it with external version based on updatedAt
    await _indexItem(item, { models })
  }
}
/**
 * Create the handler that walks every item, newest first, and indexes it.
 *
 * Items are fetched in pages of 1000 by following the cursor returned with
 * each page. All items of a page are indexed concurrently and the handler
 * waits for the whole page to settle before requesting the next one, so it
 * only resolves once every indexing attempt has finished.
 *
 * @param {object} deps
 * @param {object} deps.apollo - GraphQL client exposing `query`
 * @param {object} deps.models - db client handed through to `_indexItem`
 * @returns {function(): Promise<void>} handler that reindexes all items;
 *   failures to index individual items are logged and skipped
 */
export function indexAllItems ({ apollo, models }) {
  // the query never changes between pages, only the cursor variable does
  const allItemsQuery = gql`
    ${ITEM_SEARCH_FIELDS}
    query AllItems($cursor: String) {
      items(cursor: $cursor, sort: "recent", limit: 1000, type: "all") {
        items {
          ...ItemSearchFields
        }
        cursor
      }
    }`

  return async function () {
    // cursor over all items in the Item table
    let cursor = null
    do {
      // query for items
      const { data: { items: page } } = await apollo.query({
        query: allItemsQuery,
        variables: { cursor }
      })
      cursor = page.cursor

      // for all items, index them. _indexItem is async, so its failures only
      // surface as promise rejections: a try/catch around a forEach never
      // sees them. allSettled waits for every item and hands back each outcome.
      const outcomes = await Promise.allSettled(
        page.items.map(item => _indexItem(item, { models }))
      )

      // ignore errors, one bad item must not stop the full reindex
      for (const outcome of outcomes) {
        if (outcome.status === 'rejected') {
          console.log(outcome.reason)
        }
      }
    } while (cursor)
  }
}