stacker.news/worker/earn.js

155 lines
7.2 KiB
JavaScript
Raw Normal View History

2022-03-17 20:13:19 +00:00
const serialize = require('../api/resolvers/serial')
2023-08-14 19:37:09 +00:00
const { ANON_USER_ID } = require('../lib/constants')
2022-03-17 20:13:19 +00:00
2023-07-06 16:10:44 +00:00
// legacy per-item / per-upvote reward weights, kept for reference only
// const ITEM_EACH_REWARD = 3.0
// const UPVOTE_EACH_REWARD = 6.0

// only posts/comments whose vote percentile is <= this value are rewarded
const TOP_PERCENTILE = 21
// sanity cap on a single day's reward pool (in msats); the job refuses to pay
// out when the computed pool is larger than this
const TOTAL_UPPER_BOUND_MSATS = 1000000000
// user ids whose zaps are weighted at a flat 0.2 instead of the trust-based
// multiplier when computing reward shares
const REDUCE_REWARDS = [616, 6030, 946, 4502]
2022-07-07 19:14:22 +00:00
2022-03-17 20:13:19 +00:00
/**
 * Builds the daily rewards job handler.
 *
 * The returned handler:
 *   1. sums yesterday's (America/Chicago day) revenue in msats: non-TIP item
 *      acts minus referral cuts, donations, and tips on non-forwarded items
 *      owned by the anon user
 *   2. bails out if that pool is <= 0 or above TOTAL_UPPER_BOUND_MSATS
 *   3. ranks zappers of the top TOP_PERCENTILE% posts/comments of the last
 *      36 hours and computes each one's proportion of the pool
 *   4. pays each earner by calling the `earn(...)` database function through
 *      `serialize`, one earner at a time
 *
 * @param {object} deps
 * @param {object} deps.models - database client exposing `$queryRaw` and
 *   `$executeRaw` tagged templates (a Prisma client, per the notes below)
 * @returns {function({ name: string }): Promise<void>} async job handler; it
 *   resolves only after every payout has completed and rejects if a query or
 *   a payout fails
 */
function earn ({ models }) {
  return async function ({ name }) {
    console.log('running', name)

    // compute how much sn earned today
    const [{ sum: sumDecimal }] = await models.$queryRaw`
      SELECT coalesce(sum(msats), 0) as sum
      FROM (
        (SELECT ("ItemAct".msats - COALESCE("ReferralAct".msats, 0)) as msats
          FROM "ItemAct"
          LEFT JOIN "ReferralAct" ON "ReferralAct"."itemActId" = "ItemAct".id
          WHERE date_trunc('day', "ItemAct".created_at AT TIME ZONE 'UTC' AT TIME ZONE 'America/Chicago') = date_trunc('day', (now() - interval '1 day') AT TIME ZONE 'America/Chicago') AND "ItemAct".act <> 'TIP')
        UNION ALL
        (SELECT sats * 1000 as msats
          FROM "Donation"
          WHERE date_trunc('day', created_at AT TIME ZONE 'UTC' AT TIME ZONE 'America/Chicago') = date_trunc('day', (now() - interval '1 day') AT TIME ZONE 'America/Chicago'))
        UNION ALL
        (SELECT "ItemAct".msats
          FROM "Item"
          JOIN "ItemAct" ON "ItemAct"."itemId" = "Item".id
          WHERE "Item"."userId" = ${ANON_USER_ID} AND "ItemAct".act = 'TIP' AND "Item"."fwdUserId" IS NULL
          AND date_trunc('day', "ItemAct".created_at AT TIME ZONE 'UTC' AT TIME ZONE 'America/Chicago') = date_trunc('day', (now() - interval '1 day') AT TIME ZONE 'America/Chicago'))
      ) subquery`

    // XXX prisma will return a Decimal (https://mikemcl.github.io/decimal.js)
    // because sum of a BIGINT returns a NUMERIC type (https://www.postgresql.org/docs/13/functions-aggregate.html)
    // and Decimal is what prisma maps it to https://www.prisma.io/docs/concepts/components/prisma-client/raw-database-access#raw-query-type-mapping
    // so check it before coercing to Number
    if (!sumDecimal || sumDecimal.lessThanOrEqualTo(0)) {
      console.log('done', name, 'no sats to award today')
      return
    }

    // extra sanity check on rewards ... if it's more than upper bound, we
    // probably have a bug somewhere or we've grown A LOT
    if (sumDecimal.greaterThan(TOTAL_UPPER_BOUND_MSATS)) {
      console.log('done', name, 'error: too many sats to award today', sumDecimal)
      return
    }

    // safe to coerce: the value is bounded by TOTAL_UPPER_BOUND_MSATS here
    const sum = Number(sumDecimal)

    console.log(name, 'giving away', sum, 'msats')

    /*
      How earnings (used to) work:
      1/3: top 21% posts over last 36 hours, scored on a relative basis
      1/3: top 21% comments over last 36 hours, scored on a relative basis
      1/3: top upvoters of top posts/comments, scored on:
        - their trust
        - how much they tipped
        - how early they upvoted it
        - how the post/comment scored

      Now: 100% of earnings go to zappers of the top 21% of posts/comments
    */

    // get earners { userId, id, type, rank, proportion }
    const earners = await models.$queryRaw`
      -- get top 21% of posts and comments
      WITH item_ratios AS (
        SELECT *,
          CASE WHEN "parentId" IS NULL THEN 'POST' ELSE 'COMMENT' END as type,
          CASE WHEN "weightedVotes" > 0 THEN "weightedVotes"/(sum("weightedVotes") OVER (PARTITION BY "parentId" IS NULL)) ELSE 0 END AS ratio
        FROM (
          SELECT *,
            NTILE(100) OVER (PARTITION BY "parentId" IS NULL ORDER BY ("weightedVotes"-"weightedDownVotes") desc) AS percentile,
            ROW_NUMBER() OVER (PARTITION BY "parentId" IS NULL ORDER BY ("weightedVotes"-"weightedDownVotes") desc) AS rank
          FROM
            "Item"
          WHERE created_at >= now_utc() - interval '36 hours'
          AND "weightedVotes" > 0 AND "deletedAt" IS NULL AND NOT bio
        ) x
        WHERE x.percentile <= ${TOP_PERCENTILE}
      ),
      -- get top upvoters of top posts and comments
      upvoter_islands AS (
        SELECT "ItemAct"."userId", item_ratios.id, item_ratios.ratio, item_ratios."parentId",
          "ItemAct".msats as tipped, "ItemAct".created_at as acted_at,
          ROW_NUMBER() OVER (partition by item_ratios.id order by "ItemAct".created_at asc)
          - ROW_NUMBER() OVER (partition by item_ratios.id, "ItemAct"."userId" order by "ItemAct".created_at asc) AS island
        FROM item_ratios
        JOIN "ItemAct" on "ItemAct"."itemId" = item_ratios.id
        WHERE act = 'TIP'
      ),
      -- isolate contiguous upzaps from the same user on the same item so that when we take the log
      -- of the upzaps it accounts for successive zaps and does not disproporionately reward them
      upvoters AS (
        SELECT "userId", id, ratio, "parentId", GREATEST(log(sum(tipped) / 1000), 0) as tipped, min(acted_at) as acted_at
        FROM upvoter_islands
        GROUP BY "userId", id, ratio, "parentId", island
      ),
      -- the relative contribution of each upvoter to the post/comment
      -- early multiplier: 10/ln(early_rank + e)
      -- we also weight by trust in a step wise fashion
      upvoter_ratios AS (
        SELECT "userId", sum(early_multiplier*tipped_ratio*ratio*CASE WHEN users.id = ANY (${REDUCE_REWARDS}) THEN 0.2 ELSE CEIL(users.trust*2)+1 END) as upvoter_ratio,
          "parentId" IS NULL as "isPost", CASE WHEN "parentId" IS NULL THEN 'TIP_POST' ELSE 'TIP_COMMENT' END as type
        FROM (
          SELECT *,
            10.0/LN(ROW_NUMBER() OVER (partition by id order by acted_at asc) + EXP(1.0)) AS early_multiplier,
            tipped::float/(sum(tipped) OVER (partition by id)) tipped_ratio
          FROM upvoters
        ) u
        JOIN users on "userId" = users.id
        GROUP BY "userId", "parentId" IS NULL
      )
      SELECT "userId", NULL as id, type, ROW_NUMBER() OVER (PARTITION BY "isPost" ORDER BY upvoter_ratio DESC) as rank,
        upvoter_ratio/(sum(upvoter_ratio) OVER (PARTITION BY "isPost"))/2 as proportion
      FROM upvoter_ratios
      WHERE upvoter_ratio > 0
      ORDER BY "isPost", rank ASC`

    // in order to group earnings for users we use the same createdAt time for
    // all earnings
    const now = new Date()

    // this is just a sanity check because it seems like a good idea
    let total = 0

    // for each earner, serialize earnings
    // we do this for each earner because we don't need to serialize
    // all earner updates together
    //
    // NOTE: this must be a for...of loop, not forEach(async ...): forEach
    // ignores the promises returned by its callback, so the job would report
    // 'done' before any payout finished and payout errors would surface as
    // unhandled rejections instead of failing the job
    for (const earner of earners) {
      const earnings = Math.floor(parseFloat(earner.proportion) * sum)
      total += earnings

      // total only ever grows, so once the budget is exceeded no later earner
      // can be paid either ... stop paying out
      if (total > sum) {
        console.log(name, 'total exceeds sum', total, '>', sum)
        break
      }

      console.log('stacker', earner.userId, 'earned', earnings, 'proportion', earner.proportion, 'rank', earner.rank, 'type', earner.type)

      if (earnings > 0) {
        await serialize(models,
          models.$executeRaw`SELECT earn(${earner.userId}::INTEGER, ${earnings},
          ${now}::timestamp without time zone, ${earner.type}::"EarnType", ${earner.id}::INTEGER, ${earner.rank}::INTEGER)`)
      }
    }

    console.log('done', name)
  }
}
2022-07-07 19:14:22 +00:00
// export the earn job-handler factory
module.exports = { earn }