325 lines
8.8 KiB
TypeScript
325 lines
8.8 KiB
TypeScript
/* eslint-disable @typescript-eslint/no-explicit-any */
|
|
import type { Knex } from 'knex'
|
|
import { postgresMaxConnections } from '@/modules/shared/helpers/envHelper'
|
|
import { EnvironmentResourceError, LogicError } from '@/modules/shared/errors'
|
|
import type { MaybeAsync } from '@speckle/shared'
|
|
import { isNonNullable } from '@speckle/shared'
|
|
import { base64Decode, base64Encode } from '@/modules/shared/helpers/cryptoHelper'
|
|
import type { Dayjs } from 'dayjs'
|
|
import dayjs from 'dayjs'
|
|
import type { MaybeNullOrUndefined, Nullable } from '@speckle/shared'
|
|
import type { SchemaConfig } from '@/modules/core/dbSchema'
|
|
import { has, isObjectLike, isString, mapValues, pick, times } from 'lodash-es'
|
|
import cryptoRandomString from 'crypto-random-string'
|
|
|
|
export type Collection<T> = {
|
|
cursor: string | null
|
|
totalCount: number
|
|
items: T[]
|
|
}
|
|
|
|
export type BatchedSelectOptions = {
|
|
/**
|
|
* Maximum amount of items to pull in one batch
|
|
* Defaults to: 100
|
|
*/
|
|
batchSize: number
|
|
trx: Knex.Transaction
|
|
}
|
|
|
|
/**
|
|
* Batches a SELECT query through the use of LIMIT/OFFSET
|
|
*/
|
|
export async function* executeBatchedSelect<
|
|
TRecord extends {},
|
|
TResult extends Array<any>
|
|
>(
|
|
selectQuery: Knex.QueryBuilder<TRecord, TResult>,
|
|
options?: Partial<BatchedSelectOptions>
|
|
): AsyncGenerator<Awaited<typeof selectQuery>, void, unknown> {
|
|
const { batchSize = 100, trx } = options || {}
|
|
|
|
if (trx) selectQuery.transacting(trx)
|
|
|
|
selectQuery.limit(batchSize)
|
|
|
|
let hasMorePages = true
|
|
let currentOffset = 0
|
|
while (hasMorePages) {
|
|
const q = selectQuery.clone().offset(currentOffset)
|
|
const results = (await q) as Awaited<typeof selectQuery>
|
|
|
|
if (!results.length) {
|
|
hasMorePages = false
|
|
break
|
|
} else {
|
|
currentOffset += results.length
|
|
}
|
|
|
|
yield results
|
|
}
|
|
}
|
|
|
|
const iso8601TimestampRegex = /\d{4}-\d{2}-\d{2}T\d{2}:\d{2}:\d{2}\.\d{3}\+\d{2}:\d{2}/
|
|
|
|
/**
|
|
* When rows are grouped and returned as an array through array_agg(row_to_json(...)), the fields don't get formatted as they would
|
|
* if the rows were returned directly. For example, date strings don't get converted to Date objects.
|
|
*
|
|
* This function will handle that.
|
|
*/
|
|
export const formatJsonArrayRecords = <V extends Record<string, unknown>>(
|
|
records: V[]
|
|
) =>
|
|
records
|
|
.map((r): typeof r | undefined => {
|
|
// PG can sometimes retuern `[null]` for an empty array_agg
|
|
if (!r) return r
|
|
|
|
const res: Record<string, unknown> = {}
|
|
for (const [key, value] of Object.entries(r)) {
|
|
// Check if value is an ISO date string or matches common date keys
|
|
if (
|
|
isString(value) &&
|
|
(key.endsWith('At') || iso8601TimestampRegex.test(value))
|
|
) {
|
|
res[key] = new Date(value)
|
|
} else {
|
|
res[key] = value
|
|
}
|
|
}
|
|
|
|
return res as V
|
|
})
|
|
.filter(isNonNullable)
|
|
|
|
export const numberOfUsedOrPendingConnections = (db: Knex) => {
|
|
if (!(db && 'client' in db && db.client))
|
|
throw new EnvironmentResourceError('knex is not defined or does not have a client.')
|
|
|
|
const dbClient: Knex.Client = db.client
|
|
if (!('pool' in dbClient && dbClient.pool))
|
|
throw new EnvironmentResourceError('knex client does not have a connection pool')
|
|
|
|
const pool = dbClient.pool
|
|
|
|
return (
|
|
pool.numUsed() +
|
|
pool.numPendingCreates() +
|
|
pool.numPendingValidations() +
|
|
pool.numPendingAcquires()
|
|
)
|
|
}
|
|
|
|
export const numberOfFreeConnections = (knex: Knex) => {
|
|
const pgMaxConnections = postgresMaxConnections()
|
|
|
|
const demand = numberOfUsedOrPendingConnections(knex)
|
|
|
|
return Math.max(pgMaxConnections - demand, 0)
|
|
}
|
|
|
|
export const withTransaction = async <T>(
|
|
operation: (args: { db: Knex; trx: Knex }) => MaybeAsync<T>,
|
|
params: {
|
|
db: Knex
|
|
}
|
|
) => {
|
|
const { db } = params
|
|
const trx = await db.transaction()
|
|
|
|
try {
|
|
// db and trx are just aliases, you can use whichever is more convenient
|
|
const result = await operation({ db: trx, trx })
|
|
await trx.commit()
|
|
return result
|
|
} catch (e) {
|
|
await trx.rollback()
|
|
throw e
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Encode cursor to turn it into an opaque & obfuscated value
|
|
*/
|
|
export function encodeCursor(value: string): string {
|
|
return base64Encode(value)
|
|
}
|
|
|
|
/**
|
|
* Decode obfuscated cursor value
|
|
*/
|
|
export function decodeCursor(value: string): string {
|
|
return base64Decode(value)
|
|
}
|
|
|
|
export function decodeIsoDateCursor(value: string): string | null {
|
|
const decoded = decodeCursor(value)
|
|
if (!decoded) return null
|
|
|
|
const date = dayjs(decoded)
|
|
if (!date.isValid()) return null
|
|
|
|
return date.toISOString()
|
|
}
|
|
|
|
export function encodeIsoDateCursor(date: Date | Dayjs): string {
|
|
const str = date.toISOString()
|
|
return encodeCursor(str)
|
|
}
|
|
|
|
export const encodeCompositeCursor = <C extends object>(val: C): string => {
|
|
const json = JSON.stringify(val)
|
|
return encodeCursor(json)
|
|
}
|
|
|
|
export const decodeCompositeCursor = <C extends object>(
|
|
cursor: MaybeNullOrUndefined<string>,
|
|
/**
|
|
* Users can feed in any kind of garbage into the cursor, this predicate will validate
|
|
* that its the expected format and if it isn't, null will be returned
|
|
*/
|
|
validate: (obj: unknown) => boolean
|
|
): Nullable<C> => {
|
|
if (!cursor) return null
|
|
|
|
let decodedJson: unknown
|
|
try {
|
|
decodedJson = JSON.parse(decodeCursor(cursor))
|
|
} catch {
|
|
// swallow - user error
|
|
return null
|
|
}
|
|
|
|
if (validate(decodedJson)) {
|
|
return decodedJson as C
|
|
}
|
|
|
|
return null
|
|
}
|
|
|
|
// This is to allow custom column/alias support for compositeCursorTools() - we don't want
|
|
// to force the user to pass in the entire schema config, just the data we need
|
|
type LimitedSchemaConfig = Pick<SchemaConfig<any, any, any>, 'col'>
|
|
|
|
/**
|
|
* Simplifies working with composite cursors in SQL queries. Composite cursors are better because they
|
|
* allow duplicate values (e.g. updatedAt date) in different rows
|
|
*/
|
|
export const compositeCursorTools = <
|
|
Config extends LimitedSchemaConfig,
|
|
SelectedCols extends Array<keyof Config['col']>
|
|
>(args: {
|
|
/**
|
|
* Db table schema config OR in case of aliased columns - manual column mapping between final aliases
|
|
* as keys and table-prefixed column names as values
|
|
*/
|
|
schema: Config
|
|
/**
|
|
* Order of columns matters - put the primary ordering column first (e.g. updatedAt), then the secondary
|
|
* ones like the ID.
|
|
*/
|
|
cols: SelectedCols
|
|
}) => {
|
|
type Cursor = {
|
|
[Col in SelectedCols[number]]: string
|
|
}
|
|
|
|
type CursorRecord = {
|
|
[Col in SelectedCols[number]]: string | Date | number | boolean
|
|
}
|
|
|
|
const encode = (val: Cursor) => encodeCompositeCursor(val)
|
|
const decode = (cursor: MaybeNullOrUndefined<string>): Nullable<Cursor> =>
|
|
decodeCompositeCursor(
|
|
cursor,
|
|
(c) => isObjectLike(c) && args.cols.every((col) => has(c, col))
|
|
)
|
|
|
|
/**
|
|
* Invoke this on the knex querybuilder to filter the query by the cursor and apply
|
|
* appropriate ordering
|
|
*/
|
|
const applyCursorSortAndFilter = <Query extends Knex.QueryBuilder>(params: {
|
|
query: Query
|
|
/**
|
|
* If falsy, filter will be skipped
|
|
*/
|
|
cursor: MaybeNullOrUndefined<Cursor | string>
|
|
/**
|
|
* How the results are sorted. Descending by default.
|
|
*/
|
|
sort?: 'desc' | 'asc'
|
|
}) => {
|
|
const { query, sort = 'desc' } = params
|
|
|
|
// Apply orderBy for each cursor column w/ proper sort direction
|
|
args.cols.forEach((col) => {
|
|
query.orderBy(args.schema.col[col], sort)
|
|
})
|
|
|
|
const cursor = isString(params.cursor) ? decode(params.cursor) : params.cursor
|
|
if (!cursor) return query
|
|
|
|
// Apply cursor filter
|
|
const colCount = args.cols.length
|
|
|
|
const sql = `(${times(colCount, () => '??').join(', ')}) ${
|
|
sort === 'desc' ? '<' : '>'
|
|
} (${times(colCount, () => '?').join(', ')})` // string like (??, ??) < (?, ?)
|
|
|
|
// e.g. WHERE (table.updatedAt, table.id) < ('2023-10-01T00:00:00.000Z', '12345')
|
|
query.andWhereRaw(sql, [
|
|
...args.cols.map((col) => args.schema.col[col]),
|
|
...args.cols.map((col) => cursor[col].toString())
|
|
])
|
|
|
|
return query
|
|
}
|
|
|
|
/**
|
|
* Feed in an entire page of items and this will build the next cursor accordingly
|
|
*/
|
|
const resolveNewCursor = (items: Array<CursorRecord>) => {
|
|
if (!items.length) return null
|
|
const lastItem = items.at(-1)
|
|
if (!lastItem) return null
|
|
|
|
const cursor: Cursor = mapValues(pick(lastItem, args.cols), (value) => {
|
|
if (value instanceof Date) {
|
|
return value.toISOString()
|
|
}
|
|
|
|
return `${value}`
|
|
})
|
|
|
|
return encode(cursor)
|
|
}
|
|
|
|
return {
|
|
encode,
|
|
decode,
|
|
applyCursorSortAndFilter,
|
|
resolveNewCursor
|
|
}
|
|
}
|
|
|
|
export const prepareTransaction = async (db: Knex): Promise<string> => {
|
|
if (!db.isTransaction) {
|
|
throw new LogicError('Cannot PREPARE postgres operation outside of a transaction')
|
|
}
|
|
|
|
const preparedId = cryptoRandomString({ length: 10 })
|
|
|
|
await db.raw(`PREPARE TRANSACTION '${preparedId}';`)
|
|
|
|
return preparedId
|
|
}
|
|
|
|
export const rollbackPreparedTransaction = async (
|
|
db: Knex,
|
|
gid: string
|
|
): Promise<void> => {
|
|
await db.raw(`ROLLBACK PREPARED '${gid}';`)
|
|
}
|