ente/web/packages/utils/array.ts

/**
 * Shuffle.
 *
 * Return a new array containing the shuffled elements of the given array. The
 * given array itself is not modified.
 *
 * The algorithm used is not the most efficient, but is effectively a one-liner
 * whilst being reasonably efficient. To each element we assign a random key,
 * then we sort by this key. Since the key is random, the sorted array will have
 * the original elements in a random order.
 *
 * @param xs The array whose elements should be shuffled.
 *
 * @returns A new array with the same elements as {@link xs}, in random order.
 */
export const shuffled = <T>(xs: T[]): T[] =>
    xs
        .map((x): [number, T] => [Math.random(), x])
        // Compare the numeric keys explicitly. The default comparator would
        // convert each [key, element] pair to a string, which needlessly
        // stringifies the element too, and throws for elements that cannot be
        // converted to a string (e.g. symbols or null-prototype objects).
        .sort(([a], [b]) => a - b)
        .map(([, x]) => x);

/**
 * Return a random sample of {@link n} elements from the given {@link items}.
 *
 * Functionally this is equivalent to `shuffled(items).slice(0, n)`, except it
 * tries to be a bit faster for long arrays when we need only a small sample
 * from it. In a few tests, this indeed makes a substantial difference.
 *
 * If {@link n} is greater than or equal to the number of {@link items} then a
 * random shuffle of all the {@link items} is returned.
 *
 * @param items The array to sample from. It is not modified.
 *
 * @param n The number of elements wanted in the sample.
 *
 * @returns A new array containing the sampled elements.
 */
export const randomSample = <T>(items: T[], n: number): T[] => {
    if (items.length <= n) return shuffled(items);
    if (n === 0) return [];

    if (n > items.length / 3) {
        // Avoid using the random sampling without replacement method if a
        // significant proportion of the original items are needed, otherwise
        // we might run into a long retry loop at the tail end (hitting the
        // same indexes again and again).
        return shuffled(items).slice(0, n);
    }

    // Keep picking random indexes until we have n distinct ones. The set
    // discards repeats, so each item appears at most once in the sample.
    const ix = new Set<number>();
    while (ix.size < n) {
        ix.add(Math.floor(Math.random() * items.length));
    }
    return [...ix].map((i) => items[i]!);
};

/**
 * Pick the first entry of {@link ss} that is a non-empty string.
 *
 * The `a ?? b` idiom only skips over `undefined` (and `null`), so it happily
 * returns "" when a is "". This helper additionally skips over empty strings.
 *
 * @param ss The candidate strings, in order of preference.
 *
 * @returns The first non-empty string, or `undefined` if the array is empty or
 * has no non-empty strings in it.
 */
export const firstNonEmpty = (
    ss: (string | undefined)[],
): string | undefined =>
    ss.find((candidate) => !!candidate && candidate.length > 0);

/**
 * Concatenate the given {@link Uint8Array}s, in order, into one newly
 * allocated {@link Uint8Array}.
 *
 * @param as An array of {@link Uint8Array}.
 *
 * @returns A new {@link Uint8Array} holding the bytes of each input array, one
 * after the other.
 */
export const mergeUint8Arrays = (as: Uint8Array[]): Uint8Array => {
    // This is the longer, but better performing, way of writing
    //
    //     new Uint8Array(as.reduce((acc, x) => acc.concat(...x), []))
    //
    // First find the total size so that the result is allocated only once.
    let totalLength = 0;
    for (const chunk of as) totalLength += chunk.length;

    // Then copy each chunk to its offset in the result.
    const merged = new Uint8Array(totalLength);
    let offset = 0;
    for (const chunk of as) {
        merged.set(chunk, offset);
        offset += chunk.length;
    }
    return merged;
};

/**
 * Break an array into batches of size {@link batchSize}.
 *
 * The last batch will have fewer elements if the length of {@link xs} is not a
 * multiple of {@link batchSize}. The given array is not modified.
 *
 * @param xs The array to break into batches.
 *
 * @param batchSize The maximum number of elements in each batch. Must be
 * greater than zero.
 *
 * @returns An array of the resultant batches.
 *
 * @throws RangeError if {@link batchSize} is not greater than zero.
 */
export const batch = <T>(xs: T[], batchSize: number): T[][] => {
    // A zero or negative step would never move past the end of the array, so
    // the loop below would never terminate. The negated comparison also
    // rejects NaN.
    if (!(batchSize > 0)) {
        throw new RangeError(
            `batchSize must be greater than zero, got ${batchSize}`,
        );
    }

    const batches: T[][] = [];
    for (let i = 0; i < xs.length; i += batchSize) {
        batches.push(xs.slice(i, i + batchSize));
    }
    return batches;
};

/**
 * Partition an array into the elements that satisfy the given
 * {@link predicate} and the elements that don't.
 *
 * The relative order of the elements is retained within each part.
 *
 * @param xs The array to split.
 *
 * @param predicate A function invoked once for each element, in order, to
 * decide which part of the split that element goes into.
 *
 * @returns A tuple of two arrays. The first array has all the elements for
 * which the predicate returned `true`, and the second array has the remaining
 * elements.
 */
export const splitByPredicate = <T>(
    xs: T[],
    predicate: (t: T) => boolean,
): [T[], T[]] => {
    const matching: T[] = [];
    const rest: T[] = [];
    for (const x of xs) {
        if (predicate(x)) matching.push(x);
        else rest.push(x);
    }
    return [matching, rest];
};