All files / lib/attachment-archive backfill.ts

67.74% Statements 21/31
50% Branches 10/20
85.71% Functions 6/7
67.74% Lines 21/31

Press n or j to go to the next uncovered block, b, p or k for the previous block.

1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155        1x 1x                       3x                                 3x   3x                                       1x                           1x 1x   1x       2x 2x                                                                           1x     1x 2x                                         2x 2x 3x 3x       2x 2x 1x        
import { search } from "libs/opensearch-lib";
 
import { getDomainAndNamespace } from "../libs/utils";
 
/** Composite aggregation `size` requested by `getAttachmentArchiveBackfillPage` for each page. */
export const ATTACHMENT_ARCHIVE_BACKFILL_PAGE_SIZE = 25;
/** Composite aggregation `size` requested per round trip by the `listAll…` helpers in this file. */
const COMPOSITE_PAGE_SIZE = 500;
 
/** One bucket of a composite aggregation; `key` maps each source name to its value. */
interface CompositeBucket {
  key: Record<string, string>;
}

/**
 * The portion of a composite aggregation response that this module reads.
 * Both fields are optional because callers treat a missing value as
 * "no buckets" / "no further page".
 */
interface CompositeAggregationResult {
  /** Cursor that callers pass back as `after` on the following request. */
  after_key?: Record<string, string>;
  /** Buckets returned for the current page. */
  buckets?: CompositeBucket[];
}
 
/**
 * Builds the query clause applied to every search issued by this module.
 *
 * A document matches when the `attachments.key` field exists and the
 * document is not marked with `isAdminChange: true`.
 *
 * @returns A fresh `bool` query object on every call.
 */
function getAttachmentArchiveEligibilityQuery() {
  const hasAttachmentKey = { exists: { field: "attachments.key" } };
  const isAdminChange = { term: { isAdminChange: true } };

  return {
    bool: {
      filter: [hasAttachmentKey],
      must_not: [isAdminChange],
    },
  };
}
 
/**
 * Runs one composite aggregation request against the "changelog" index,
 * restricted to documents matching the attachment-archive eligibility query.
 *
 * @param after - Cursor from a previous page; left out of the request when falsy.
 * @param size - Value sent as the composite aggregation `size`.
 * @param sources - Composite aggregation source definitions.
 * @returns The raw search response, typed down to the `aggregations.values`
 *   part that callers in this module read.
 */
async function searchCompositeAggregation({
  after,
  size,
  sources,
}: {
  after?: Record<string, string>;
  size: number;
  sources: Array<Record<string, unknown>>;
}) {
  const { domain, index } = getDomainAndNamespace("changelog");

  // Only send `after` when a cursor was supplied.
  const cursor = after ? { after } : {};
  const composite = { size, ...cursor, sources };

  // `size: 0` requests no hits — only the aggregation result is wanted.
  const requestBody = {
    size: 0,
    query: getAttachmentArchiveEligibilityQuery(),
    aggs: {
      values: { composite },
    },
  };

  const response = await search(domain, index, requestBody);

  return response as {
    aggregations?: {
      values?: CompositeAggregationResult;
    };
  };
}
 
/**
 * Fetches a single page of distinct package ids that are eligible for the
 * attachment archive backfill.
 *
 * @param afterKey - `packageId` cursor returned by a previous call; a falsy
 *   value starts from the first page.
 * @returns `packageIds` found on this page, the `afterKey` to pass to the next
 *   call, and `done`, which is `true` when the response carried no next cursor.
 */
export async function getAttachmentArchiveBackfillPage({ afterKey }: { afterKey?: string }) {
  let after: Record<string, string> | undefined;
  if (afterKey) {
    after = { packageId: afterKey };
  }

  const packageIdSource = {
    packageId: {
      terms: {
        field: "packageId.keyword",
      },
    },
  };

  const { aggregations } = await searchCompositeAggregation({
    after,
    size: ATTACHMENT_ARCHIVE_BACKFILL_PAGE_SIZE,
    sources: [packageIdSource],
  });

  const page = aggregations?.values;
  const nextAfterKey = page?.after_key?.packageId;

  // Collect the bucket keys, dropping any that are missing or empty.
  const packageIds: string[] = [];
  for (const { key } of page?.buckets || []) {
    const id = key.packageId;
    if (id) {
      packageIds.push(id);
    }
  }

  return {
    afterKey: nextAfterKey,
    done: !nextAfterKey,
    packageIds,
  };
}
 
/**
 * Walks every page of the package-id composite aggregation and collects the
 * distinct package ids of eligible documents.
 *
 * @returns All collected package ids, de-duplicated and sorted with the
 *   default `Array.prototype.sort` ordering.
 */
export async function listAllAttachmentArchivePackageIds() {
  const seen = new Set<string>();
  let cursor: Record<string, string> | undefined;

  do {
    const response = await searchCompositeAggregation({
      after: cursor,
      size: COMPOSITE_PAGE_SIZE,
      sources: [{ packageId: { terms: { field: "packageId.keyword" } } }],
    });
    const page = response.aggregations?.values;

    (page?.buckets || []).forEach(({ key }) => {
      if (key.packageId) {
        seen.add(key.packageId);
      }
    });

    // A response without `after_key` ends the pagination.
    cursor = page?.after_key;
  } while (cursor);

  return Array.from(seen).sort();
}
 
/**
 * Walks every page of the (packageId, sectionId) composite aggregation and
 * collects the distinct pairs found on eligible documents.
 *
 * The `sectionId` source is read from the `id.keyword` field.
 *
 * @returns Every pair encoded as `"<packageId>::<sectionId>"`, de-duplicated
 *   and sorted with the default `Array.prototype.sort` ordering.
 */
export async function listAllAttachmentArchiveSections() {
  const sections = new Set<string>();
  let after: Record<string, string> | undefined;

  while (true) {
    const result = await searchCompositeAggregation({
      after,
      size: COMPOSITE_PAGE_SIZE,
      sources: [
        {
          packageId: {
            terms: {
              field: "packageId.keyword",
            },
          },
        },
        {
          sectionId: {
            terms: {
              field: "id.keyword",
            },
          },
        },
      ],
    });

    const aggregation = result.aggregations?.values;
    for (const bucket of aggregation?.buckets || []) {
      // Skip buckets where either half of the pair is missing or empty.
      if (bucket.key.packageId && bucket.key.sectionId) {
        sections.add(`${bucket.key.packageId}::${bucket.key.sectionId}`);
      }
    }

    // The whole `after_key` object (both source values) is the next cursor;
    // a response without one ends the pagination.
    after = aggregation?.after_key;
    if (!after) {
      return Array.from(sections).sort();
    }
  }
}