Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

fix: prevent duplicate tiles in task creation #29

Merged
merged 3 commits into from
Nov 25, 2024
Merged
Show file tree
Hide file tree
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
17 changes: 17 additions & 0 deletions package-lock.json

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

1 change: 1 addition & 0 deletions package.json
Original file line number Diff line number Diff line change
Expand Up @@ -39,6 +39,7 @@
}
},
"dependencies": {
"@faker-js/faker": "^9.2.0",
"@godaddy/terminus": "^4.12.1",
"@map-colonies/error-express-handler": "^2.1.0",
"@map-colonies/error-types": "^1.2.0",
Expand Down
10 changes: 9 additions & 1 deletion src/common/interfaces.ts
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@ import {
IngestionUpdateJobParams,
} from '@map-colonies/mc-model-types';
import { TilesMimeFormat } from '@map-colonies/types';
import { BBox, Polygon } from 'geojson';
import { BBox, Feature, MultiPolygon, Polygon } from 'geojson';
import { Footprint, ITileRange } from '@map-colonies/mc-utils';
import { LayerCacheType, SeedMode } from './constants';

Expand Down Expand Up @@ -122,6 +122,14 @@ export interface PartSourceContext {
maxZoom: number;
}

export interface UnifiedPart {
fileName: string;
tilesPath: string;
footprint: Feature<Polygon | MultiPolygon>;
extent: BBox;
maxZoom: number;
}

export interface MergeParameters {
parts: PartSourceContext[];
destPath: string;
Expand Down
54 changes: 40 additions & 14 deletions src/task/models/tileMergeTaskManager.ts
Original file line number Diff line number Diff line change
@@ -1,10 +1,10 @@
import { join } from 'path';
import { BBox } from 'geojson';
import { BBox, Feature, MultiPolygon, Polygon } from 'geojson';
import { Logger } from '@map-colonies/js-logger';
import { InputFiles, PolygonPart, TileOutputFormat } from '@map-colonies/mc-model-types';
import { ICreateTaskBody, TaskHandler as QueueClient } from '@map-colonies/mc-priority-queue';
import { degreesPerPixelToZoomLevel, Footprint, multiIntersect, subGroupsGen, tileBatchGenerator, TileRanger } from '@map-colonies/mc-utils';
import { bbox, featureCollection, union } from '@turf/turf';
import { bbox, featureCollection, intersect, polygon, union } from '@turf/turf';
import { difference } from '@turf/difference';
import { inject, injectable } from 'tsyringe';
import { SERVICES, TilesStorageProvider } from '../../common/constants';
Expand All @@ -19,6 +19,7 @@ import {
PartSourceContext,
IntersectionState,
PartsSourceWithMaxZoom,
UnifiedPart,
} from '../../common/interfaces';
import { convertToFeature } from '../../utils/geoUtils';
import { fileExtensionExtractor } from '../../utils/fileutils';
Expand Down Expand Up @@ -166,23 +167,49 @@ export class TileMergeTaskManager {
private async *createZoomLevelTasks(params: MergeParameters): AsyncGenerator<MergeTaskParameters, void, void> {
const { parts, destPath, targetFormat, isNewTarget, grid, maxZoom } = params;

this.logger.debug({ msg: 'Creating batched tasks', destPath, targetFormat });
for (let zoom = maxZoom; zoom >= 0; zoom--) {
// when we used the old implementation with the parts intersection calculation with large numbers of parts
//we encountered performance issues, as long as we are not performing ingestion from more then one file we can omit this.
// const partsIntersections = this.findPartsIntersections(parts);
for await (const part of parts) {
if (part.maxZoom < zoom) {
// checking if the layer is relevant for the current zoom level (allowing different parts with different resolutions)
continue;
}
const filteredParts = parts.filter((part) => part.maxZoom >= zoom);
const processedParts = this.unifyParts(filteredParts);
for await (const part of processedParts) {
yield* this.createTasksForPart(part, zoom, { destPath, grid, isNewTarget, targetFormat });
}
}
}

private unifyParts(parts: PartSourceContext[]): UnifiedPart[] {
const mergedParts: UnifiedPart[] = [];
// Merge parts by union and avoid duplicate overlaps.
for (const part of parts) {
let merged = false;
const geo1 = polygon(part.footprint.coordinates);
for (let i = 0; i < mergedParts.length; i++) {
const geo2 = mergedParts[i].footprint;
if (this.doIntersect(geo1, geo2)) {
const unionResult = union(featureCollection([geo1, geo2]));
if (unionResult === null) {
continue;
}
mergedParts[i].footprint = unionResult;
merged = true;
break;
}
}
if (!merged) {
const processedPart: UnifiedPart = { ...part, footprint: geo1 };
mergedParts.push(processedPart);
}
}
this.logger.debug({ msg: 'Preprocessed parts', numberOfParts: mergedParts.length });
return mergedParts;
}

private doIntersect(footprint1: Feature<Polygon | MultiPolygon>, footprint2: Feature<Polygon | MultiPolygon>): boolean {
const intersection = intersect(featureCollection([footprint1, footprint2]));
return intersection !== null;
}

private async *createTasksForPart(
part: PartSourceContext,
part: UnifiedPart,
zoom: number,
params: { destPath: string; targetFormat: TileOutputFormat; isNewTarget: boolean; grid: Grid }
): AsyncGenerator<MergeTaskParameters, void, void> {
Expand All @@ -205,7 +232,7 @@ export class TileMergeTaskManager {
}
}

private createPartSources(part: PartSourceContext, grid: Grid, destPath: string): MergeSources[] {
private createPartSources(part: UnifiedPart, grid: Grid, destPath: string): MergeSources[] {
this.logger.debug({ msg: 'Creating source layers' });

const sourceEntry: MergeSources = { type: this.tilesStorageProvider, path: destPath };
Expand Down Expand Up @@ -237,7 +264,6 @@ export class TileMergeTaskManager {
let state: IntersectionState = { currentIntersection: null, accumulatedIntersection: null };

const subGroups = subGroupsGen(parts, parts.length, false);

for (const subGroup of subGroups) {
const subGroupFootprints = subGroup.map((layer) => layer.footprint as Footprint);
this.logger.debug({ msg: 'Processing sub group' });
Expand Down
38 changes: 38 additions & 0 deletions tests/unit/mocks/partsMockData.ts
Original file line number Diff line number Diff line change
@@ -1,5 +1,33 @@
/* eslint-disable @typescript-eslint/no-magic-numbers */
import { faker } from '@faker-js/faker';
import { BBox, Polygon } from 'geojson';
import { PolygonPart } from '@map-colonies/mc-model-types';
import { PartSourceContext } from '../../../src/common/interfaces';

function createFakeBBox(): BBox {
return [
faker.location.longitude({ min: -180, max: 180 }),
faker.location.latitude({ min: -90, max: 90 }),
faker.location.longitude({ min: -180, max: 180 }),
faker.location.latitude({ min: -90, max: 90 }),
];
}

function createFakePolygon(): Polygon {
const firstAndLastPoint = [faker.location.longitude({ min: -180, max: 180 }), faker.location.latitude({ min: -90, max: 90 })];
return {
type: 'Polygon',
coordinates: [
[
firstAndLastPoint,
[faker.location.longitude({ min: -180, max: 180 }), faker.location.latitude({ min: -90, max: 90 })],
[faker.location.longitude({ min: -180, max: 180 }), faker.location.latitude({ min: -90, max: 90 })],
[faker.location.longitude({ min: -180, max: 180 }), faker.location.latitude({ min: -90, max: 90 })],
firstAndLastPoint,
],
],
};
}

export const partsData: PolygonPart[] = [
{
Expand Down Expand Up @@ -114,3 +142,13 @@ export const multiPartDataWithDifferentResolution: PolygonPart[] = [
},
},
];

export function createFakePartSource(): PartSourceContext {
return {
tilesPath: `${faker.string.uuid()}/${faker.string.uuid()}`,
fileName: `${faker.string.alpha({ length: 8 })}.gpkg`,
maxZoom: faker.number.int({ min: 0, max: 21 }),
extent: createFakeBBox(),
footprint: createFakePolygon(),
};
}
85 changes: 48 additions & 37 deletions tests/unit/task/tileMergeTaskManager/tileMergeTaskManager.spec.ts
Original file line number Diff line number Diff line change
@@ -1,9 +1,10 @@
import { randomUUID } from 'crypto';
import nock from 'nock';
import { booleanEqual } from '@turf/turf';
import { faker } from '@faker-js/faker';
import { Feature } from 'geojson';
import { TileOutputFormat } from '@map-colonies/mc-model-types';
import { partsData } from '../../mocks/partsMockData';
import { createFakePartSource, partsData } from '../../mocks/partsMockData';
import { configMock, registerDefaultConfig } from '../../mocks/configMock';
import { Grid, MergeTaskParameters, MergeTilesTaskParams } from '../../../../src/common/interfaces';
import { testData } from '../../mocks/tileMergeTaskManagerMockData';
Expand Down Expand Up @@ -70,6 +71,16 @@ describe('tileMergeTaskManager', () => {
});
});

describe('unifyParts', () => {
it('should unify parts correctly', () => {
const { tileMergeTaskManager } = testContext;
const partsData = faker.helpers.multiple(createFakePartSource, { count: 10 });
const result = tileMergeTaskManager['unifyParts'](partsData);

expect(result.length).toBeGreaterThan(0);
});
});

describe('calculateIntersectionState', () => {
// Test case 1: No intersection found
it('should return null intersection when no overlap is found', () => {
Expand Down Expand Up @@ -130,54 +141,54 @@ describe('tileMergeTaskManager', () => {
expect(result.currentIntersection).toBeNull();
expect(result.accumulatedIntersection).not.toBeNull();
});
});

describe('pushTasks', () => {
it('should push tasks in batches correctly', async () => {
const { tileMergeTaskManager } = testContext;
const buildTasksParams: MergeTilesTaskParams = {
taskMetadata: { layerRelativePath: 'layerRelativePath', tileOutputFormat: TileOutputFormat.PNG, isNewTarget: true, grid: Grid.TWO_ON_ONE },
partsData,
inputFiles: { originDirectory: 'originDirectory', fileNames: ['fileNames'] },
};
describe('pushTasks', () => {
it('should push tasks in batches correctly', async () => {
const { tileMergeTaskManager } = testContext;
const buildTasksParams: MergeTilesTaskParams = {
taskMetadata: { layerRelativePath: 'layerRelativePath', tileOutputFormat: TileOutputFormat.PNG, isNewTarget: true, grid: Grid.TWO_ON_ONE },
partsData,
inputFiles: { originDirectory: 'originDirectory', fileNames: ['fileNames'] },
};

const jobId = randomUUID();
const jobId = randomUUID();

const jobManagerBaseUrl = configMock.get<string>('jobManagement.config.jobManagerBaseUrl');
const path = `/jobs/${jobId}/tasks`;
nock(jobManagerBaseUrl).post(path).reply(200).persist();
const jobManagerBaseUrl = configMock.get<string>('jobManagement.config.jobManagerBaseUrl');
const path = `/jobs/${jobId}/tasks`;
nock(jobManagerBaseUrl).post(path).reply(200).persist();

const tasks = tileMergeTaskManager.buildTasks(buildTasksParams);
const tasks = tileMergeTaskManager.buildTasks(buildTasksParams);

let error: Error | null = null;
try {
await tileMergeTaskManager.pushTasks(jobId, tasks);
} catch (err) {
error = err as Error;
}
let error: Error | null = null;
try {
await tileMergeTaskManager.pushTasks(jobId, tasks);
} catch (err) {
error = err as Error;
}

expect(error).toBeNull();
});
expect(error).toBeNull();
});

it('should handle errors in pushTasks correctly', async () => {
const { tileMergeTaskManager } = testContext;
const buildTasksParams: MergeTilesTaskParams = {
taskMetadata: { layerRelativePath: 'layerRelativePath', tileOutputFormat: TileOutputFormat.PNG, isNewTarget: true, grid: Grid.TWO_ON_ONE },
partsData,
inputFiles: { originDirectory: 'originDirectory', fileNames: ['fileNames'] },
};
it('should handle errors in pushTasks correctly', async () => {
const { tileMergeTaskManager } = testContext;
const buildTasksParams: MergeTilesTaskParams = {
taskMetadata: { layerRelativePath: 'layerRelativePath', tileOutputFormat: TileOutputFormat.PNG, isNewTarget: true, grid: Grid.TWO_ON_ONE },
partsData,
inputFiles: { originDirectory: 'originDirectory', fileNames: ['fileNames'] },
};

const jobId = randomUUID();
const jobId = randomUUID();

const jobManagerBaseUrl = configMock.get<string>('jobManagement.config.jobManagerBaseUrl');
const path = `/jobs/${jobId}/tasks`;
nock(jobManagerBaseUrl).post(path).reply(500).persist();
const jobManagerBaseUrl = configMock.get<string>('jobManagement.config.jobManagerBaseUrl');
const path = `/jobs/${jobId}/tasks`;
nock(jobManagerBaseUrl).post(path).reply(500).persist();

const tasks = tileMergeTaskManager.buildTasks(buildTasksParams);
const tasks = tileMergeTaskManager.buildTasks(buildTasksParams);

const action = async () => tileMergeTaskManager.pushTasks(jobId, tasks);
const action = async () => tileMergeTaskManager.pushTasks(jobId, tasks);

await expect(action).rejects.toThrow();
});
await expect(action).rejects.toThrow();
});
});
});
Loading