2023-07-06 16:37:47 +02:00
|
|
|
import mockfs from 'mock-fs';
|
2023-11-19 23:16:24 +01:00
|
|
|
import { CrawlOptionsDto } from 'src/cores/dto/crawl-options-dto';
|
|
|
|
import { CrawlService } from '.';
|
|
|
|
|
|
|
|
interface Test {
|
|
|
|
test: string;
|
|
|
|
options: CrawlOptionsDto;
|
|
|
|
files: Record<string, boolean>;
|
|
|
|
}
|
|
|
|
|
|
|
|
const cwd = process.cwd();
|
|
|
|
|
|
|
|
const tests: Test[] = [
|
|
|
|
{
|
|
|
|
test: 'should return empty when crawling an empty path list',
|
|
|
|
options: {
|
|
|
|
pathsToCrawl: [],
|
|
|
|
},
|
|
|
|
files: {},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
test: 'should crawl a single path',
|
|
|
|
options: {
|
|
|
|
pathsToCrawl: ['/photos/'],
|
|
|
|
},
|
|
|
|
files: {
|
|
|
|
'/photos/image.jpg': true,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
test: 'should exclude by file extension',
|
|
|
|
options: {
|
|
|
|
pathsToCrawl: ['/photos/'],
|
|
|
|
exclusionPatterns: ['**/*.tif'],
|
|
|
|
},
|
|
|
|
files: {
|
|
|
|
'/photos/image.jpg': true,
|
|
|
|
'/photos/image.tif': false,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
test: 'should exclude by file extension without case sensitivity',
|
|
|
|
options: {
|
|
|
|
pathsToCrawl: ['/photos/'],
|
|
|
|
exclusionPatterns: ['**/*.TIF'],
|
|
|
|
},
|
|
|
|
files: {
|
|
|
|
'/photos/image.jpg': true,
|
|
|
|
'/photos/image.tif': false,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
test: 'should exclude by folder',
|
|
|
|
options: {
|
|
|
|
pathsToCrawl: ['/photos/'],
|
|
|
|
exclusionPatterns: ['**/raw/**'],
|
|
|
|
},
|
|
|
|
files: {
|
|
|
|
'/photos/image.jpg': true,
|
|
|
|
'/photos/raw/image.jpg': false,
|
|
|
|
'/photos/raw2/image.jpg': true,
|
|
|
|
'/photos/folder/raw/image.jpg': false,
|
|
|
|
'/photos/crawl/image.jpg': true,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
test: 'should crawl multiple paths',
|
|
|
|
options: {
|
|
|
|
pathsToCrawl: ['/photos/', '/images/', '/albums/'],
|
|
|
|
},
|
|
|
|
files: {
|
|
|
|
'/photos/image1.jpg': true,
|
|
|
|
'/images/image2.jpg': true,
|
|
|
|
'/albums/image3.jpg': true,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
test: 'should support globbing paths',
|
|
|
|
options: {
|
|
|
|
pathsToCrawl: ['/photos*'],
|
|
|
|
},
|
|
|
|
files: {
|
|
|
|
'/photos1/image1.jpg': true,
|
|
|
|
'/photos2/image2.jpg': true,
|
|
|
|
'/images/image3.jpg': false,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
test: 'should crawl a single path without trailing slash',
|
|
|
|
options: {
|
|
|
|
pathsToCrawl: ['/photos'],
|
|
|
|
},
|
|
|
|
files: {
|
|
|
|
'/photos/image.jpg': true,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
test: 'should crawl a single path',
|
|
|
|
options: {
|
|
|
|
pathsToCrawl: ['/photos/'],
|
|
|
|
},
|
|
|
|
files: {
|
|
|
|
'/photos/image.jpg': true,
|
|
|
|
'/photos/subfolder/image1.jpg': true,
|
|
|
|
'/photos/subfolder/image2.jpg': true,
|
|
|
|
'/image1.jpg': false,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
test: 'should filter file extensions',
|
|
|
|
options: {
|
|
|
|
pathsToCrawl: ['/photos/'],
|
|
|
|
},
|
|
|
|
files: {
|
|
|
|
'/photos/image.jpg': true,
|
|
|
|
'/photos/image.txt': false,
|
|
|
|
'/photos/1': false,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
test: 'should include photo and video extensions',
|
|
|
|
options: {
|
|
|
|
pathsToCrawl: ['/photos/', '/videos/'],
|
|
|
|
},
|
|
|
|
files: {
|
|
|
|
'/photos/image.jpg': true,
|
|
|
|
'/photos/image.jpeg': true,
|
|
|
|
'/photos/image.heic': true,
|
|
|
|
'/photos/image.heif': true,
|
|
|
|
'/photos/image.png': true,
|
|
|
|
'/photos/image.gif': true,
|
|
|
|
'/photos/image.tif': true,
|
|
|
|
'/photos/image.tiff': true,
|
|
|
|
'/photos/image.webp': true,
|
|
|
|
'/photos/image.dng': true,
|
|
|
|
'/photos/image.nef': true,
|
|
|
|
'/videos/video.mp4': true,
|
|
|
|
'/videos/video.mov': true,
|
|
|
|
'/videos/video.webm': true,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
test: 'should check file extensions without case sensitivity',
|
|
|
|
options: {
|
|
|
|
pathsToCrawl: ['/photos/'],
|
|
|
|
},
|
|
|
|
files: {
|
|
|
|
'/photos/image.jpg': true,
|
|
|
|
'/photos/image.Jpg': true,
|
|
|
|
'/photos/image.jpG': true,
|
|
|
|
'/photos/image.JPG': true,
|
|
|
|
'/photos/image.jpEg': true,
|
|
|
|
'/photos/image.TIFF': true,
|
|
|
|
'/photos/image.tif': true,
|
|
|
|
'/photos/image.dng': true,
|
|
|
|
'/photos/image.NEF': true,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
test: 'should normalize the path',
|
|
|
|
options: {
|
|
|
|
pathsToCrawl: ['/photos/1/../2'],
|
|
|
|
},
|
|
|
|
files: {
|
|
|
|
'/photos/1/image.jpg': false,
|
|
|
|
'/photos/2/image.jpg': true,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
test: 'should return absolute paths',
|
|
|
|
options: {
|
|
|
|
pathsToCrawl: ['photos'],
|
|
|
|
},
|
|
|
|
files: {
|
|
|
|
[`${cwd}/photos/1.jpg`]: true,
|
|
|
|
[`${cwd}/photos/2.jpg`]: true,
|
|
|
|
[`/photos/3.jpg`]: false,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
];
|
|
|
|
|
|
|
|
describe(CrawlService.name, () => {
|
|
|
|
const sut = new CrawlService(
|
|
|
|
['.jpg', '.jpeg', '.png', '.heif', '.heic', '.tif', '.nef', '.webp', '.tiff', '.dng', '.gif'],
|
|
|
|
['.mov', '.mp4', '.webm'],
|
|
|
|
);
|
2023-07-06 16:37:47 +02:00
|
|
|
|
2023-11-19 23:16:24 +01:00
|
|
|
afterEach(() => {
|
|
|
|
mockfs.restore();
|
2023-07-06 16:37:47 +02:00
|
|
|
});
|
|
|
|
|
2023-11-19 23:16:24 +01:00
|
|
|
describe('crawl', () => {
|
|
|
|
for (const { test, options, files } of tests) {
|
|
|
|
it(test, async () => {
|
|
|
|
mockfs(Object.fromEntries(Object.keys(files).map((file) => [file, ''])));
|
2023-07-06 16:37:47 +02:00
|
|
|
|
2023-11-19 23:16:24 +01:00
|
|
|
const actual = await sut.crawl(options);
|
|
|
|
const expected = Object.entries(files)
|
|
|
|
.filter((entry) => entry[1])
|
|
|
|
.map(([file]) => file);
|
2023-07-06 16:37:47 +02:00
|
|
|
|
2023-11-19 23:16:24 +01:00
|
|
|
expect(actual.sort()).toEqual(expected.sort());
|
|
|
|
});
|
|
|
|
}
|
2023-07-06 16:37:47 +02:00
|
|
|
});
|
|
|
|
});
|