2023-07-06 16:37:47 +02:00
|
|
|
import mockfs from 'mock-fs';
|
2024-03-22 15:30:24 +01:00
|
|
|
import { CrawlOptions, crawl } from 'src/utils';
|
2023-11-19 23:16:24 +01:00
|
|
|
|
|
|
|
/** One table-driven scenario for the `crawl` suite. */
interface Test {
  /** Title passed to `it` for this scenario. */
  test: string;
  /** Options forwarded to `crawl`; `extensions` is omitted because the suite injects a shared list. */
  options: Omit<CrawlOptions, 'extensions'>;
  /** Paths created in the mocked filesystem, mapped to whether `crawl` is expected to return them. */
  files: Record<string, boolean>;
}
|
|
|
|
|
|
|
|
// Working directory captured once at module load; the fixtures use it to build the
// absolute paths expected when a relative entry is passed in `pathsToCrawl`.
const cwd = process.cwd();
|
|
|
|
|
2024-03-22 15:30:24 +01:00
|
|
|
/**
 * File extensions passed to `crawl` in every scenario.
 * All entries are lowercase and include the leading dot.
 */
const extensions = [
  '.jpg',
  '.jpeg',
  '.png',
  '.heif',
  '.heic',
  '.tif',
  '.nef',
  '.webp',
  '.tiff',
  '.dng',
  '.gif',
  '.mov',
  '.mp4',
  '.webm',
];
|
|
|
|
|
2023-11-19 23:16:24 +01:00
|
|
|
/**
 * Scenario table for the `crawl` suite.
 *
 * Every key of `files` is created in the mocked filesystem; the boolean value states
 * whether that path must appear in the crawl result (`true`) or must be absent (`false`).
 */
const tests: Test[] = [
  // --- Basic path handling ---
  {
    test: 'should return empty when crawling an empty path list',
    options: {
      pathsToCrawl: [],
    },
    files: {},
  },
  {
    test: 'should crawl a single folder',
    options: {
      pathsToCrawl: ['/photos/'],
    },
    files: {
      '/photos/image.jpg': true,
    },
  },
  {
    test: 'should crawl a single file',
    options: {
      pathsToCrawl: ['/photos/image.jpg'],
    },
    files: {
      '/photos/image.jpg': true,
    },
  },
  {
    test: 'should crawl a single file and a folder',
    options: {
      pathsToCrawl: ['/photos/image.jpg', '/images/'],
    },
    files: {
      '/photos/image.jpg': true,
      '/images/image2.jpg': true,
    },
  },

  // --- Exclusion patterns ---
  {
    test: 'should exclude by file extension',
    options: {
      pathsToCrawl: ['/photos/'],
      exclusionPattern: '**/*.tif',
    },
    files: {
      '/photos/image.jpg': true,
      '/photos/image.tif': false,
    },
  },
  {
    // Upper-case pattern against a lower-case file name.
    test: 'should exclude by file extension without case sensitivity',
    options: {
      pathsToCrawl: ['/photos/'],
      exclusionPattern: '**/*.TIF',
    },
    files: {
      '/photos/image.jpg': true,
      '/photos/image.tif': false,
    },
  },
  {
    // Only folders named exactly `raw` are excluded, at any depth; `raw2` is kept.
    test: 'should exclude by folder',
    options: {
      pathsToCrawl: ['/photos/'],
      exclusionPattern: '**/raw/**',
      recursive: true,
    },
    files: {
      '/photos/image.jpg': true,
      '/photos/raw/image.jpg': false,
      '/photos/raw2/image.jpg': true,
      '/photos/folder/raw/image.jpg': false,
      '/photos/crawl/image.jpg': true,
    },
  },

  // --- Multiple paths, globbing and recursion ---
  {
    test: 'should crawl multiple paths',
    options: {
      pathsToCrawl: ['/photos/', '/images/', '/albums/'],
    },
    files: {
      '/photos/image1.jpg': true,
      '/images/image2.jpg': true,
      '/albums/image3.jpg': true,
    },
  },
  {
    test: 'should support globbing paths',
    options: {
      pathsToCrawl: ['/photos*'],
    },
    files: {
      '/photos1/image1.jpg': true,
      '/photos2/image2.jpg': true,
      '/images/image3.jpg': false,
    },
  },
  {
    test: 'should crawl a single path without trailing slash',
    options: {
      pathsToCrawl: ['/photos'],
    },
    files: {
      '/photos/image.jpg': true,
    },
  },
  {
    // Runs with `recursive: true`: files in `subfolder` are expected, while the file
    // outside the crawled root is not.
    test: 'should crawl a single path',
    options: {
      pathsToCrawl: ['/photos/'],
      recursive: true,
    },
    files: {
      '/photos/image.jpg': true,
      '/photos/subfolder/image1.jpg': true,
      '/photos/subfolder/image2.jpg': true,
      '/image1.jpg': false,
    },
  },

  // --- Extension filtering ---
  {
    // Covers an unlisted extension (`.txt`) and a file with no extension at all.
    test: 'should filter file extensions',
    options: {
      pathsToCrawl: ['/photos/'],
    },
    files: {
      '/photos/image.jpg': true,
      '/photos/image.txt': false,
      '/photos/1': false,
    },
  },
  {
    test: 'should include photo and video extensions',
    options: {
      pathsToCrawl: ['/photos/', '/videos/'],
    },
    files: {
      '/photos/image.jpg': true,
      '/photos/image.jpeg': true,
      '/photos/image.heic': true,
      '/photos/image.heif': true,
      '/photos/image.png': true,
      '/photos/image.gif': true,
      '/photos/image.tif': true,
      '/photos/image.tiff': true,
      '/photos/image.webp': true,
      '/photos/image.dng': true,
      '/photos/image.nef': true,
      '/videos/video.mp4': true,
      '/videos/video.mov': true,
      '/videos/video.webm': true,
    },
  },
  {
    test: 'should check file extensions without case sensitivity',
    options: {
      pathsToCrawl: ['/photos/'],
    },
    files: {
      '/photos/image.jpg': true,
      '/photos/image.Jpg': true,
      '/photos/image.jpG': true,
      '/photos/image.JPG': true,
      '/photos/image.jpEg': true,
      '/photos/image.TIFF': true,
      '/photos/image.tif': true,
      '/photos/image.dng': true,
      '/photos/image.NEF': true,
    },
  },

  // --- Path normalisation ---
  {
    // `/photos/1/../2` must resolve to `/photos/2`.
    test: 'should normalize the path',
    options: {
      pathsToCrawl: ['/photos/1/../2'],
    },
    files: {
      '/photos/1/image.jpg': false,
      '/photos/2/image.jpg': true,
    },
  },
  {
    // A relative entry is expected to come back as absolute paths under `cwd`; the
    // root-level `/photos` folder must not be picked up.
    test: 'should return absolute paths',
    options: {
      pathsToCrawl: ['photos'],
    },
    files: {
      [`${cwd}/photos/1.jpg`]: true,
      [`${cwd}/photos/2.jpg`]: true,
      '/photos/3.jpg': false,
    },
  },

  // --- Ignore patterns ---
  {
    test: 'should support ignoring full filename',
    options: {
      pathsToCrawl: ['/photos'],
      exclusionPattern: '**/image2.jpg',
    },
    files: {
      '/photos/image1.jpg': true,
      '/photos/image2.jpg': false,
      '/photos/image3.jpg': true,
    },
  },
  {
    test: 'should support ignoring file extensions',
    options: {
      pathsToCrawl: ['/photos'],
      exclusionPattern: '**/*.png',
    },
    files: {
      '/photos/image1.jpg': true,
      '/photos/image2.png': false,
      '/photos/image3.jpg': true,
    },
  },
  {
    // `notraw` only contains the excluded name as a substring and must still be crawled.
    test: 'should support ignoring folder names',
    options: {
      pathsToCrawl: ['/photos'],
      recursive: true,
      exclusionPattern: '**/raw/**',
    },
    files: {
      '/photos/image1.jpg': true,
      '/photos/image/image1.jpg': true,
      '/photos/raw/image2.dng': false,
      '/photos/raw/image3.dng': false,
      '/photos/notraw/image3.jpg': true,
    },
  },
  {
    test: 'should support ignoring absolute paths',
    options: {
      pathsToCrawl: ['/'],
      recursive: true,
      exclusionPattern: '/images/**',
    },
    files: {
      '/photos/image1.jpg': true,
      '/images/image2.jpg': false,
      '/assets/image3.jpg': true,
    },
  },
];
|
|
|
|
|
2024-03-22 15:30:24 +01:00
|
|
|
/**
 * Table-driven suite for `crawl`: every entry of `tests` is registered as one `it` case.
 * Each case builds a mocked filesystem from the entry's `files`, runs `crawl` with the
 * entry's options plus the shared `extensions`, and compares the returned paths with the
 * paths flagged `true`.
 */
describe('crawl', () => {
  // Undo the mock-fs patching after every case so one case's fixtures never leak into the next.
  afterEach(() => {
    mockfs.restore();
  });

  describe('crawl', () => {
    // `test` is aliased to `title` so the binding cannot shadow a `test` global, should the
    // runner expose one alongside `it`.
    for (const { test: title, options, files } of tests) {
      it(title, async () => {
        // Create every listed path, expected or not, as an empty file.
        mockfs(Object.fromEntries(Object.keys(files).map((file) => [file, ''])));

        const actual = await crawl({ ...options, extensions });

        // Only the paths flagged `true` should be returned.
        const expected = Object.entries(files)
          .filter(([, shouldBeFound]) => shouldBeFound)
          .map(([file]) => file);

        // Compare order-insensitively; sort copies so neither array is mutated in place.
        expect([...actual].sort()).toEqual([...expected].sort());
      });
    }
  });
});
|