2024-05-14 21:31:36 +02:00
|
|
|
import { BadRequestException, Inject, Injectable } from '@nestjs/common';
|
|
|
|
import { SystemConfigCore } from 'src/cores/system-config.core';
|
2024-03-20 23:53:07 +01:00
|
|
|
import { AssetResponseDto, mapAsset } from 'src/dtos/asset-response.dto';
|
|
|
|
import { AuthDto } from 'src/dtos/auth.dto';
|
|
|
|
import { PersonResponseDto } from 'src/dtos/person.dto';
|
2024-02-24 01:42:37 +01:00
|
|
|
import {
|
|
|
|
MetadataSearchDto,
|
|
|
|
PlacesResponseDto,
|
|
|
|
SearchPeopleDto,
|
|
|
|
SearchPlacesDto,
|
2024-03-20 23:53:07 +01:00
|
|
|
SearchResponseDto,
|
|
|
|
SearchSuggestionRequestDto,
|
|
|
|
SearchSuggestionType,
|
2024-02-24 01:42:37 +01:00
|
|
|
SmartSearchDto,
|
|
|
|
mapPlaces,
|
2024-03-20 23:53:07 +01:00
|
|
|
} from 'src/dtos/search.dto';
|
2024-03-20 22:02:51 +01:00
|
|
|
import { AssetOrder } from 'src/entities/album.entity';
|
|
|
|
import { AssetEntity } from 'src/entities/asset.entity';
|
2024-05-16 19:08:37 +02:00
|
|
|
import { IAssetRepository, WithoutProperty } from 'src/interfaces/asset.interface';
|
|
|
|
import { ICryptoRepository } from 'src/interfaces/crypto.interface';
|
|
|
|
import {
|
|
|
|
IBaseJob,
|
|
|
|
IEntityJob,
|
|
|
|
IJobRepository,
|
|
|
|
JOBS_ASSET_PAGINATION_SIZE,
|
|
|
|
JobName,
|
|
|
|
JobStatus,
|
|
|
|
} from 'src/interfaces/job.interface';
|
2024-04-16 23:30:31 +02:00
|
|
|
import { ILoggerRepository } from 'src/interfaces/logger.interface';
|
2024-03-21 12:59:49 +01:00
|
|
|
import { IMachineLearningRepository } from 'src/interfaces/machine-learning.interface';
|
|
|
|
import { IMetadataRepository } from 'src/interfaces/metadata.interface';
|
|
|
|
import { IPartnerRepository } from 'src/interfaces/partner.interface';
|
|
|
|
import { IPersonRepository } from 'src/interfaces/person.interface';
|
2024-05-16 19:08:37 +02:00
|
|
|
import { AssetDuplicateResult, ISearchRepository, SearchExploreItem } from 'src/interfaces/search.interface';
|
2024-05-16 00:58:23 +02:00
|
|
|
import { ISystemMetadataRepository } from 'src/interfaces/system-metadata.interface';
|
2024-05-16 19:08:37 +02:00
|
|
|
import { isDuplicateDetectionEnabled, isSmartSearchEnabled } from 'src/utils/misc';
|
|
|
|
import { usePagination } from 'src/utils/pagination';
|
2023-03-18 14:44:42 +01:00
|
|
|
|
2023-03-03 03:47:08 +01:00
|
|
|
@Injectable()
|
|
|
|
export class SearchService {
|
2023-08-25 06:15:03 +02:00
|
|
|
private configCore: SystemConfigCore;
|
2023-03-18 14:44:42 +01:00
|
|
|
|
2023-03-03 03:47:08 +01:00
|
|
|
constructor(
|
2024-05-16 00:58:23 +02:00
|
|
|
@Inject(ISystemMetadataRepository) systemMetadataRepository: ISystemMetadataRepository,
|
2023-03-18 14:44:42 +01:00
|
|
|
@Inject(IMachineLearningRepository) private machineLearning: IMachineLearningRepository,
|
2023-09-27 22:46:46 +02:00
|
|
|
@Inject(IPersonRepository) private personRepository: IPersonRepository,
|
2024-02-13 02:50:47 +01:00
|
|
|
@Inject(ISearchRepository) private searchRepository: ISearchRepository,
|
2023-12-08 17:15:46 +01:00
|
|
|
@Inject(IAssetRepository) private assetRepository: IAssetRepository,
|
2024-01-01 23:25:22 +01:00
|
|
|
@Inject(IPartnerRepository) private partnerRepository: IPartnerRepository,
|
2024-02-13 20:54:58 +01:00
|
|
|
@Inject(IMetadataRepository) private metadataRepository: IMetadataRepository,
|
2024-04-16 23:30:31 +02:00
|
|
|
@Inject(ILoggerRepository) private logger: ILoggerRepository,
|
2024-05-16 19:08:37 +02:00
|
|
|
@Inject(ICryptoRepository) private cryptoRepository: ICryptoRepository,
|
|
|
|
@Inject(IJobRepository) private jobRepository: IJobRepository,
|
2023-03-03 03:47:08 +01:00
|
|
|
) {
|
2024-04-16 23:30:31 +02:00
|
|
|
this.logger.setContext(SearchService.name);
|
2024-05-16 00:58:23 +02:00
|
|
|
this.configCore = SystemConfigCore.create(systemMetadataRepository, logger);
|
2023-03-18 14:44:42 +01:00
|
|
|
}
|
|
|
|
|
2023-12-10 05:34:12 +01:00
|
|
|
async searchPerson(auth: AuthDto, dto: SearchPeopleDto): Promise<PersonResponseDto[]> {
|
|
|
|
return this.personRepository.getByName(auth.user.id, dto.name, { withHidden: dto.withHidden });
|
2023-03-03 03:47:08 +01:00
|
|
|
}
|
|
|
|
|
2024-02-24 01:42:37 +01:00
|
|
|
async searchPlaces(dto: SearchPlacesDto): Promise<PlacesResponseDto[]> {
|
|
|
|
const places = await this.searchRepository.searchPlaces(dto.name);
|
|
|
|
return places.map((place) => mapPlaces(place));
|
|
|
|
}
|
|
|
|
|
2023-12-10 05:34:12 +01:00
|
|
|
async getExploreData(auth: AuthDto): Promise<SearchExploreItem<AssetResponseDto>[]> {
|
2023-12-08 17:15:46 +01:00
|
|
|
const options = { maxFields: 12, minAssetsPerField: 5 };
|
|
|
|
const results = await Promise.all([
|
2023-12-10 05:34:12 +01:00
|
|
|
this.assetRepository.getAssetIdByCity(auth.user.id, options),
|
|
|
|
this.assetRepository.getAssetIdByTag(auth.user.id, options),
|
2023-12-08 17:15:46 +01:00
|
|
|
]);
|
|
|
|
const assetIds = new Set<string>(results.flatMap((field) => field.items.map((item) => item.data)));
|
2024-03-14 06:58:09 +01:00
|
|
|
const assets = await this.assetRepository.getByIdsWithAllRelations([...assetIds]);
|
2023-12-08 17:15:46 +01:00
|
|
|
const assetMap = new Map<string, AssetResponseDto>(assets.map((asset) => [asset.id, mapAsset(asset)]));
|
2023-05-30 19:55:06 +02:00
|
|
|
|
2023-05-28 03:56:17 +02:00
|
|
|
return results.map(({ fieldName, items }) => ({
|
|
|
|
fieldName,
|
2023-12-08 17:15:46 +01:00
|
|
|
items: items.map(({ value, data }) => ({ value, data: assetMap.get(data) as AssetResponseDto })),
|
2023-05-28 03:56:17 +02:00
|
|
|
}));
|
2023-03-05 21:44:31 +01:00
|
|
|
}
|
|
|
|
|
2024-02-13 02:50:47 +01:00
|
|
|
async searchMetadata(auth: AuthDto, dto: MetadataSearchDto): Promise<SearchResponseDto> {
|
|
|
|
let checksum: Buffer | undefined;
|
2024-02-17 18:00:55 +01:00
|
|
|
const userIds = await this.getUserIdsToSearch(auth);
|
2024-02-13 02:50:47 +01:00
|
|
|
|
|
|
|
if (dto.checksum) {
|
|
|
|
const encoding = dto.checksum.length === 28 ? 'base64' : 'hex';
|
|
|
|
checksum = Buffer.from(dto.checksum, encoding);
|
|
|
|
}
|
|
|
|
|
2024-04-02 06:56:56 +02:00
|
|
|
dto.previewPath ??= dto.resizePath;
|
|
|
|
dto.thumbnailPath ??= dto.webpPath;
|
|
|
|
|
2024-02-13 02:50:47 +01:00
|
|
|
const page = dto.page ?? 1;
|
|
|
|
const size = dto.size || 250;
|
|
|
|
const enumToOrder = { [AssetOrder.ASC]: 'ASC', [AssetOrder.DESC]: 'DESC' } as const;
|
|
|
|
const { hasNextPage, items } = await this.searchRepository.searchMetadata(
|
|
|
|
{ page, size },
|
|
|
|
{
|
|
|
|
...dto,
|
|
|
|
checksum,
|
2024-02-17 18:00:55 +01:00
|
|
|
userIds,
|
2024-02-13 02:50:47 +01:00
|
|
|
orderDirection: dto.order ? enumToOrder[dto.order] : 'DESC',
|
|
|
|
},
|
|
|
|
);
|
|
|
|
|
|
|
|
return this.mapResponse(items, hasNextPage ? (page + 1).toString() : null);
|
|
|
|
}
|
|
|
|
|
|
|
|
async searchSmart(auth: AuthDto, dto: SmartSearchDto): Promise<SearchResponseDto> {
|
|
|
|
const { machineLearning } = await this.configCore.getConfig();
|
2024-05-14 21:31:36 +02:00
|
|
|
if (!isSmartSearchEnabled(machineLearning)) {
|
|
|
|
throw new BadRequestException('Smart search is not enabled');
|
|
|
|
}
|
|
|
|
|
2024-02-13 02:50:47 +01:00
|
|
|
const userIds = await this.getUserIdsToSearch(auth);
|
|
|
|
|
|
|
|
const embedding = await this.machineLearning.encodeText(
|
|
|
|
machineLearning.url,
|
|
|
|
{ text: dto.query },
|
|
|
|
machineLearning.clip,
|
|
|
|
);
|
|
|
|
|
|
|
|
const page = dto.page ?? 1;
|
|
|
|
const size = dto.size || 100;
|
|
|
|
const { hasNextPage, items } = await this.searchRepository.searchSmart(
|
|
|
|
{ page, size },
|
|
|
|
{ ...dto, userIds, embedding },
|
|
|
|
);
|
|
|
|
|
|
|
|
return this.mapResponse(items, hasNextPage ? (page + 1).toString() : null);
|
|
|
|
}
|
|
|
|
|
2024-03-20 04:23:57 +01:00
|
|
|
async getAssetsByCity(auth: AuthDto): Promise<AssetResponseDto[]> {
|
|
|
|
const userIds = await this.getUserIdsToSearch(auth);
|
|
|
|
const assets = await this.searchRepository.getAssetsByCity(userIds);
|
|
|
|
return assets.map((asset) => mapAsset(asset));
|
|
|
|
}
|
|
|
|
|
|
|
|
getSearchSuggestions(auth: AuthDto, dto: SearchSuggestionRequestDto): Promise<string[]> {
|
|
|
|
switch (dto.type) {
|
|
|
|
case SearchSuggestionType.COUNTRY: {
|
|
|
|
return this.metadataRepository.getCountries(auth.user.id);
|
|
|
|
}
|
|
|
|
case SearchSuggestionType.STATE: {
|
|
|
|
return this.metadataRepository.getStates(auth.user.id, dto.country);
|
|
|
|
}
|
|
|
|
case SearchSuggestionType.CITY: {
|
|
|
|
return this.metadataRepository.getCities(auth.user.id, dto.country, dto.state);
|
|
|
|
}
|
|
|
|
case SearchSuggestionType.CAMERA_MAKE: {
|
|
|
|
return this.metadataRepository.getCameraMakes(auth.user.id, dto.model);
|
|
|
|
}
|
|
|
|
case SearchSuggestionType.CAMERA_MODEL: {
|
|
|
|
return this.metadataRepository.getCameraModels(auth.user.id, dto.make);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-05-16 19:08:37 +02:00
|
|
|
async handleQueueSearchDuplicates({ force }: IBaseJob): Promise<JobStatus> {
|
|
|
|
const { machineLearning } = await this.configCore.getConfig();
|
|
|
|
if (!isDuplicateDetectionEnabled(machineLearning)) {
|
|
|
|
return JobStatus.SKIPPED;
|
|
|
|
}
|
|
|
|
|
|
|
|
const assetPagination = usePagination(JOBS_ASSET_PAGINATION_SIZE, (pagination) => {
|
|
|
|
return force
|
|
|
|
? this.assetRepository.getAll(pagination, { isVisible: true })
|
|
|
|
: this.assetRepository.getWithout(pagination, WithoutProperty.DUPLICATE);
|
|
|
|
});
|
|
|
|
|
|
|
|
for await (const assets of assetPagination) {
|
|
|
|
await this.jobRepository.queueAll(
|
|
|
|
assets.map((asset) => ({ name: JobName.DUPLICATE_DETECTION, data: { id: asset.id } })),
|
|
|
|
);
|
|
|
|
}
|
|
|
|
|
|
|
|
return JobStatus.SUCCESS;
|
|
|
|
}
|
|
|
|
|
|
|
|
async handleSearchDuplicates({ id }: IEntityJob): Promise<JobStatus> {
|
|
|
|
const { machineLearning } = await this.configCore.getConfig();
|
|
|
|
if (!isDuplicateDetectionEnabled(machineLearning)) {
|
|
|
|
return JobStatus.SKIPPED;
|
|
|
|
}
|
|
|
|
|
|
|
|
const asset = await this.assetRepository.getById(id, { smartSearch: true });
|
|
|
|
if (!asset) {
|
|
|
|
this.logger.error(`Asset ${id} not found`);
|
|
|
|
return JobStatus.FAILED;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!asset.isVisible) {
|
|
|
|
this.logger.debug(`Asset ${id} is not visible, skipping`);
|
|
|
|
return JobStatus.SKIPPED;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!asset.previewPath) {
|
|
|
|
this.logger.warn(`Asset ${id} is missing preview image`);
|
|
|
|
return JobStatus.FAILED;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!asset.smartSearch?.embedding) {
|
|
|
|
this.logger.debug(`Asset ${id} is missing embedding`);
|
|
|
|
return JobStatus.FAILED;
|
|
|
|
}
|
|
|
|
|
|
|
|
const duplicateAssets = await this.searchRepository.searchDuplicates({
|
|
|
|
assetId: asset.id,
|
|
|
|
embedding: asset.smartSearch.embedding,
|
|
|
|
maxDistance: machineLearning.duplicateDetection.maxDistance,
|
|
|
|
userIds: [asset.ownerId],
|
|
|
|
});
|
|
|
|
|
|
|
|
let assetIds = [asset.id];
|
|
|
|
if (duplicateAssets.length > 0) {
|
|
|
|
this.logger.debug(
|
|
|
|
`Found ${duplicateAssets.length} duplicate${duplicateAssets.length === 1 ? '' : 's'} for asset ${asset.id}`,
|
|
|
|
);
|
|
|
|
assetIds = await this.updateDuplicates(asset, duplicateAssets);
|
|
|
|
} else if (asset.duplicateId) {
|
|
|
|
this.logger.debug(`No duplicates found for asset ${asset.id}, removing duplicateId`);
|
|
|
|
await this.assetRepository.update({ id: asset.id, duplicateId: null });
|
|
|
|
}
|
|
|
|
|
|
|
|
const duplicatesDetectedAt = new Date();
|
|
|
|
await this.assetRepository.upsertJobStatus(...assetIds.map((assetId) => ({ assetId, duplicatesDetectedAt })));
|
|
|
|
|
|
|
|
return JobStatus.SUCCESS;
|
|
|
|
}
|
|
|
|
|
|
|
|
private async updateDuplicates(asset: AssetEntity, duplicateAssets: AssetDuplicateResult[]): Promise<string[]> {
|
|
|
|
const duplicateIds = [
|
|
|
|
...new Set(
|
|
|
|
duplicateAssets
|
|
|
|
.filter((asset): asset is AssetDuplicateResult & { duplicateId: string } => !!asset.duplicateId)
|
|
|
|
.map((duplicate) => duplicate.duplicateId),
|
|
|
|
),
|
|
|
|
];
|
|
|
|
|
|
|
|
const targetDuplicateId = asset.duplicateId ?? duplicateIds.shift() ?? this.cryptoRepository.randomUUID();
|
|
|
|
const assetIdsToUpdate = duplicateAssets
|
|
|
|
.filter((asset) => asset.duplicateId !== targetDuplicateId)
|
|
|
|
.map((duplicate) => duplicate.assetId);
|
|
|
|
assetIdsToUpdate.push(asset.id);
|
|
|
|
|
|
|
|
await this.assetRepository.updateDuplicates({ targetDuplicateId, assetIds: assetIdsToUpdate, duplicateIds });
|
|
|
|
return assetIdsToUpdate;
|
|
|
|
}
|
|
|
|
|
2024-01-01 23:25:22 +01:00
|
|
|
private async getUserIdsToSearch(auth: AuthDto): Promise<string[]> {
|
|
|
|
const userIds: string[] = [auth.user.id];
|
|
|
|
const partners = await this.partnerRepository.getAll(auth.user.id);
|
|
|
|
const partnersIds = partners
|
|
|
|
.filter((partner) => partner.sharedBy && partner.inTimeline)
|
|
|
|
.map((partner) => partner.sharedById);
|
|
|
|
userIds.push(...partnersIds);
|
|
|
|
return userIds;
|
|
|
|
}
|
2024-02-13 02:50:47 +01:00
|
|
|
|
2024-03-05 23:23:06 +01:00
|
|
|
private mapResponse(assets: AssetEntity[], nextPage: string | null): SearchResponseDto {
|
2024-02-13 02:50:47 +01:00
|
|
|
return {
|
|
|
|
albums: { total: 0, count: 0, items: [], facets: [] },
|
|
|
|
assets: {
|
|
|
|
total: assets.length,
|
|
|
|
count: assets.length,
|
|
|
|
items: assets.map((asset) => mapAsset(asset)),
|
|
|
|
facets: [],
|
|
|
|
nextPage,
|
|
|
|
},
|
|
|
|
};
|
|
|
|
}
|
2023-03-03 03:47:08 +01:00
|
|
|
}
|