mirror of
https://github.com/immich-app/immich.git
synced 2025-01-28 06:32:44 +01:00
refactor(server): telemetry env variables (#13705)
refactor(server)!: telemetry env variables Co-authored-by: Mert <101130780+mertalev@users.noreply.github.com>
This commit is contained in:
parent
bc06863d28
commit
151ba9f1d9
10 changed files with 67 additions and 79 deletions
|
@ -25,10 +25,10 @@ The metrics in immich are grouped into API (endpoint calls and response times),
|
||||||
|
|
||||||
### Configuration
|
### Configuration
|
||||||
|
|
||||||
Immich will not expose an endpoint for metrics by default. To enable this endpoint, you can add the `IMMICH_METRICS=true` environmental variable to your `.env` file. Note that only the server and microservices containers currently use this variable.
|
Immich will not expose an endpoint for metrics by default. To enable this endpoint, you can add the `IMMICH_TELEMETRY_INCLUDE=all` environmental variable to your `.env` file. Note that only the server container currently use this variable.
|
||||||
|
|
||||||
:::tip
|
:::tip
|
||||||
`IMMICH_METRICS` enables all metrics, but there are also [environmental variables](/docs/install/environment-variables.md#prometheus) to toggle specific metric groups. If you'd like to only expose certain kinds of metrics, you can set only those environmental variables to `true`. Explicitly setting the environmental variable for a metric group overrides `IMMICH_METRICS` for that group. For example, setting `IMMICH_METRICS=true` and `IMMICH_API_METRICS=false` will enable all metrics except API metrics.
|
`IMMICH_TELEMETRY_INCLUDE=all` enables all metrics. For a more granular configuration you can enumerate the telemetry metrics that should be included as a comma separated list (e.g. `IMMICH_TELEMETRY_INCLUDE=repo,api`). Alternatively, you can also exclude specific metrics with `IMMICH_TELEMETRY_EXCLUDE`. For more information refer to the [environment section](/docs/install/environment-variables.md#prometheus).
|
||||||
:::
|
:::
|
||||||
|
|
||||||
The next step is to configure a new or existing Prometheus instance to scrape this endpoint. The following steps assume that you do not have an existing Prometheus instance, but the steps will be similar either way.
|
The next step is to configure a new or existing Prometheus instance to scrape this endpoint. The following steps assume that you do not have an existing Prometheus instance, but the steps will be similar either way.
|
||||||
|
|
|
@ -183,15 +183,10 @@ Other machine learning parameters can be tuned from the admin UI.
|
||||||
|
|
||||||
## Prometheus
|
## Prometheus
|
||||||
|
|
||||||
| Variable | Description | Default | Containers | Workers |
|
| Variable | Description | Default | Containers | Workers |
|
||||||
| :----------------------------- | :-------------------------------------------------------------------------------------------- | :-----: | :--------- | :----------------- |
|
| :------------------------- | :-------------------------------------------------------------------------------------------------------------------- | :-----: | :--------- | :----------------- |
|
||||||
| `IMMICH_METRICS`<sup>\*1</sup> | Toggle all metrics (one of [`true`, `false`]) | | server | api, microservices |
|
| `IMMICH_TELEMETRY_INCLUDE` | Collect these telemetries. List of `host`, `api`, `io`, `repo`, `job`. Note: You can also specify `all` to enable all | | server | api, microservices |
|
||||||
| `IMMICH_API_METRICS` | Toggle metrics for endpoints and response times (one of [`true`, `false`]) | | server | api, microservices |
|
| `IMMICH_TELEMETRY_EXCLUDE` | Do not collect these telemetries. List of `host`, `api`, `io`, `repo`, `job` | | server | api, microservices |
|
||||||
| `IMMICH_HOST_METRICS` | Toggle metrics for CPU and memory utilization for host and process (one of [`true`, `false`]) | | server | api, microservices |
|
|
||||||
| `IMMICH_IO_METRICS` | Toggle metrics for database queries, image processing, etc. (one of [`true`, `false`]) | | server | api, microservices |
|
|
||||||
| `IMMICH_JOB_METRICS` | Toggle metrics for jobs and queues (one of [`true`, `false`]) | | server | api, microservices |
|
|
||||||
|
|
||||||
\*1: Overridden for a metric group when its corresponding environmental variable is set.
|
|
||||||
|
|
||||||
## Docker Secrets
|
## Docker Secrets
|
||||||
|
|
||||||
|
|
|
@ -363,3 +363,11 @@ export enum ImmichWorker {
|
||||||
API = 'api',
|
API = 'api',
|
||||||
MICROSERVICES = 'microservices',
|
MICROSERVICES = 'microservices',
|
||||||
}
|
}
|
||||||
|
|
||||||
|
export enum ImmichTelemetry {
|
||||||
|
HOST = 'host',
|
||||||
|
API = 'api',
|
||||||
|
IO = 'io',
|
||||||
|
REPO = 'repo',
|
||||||
|
JOB = 'job',
|
||||||
|
}
|
||||||
|
|
|
@ -2,7 +2,7 @@ import { RegisterQueueOptions } from '@nestjs/bullmq';
|
||||||
import { QueueOptions } from 'bullmq';
|
import { QueueOptions } from 'bullmq';
|
||||||
import { RedisOptions } from 'ioredis';
|
import { RedisOptions } from 'ioredis';
|
||||||
import { OpenTelemetryModuleOptions } from 'nestjs-otel/lib/interfaces';
|
import { OpenTelemetryModuleOptions } from 'nestjs-otel/lib/interfaces';
|
||||||
import { ImmichEnvironment, ImmichWorker, LogLevel } from 'src/enum';
|
import { ImmichEnvironment, ImmichTelemetry, ImmichWorker, LogLevel } from 'src/enum';
|
||||||
import { VectorExtension } from 'src/interfaces/database.interface';
|
import { VectorExtension } from 'src/interfaces/database.interface';
|
||||||
|
|
||||||
export const IConfigRepository = 'IConfigRepository';
|
export const IConfigRepository = 'IConfigRepository';
|
||||||
|
@ -77,11 +77,7 @@ export interface EnvData {
|
||||||
telemetry: {
|
telemetry: {
|
||||||
apiPort: number;
|
apiPort: number;
|
||||||
microservicesPort: number;
|
microservicesPort: number;
|
||||||
enabled: boolean;
|
metrics: Set<ImmichTelemetry>;
|
||||||
apiMetrics: boolean;
|
|
||||||
hostMetrics: boolean;
|
|
||||||
repoMetrics: boolean;
|
|
||||||
jobMetrics: boolean;
|
|
||||||
};
|
};
|
||||||
|
|
||||||
storage: {
|
storage: {
|
||||||
|
|
|
@ -1,3 +1,4 @@
|
||||||
|
import { ImmichTelemetry } from 'src/enum';
|
||||||
import { clearEnvCache, ConfigRepository } from 'src/repositories/config.repository';
|
import { clearEnvCache, ConfigRepository } from 'src/repositories/config.repository';
|
||||||
|
|
||||||
const getEnv = () => {
|
const getEnv = () => {
|
||||||
|
@ -12,11 +13,8 @@ const resetEnv = () => {
|
||||||
'IMMICH_TRUSTED_PROXIES',
|
'IMMICH_TRUSTED_PROXIES',
|
||||||
'IMMICH_API_METRICS_PORT',
|
'IMMICH_API_METRICS_PORT',
|
||||||
'IMMICH_MICROSERVICES_METRICS_PORT',
|
'IMMICH_MICROSERVICES_METRICS_PORT',
|
||||||
'IMMICH_METRICS',
|
'IMMICH_TELEMETRY_INCLUDE',
|
||||||
'IMMICH_API_METRICS',
|
'IMMICH_TELEMETRY_EXCLUDE',
|
||||||
'IMMICH_HOST_METRICS',
|
|
||||||
'IMMICH_IO_METRICS',
|
|
||||||
'IMMICH_JOB_METRICS',
|
|
||||||
|
|
||||||
'DB_URL',
|
'DB_URL',
|
||||||
'DB_HOSTNAME',
|
'DB_HOSTNAME',
|
||||||
|
@ -210,11 +208,7 @@ describe('getEnv', () => {
|
||||||
expect(telemetry).toEqual({
|
expect(telemetry).toEqual({
|
||||||
apiPort: 8081,
|
apiPort: 8081,
|
||||||
microservicesPort: 8082,
|
microservicesPort: 8082,
|
||||||
enabled: false,
|
metrics: new Set([]),
|
||||||
apiMetrics: false,
|
|
||||||
hostMetrics: false,
|
|
||||||
jobMetrics: false,
|
|
||||||
repoMetrics: false,
|
|
||||||
});
|
});
|
||||||
});
|
});
|
||||||
|
|
||||||
|
@ -225,32 +219,29 @@ describe('getEnv', () => {
|
||||||
expect(telemetry).toMatchObject({
|
expect(telemetry).toMatchObject({
|
||||||
apiPort: 2001,
|
apiPort: 2001,
|
||||||
microservicesPort: 2002,
|
microservicesPort: 2002,
|
||||||
|
metrics: expect.any(Set),
|
||||||
});
|
});
|
||||||
});
|
});
|
||||||
|
|
||||||
it('should run with telemetry enabled', () => {
|
it('should run with telemetry enabled', () => {
|
||||||
process.env.IMMICH_METRICS = 'true';
|
process.env.IMMICH_TELEMETRY_INCLUDE = 'all';
|
||||||
const { telemetry } = getEnv();
|
const { telemetry } = getEnv();
|
||||||
expect(telemetry).toMatchObject({
|
expect(telemetry.metrics).toEqual(new Set(Object.values(ImmichTelemetry)));
|
||||||
enabled: true,
|
|
||||||
apiMetrics: true,
|
|
||||||
hostMetrics: true,
|
|
||||||
jobMetrics: true,
|
|
||||||
repoMetrics: true,
|
|
||||||
});
|
|
||||||
});
|
});
|
||||||
|
|
||||||
it('should run with telemetry enabled and jobs disabled', () => {
|
it('should run with telemetry enabled and jobs disabled', () => {
|
||||||
process.env.IMMICH_METRICS = 'true';
|
process.env.IMMICH_TELEMETRY_INCLUDE = 'all';
|
||||||
process.env.IMMICH_JOB_METRICS = 'false';
|
process.env.IMMICH_TELEMETRY_EXCLUDE = 'job';
|
||||||
const { telemetry } = getEnv();
|
const { telemetry } = getEnv();
|
||||||
expect(telemetry).toMatchObject({
|
expect(telemetry.metrics).toEqual(
|
||||||
enabled: true,
|
new Set([ImmichTelemetry.API, ImmichTelemetry.HOST, ImmichTelemetry.IO, ImmichTelemetry.REPO]),
|
||||||
apiMetrics: true,
|
);
|
||||||
hostMetrics: true,
|
});
|
||||||
jobMetrics: false,
|
|
||||||
repoMetrics: true,
|
it('should run with specific telemetry metrics', () => {
|
||||||
});
|
process.env.IMMICH_TELEMETRY_INCLUDE = 'io, host, api';
|
||||||
|
const { telemetry } = getEnv();
|
||||||
|
expect(telemetry.metrics).toEqual(new Set([ImmichTelemetry.API, ImmichTelemetry.HOST, ImmichTelemetry.IO]));
|
||||||
});
|
});
|
||||||
});
|
});
|
||||||
});
|
});
|
||||||
|
|
|
@ -2,7 +2,7 @@ import { Injectable } from '@nestjs/common';
|
||||||
import { join } from 'node:path';
|
import { join } from 'node:path';
|
||||||
import { citiesFile, excludePaths } from 'src/constants';
|
import { citiesFile, excludePaths } from 'src/constants';
|
||||||
import { Telemetry } from 'src/decorators';
|
import { Telemetry } from 'src/decorators';
|
||||||
import { ImmichEnvironment, ImmichWorker, LogLevel } from 'src/enum';
|
import { ImmichEnvironment, ImmichTelemetry, ImmichWorker, LogLevel } from 'src/enum';
|
||||||
import { EnvData, IConfigRepository } from 'src/interfaces/config.interface';
|
import { EnvData, IConfigRepository } from 'src/interfaces/config.interface';
|
||||||
import { DatabaseExtension } from 'src/interfaces/database.interface';
|
import { DatabaseExtension } from 'src/interfaces/database.interface';
|
||||||
import { QueueName } from 'src/interfaces/job.interface';
|
import { QueueName } from 'src/interfaces/job.interface';
|
||||||
|
@ -25,18 +25,17 @@ const stagingKeys = {
|
||||||
};
|
};
|
||||||
|
|
||||||
const WORKER_TYPES = new Set(Object.values(ImmichWorker));
|
const WORKER_TYPES = new Set(Object.values(ImmichWorker));
|
||||||
|
const TELEMETRY_TYPES = new Set(Object.values(ImmichTelemetry));
|
||||||
|
|
||||||
const asSet = (value: string | undefined, defaults: ImmichWorker[]) => {
|
const asSet = <T>(value: string | undefined, defaults: T[]) => {
|
||||||
const values = (value || '').replaceAll(/\s/g, '').split(',').filter(Boolean);
|
const values = (value || '').replaceAll(/\s/g, '').split(',').filter(Boolean);
|
||||||
return new Set(values.length === 0 ? defaults : (values as ImmichWorker[]));
|
return new Set(values.length === 0 ? defaults : (values as T[]));
|
||||||
};
|
};
|
||||||
|
|
||||||
const parseBoolean = (value: string | undefined, defaultValue: boolean) => (value ? value === 'true' : defaultValue);
|
|
||||||
|
|
||||||
const getEnv = (): EnvData => {
|
const getEnv = (): EnvData => {
|
||||||
const included = asSet(process.env.IMMICH_WORKERS_INCLUDE, [ImmichWorker.API, ImmichWorker.MICROSERVICES]);
|
const includedWorkers = asSet(process.env.IMMICH_WORKERS_INCLUDE, [ImmichWorker.API, ImmichWorker.MICROSERVICES]);
|
||||||
const excluded = asSet(process.env.IMMICH_WORKERS_EXCLUDE, []);
|
const excludedWorkers = asSet(process.env.IMMICH_WORKERS_EXCLUDE, []);
|
||||||
const workers = [...setDifference(included, excluded)];
|
const workers = [...setDifference(includedWorkers, excludedWorkers)];
|
||||||
for (const worker of workers) {
|
for (const worker of workers) {
|
||||||
if (!WORKER_TYPES.has(worker)) {
|
if (!WORKER_TYPES.has(worker)) {
|
||||||
throw new Error(`Invalid worker(s) found: ${workers.join(',')}`);
|
throw new Error(`Invalid worker(s) found: ${workers.join(',')}`);
|
||||||
|
@ -69,12 +68,18 @@ const getEnv = (): EnvData => {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
const globalEnabled = parseBoolean(process.env.IMMICH_METRICS, false);
|
const includedTelemetries =
|
||||||
const hostMetrics = parseBoolean(process.env.IMMICH_HOST_METRICS, globalEnabled);
|
process.env.IMMICH_TELEMETRY_INCLUDE === 'all'
|
||||||
const apiMetrics = parseBoolean(process.env.IMMICH_API_METRICS, globalEnabled);
|
? new Set(Object.values(ImmichTelemetry))
|
||||||
const repoMetrics = parseBoolean(process.env.IMMICH_IO_METRICS, globalEnabled);
|
: asSet<ImmichTelemetry>(process.env.IMMICH_TELEMETRY_INCLUDE, []);
|
||||||
const jobMetrics = parseBoolean(process.env.IMMICH_JOB_METRICS, globalEnabled);
|
|
||||||
const telemetryEnabled = globalEnabled || hostMetrics || apiMetrics || repoMetrics || jobMetrics;
|
const excludedTelemetries = asSet<ImmichTelemetry>(process.env.IMMICH_TELEMETRY_EXCLUDE, []);
|
||||||
|
const telemetries = setDifference(includedTelemetries, excludedTelemetries);
|
||||||
|
for (const telemetry of telemetries) {
|
||||||
|
if (!TELEMETRY_TYPES.has(telemetry)) {
|
||||||
|
throw new Error(`Invalid telemetry found: ${telemetry}`);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
return {
|
return {
|
||||||
host: process.env.IMMICH_HOST,
|
host: process.env.IMMICH_HOST,
|
||||||
|
@ -136,9 +141,9 @@ const getEnv = (): EnvData => {
|
||||||
|
|
||||||
otel: {
|
otel: {
|
||||||
metrics: {
|
metrics: {
|
||||||
hostMetrics,
|
hostMetrics: telemetries.has(ImmichTelemetry.HOST),
|
||||||
apiMetrics: {
|
apiMetrics: {
|
||||||
enable: apiMetrics,
|
enable: telemetries.has(ImmichTelemetry.API),
|
||||||
ignoreRoutes: excludePaths,
|
ignoreRoutes: excludePaths,
|
||||||
},
|
},
|
||||||
},
|
},
|
||||||
|
@ -168,11 +173,7 @@ const getEnv = (): EnvData => {
|
||||||
telemetry: {
|
telemetry: {
|
||||||
apiPort: Number(process.env.IMMICH_API_METRICS_PORT || '') || 8081,
|
apiPort: Number(process.env.IMMICH_API_METRICS_PORT || '') || 8081,
|
||||||
microservicesPort: Number(process.env.IMMICH_MICROSERVICES_METRICS_PORT || '') || 8082,
|
microservicesPort: Number(process.env.IMMICH_MICROSERVICES_METRICS_PORT || '') || 8082,
|
||||||
enabled: telemetryEnabled,
|
metrics: telemetries,
|
||||||
hostMetrics,
|
|
||||||
apiMetrics,
|
|
||||||
repoMetrics,
|
|
||||||
jobMetrics,
|
|
||||||
},
|
},
|
||||||
|
|
||||||
workers,
|
workers,
|
||||||
|
|
|
@ -14,7 +14,7 @@ import { snakeCase, startCase } from 'lodash';
|
||||||
import { MetricService } from 'nestjs-otel';
|
import { MetricService } from 'nestjs-otel';
|
||||||
import { copyMetadataFromFunctionToFunction } from 'nestjs-otel/lib/opentelemetry.utils';
|
import { copyMetadataFromFunctionToFunction } from 'nestjs-otel/lib/opentelemetry.utils';
|
||||||
import { serverVersion } from 'src/constants';
|
import { serverVersion } from 'src/constants';
|
||||||
import { MetadataKey } from 'src/enum';
|
import { ImmichTelemetry, MetadataKey } from 'src/enum';
|
||||||
import { IConfigRepository } from 'src/interfaces/config.interface';
|
import { IConfigRepository } from 'src/interfaces/config.interface';
|
||||||
import { ILoggerRepository } from 'src/interfaces/logger.interface';
|
import { ILoggerRepository } from 'src/interfaces/logger.interface';
|
||||||
import { IMetricGroupRepository, ITelemetryRepository, MetricGroupOptions } from 'src/interfaces/telemetry.interface';
|
import { IMetricGroupRepository, ITelemetryRepository, MetricGroupOptions } from 'src/interfaces/telemetry.interface';
|
||||||
|
@ -99,17 +99,18 @@ export class TelemetryRepository implements ITelemetryRepository {
|
||||||
@Inject(ILoggerRepository) private logger: ILoggerRepository,
|
@Inject(ILoggerRepository) private logger: ILoggerRepository,
|
||||||
) {
|
) {
|
||||||
const { telemetry } = this.configRepository.getEnv();
|
const { telemetry } = this.configRepository.getEnv();
|
||||||
const { apiMetrics, hostMetrics, jobMetrics, repoMetrics } = telemetry;
|
const { metrics } = telemetry;
|
||||||
|
|
||||||
this.api = new MetricGroupRepository(metricService).configure({ enabled: apiMetrics });
|
this.api = new MetricGroupRepository(metricService).configure({ enabled: metrics.has(ImmichTelemetry.API) });
|
||||||
this.host = new MetricGroupRepository(metricService).configure({ enabled: hostMetrics });
|
this.host = new MetricGroupRepository(metricService).configure({ enabled: metrics.has(ImmichTelemetry.HOST) });
|
||||||
this.jobs = new MetricGroupRepository(metricService).configure({ enabled: jobMetrics });
|
this.jobs = new MetricGroupRepository(metricService).configure({ enabled: metrics.has(ImmichTelemetry.JOB) });
|
||||||
this.repo = new MetricGroupRepository(metricService).configure({ enabled: repoMetrics });
|
this.repo = new MetricGroupRepository(metricService).configure({ enabled: metrics.has(ImmichTelemetry.REPO) });
|
||||||
}
|
}
|
||||||
|
|
||||||
setup({ repositories }: { repositories: ClassConstructor<unknown>[] }) {
|
setup({ repositories }: { repositories: ClassConstructor<unknown>[] }) {
|
||||||
const { telemetry } = this.configRepository.getEnv();
|
const { telemetry } = this.configRepository.getEnv();
|
||||||
if (!telemetry.enabled || !telemetry.repoMetrics) {
|
const { metrics } = telemetry;
|
||||||
|
if (!metrics.has(ImmichTelemetry.REPO)) {
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -20,7 +20,7 @@ async function bootstrap() {
|
||||||
process.title = 'immich-api';
|
process.title = 'immich-api';
|
||||||
|
|
||||||
const { telemetry, network } = new ConfigRepository().getEnv();
|
const { telemetry, network } = new ConfigRepository().getEnv();
|
||||||
if (telemetry.enabled) {
|
if (telemetry.metrics.size > 0) {
|
||||||
bootstrapTelemetry(telemetry.apiPort);
|
bootstrapTelemetry(telemetry.apiPort);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -11,7 +11,7 @@ import { isStartUpError } from 'src/services/storage.service';
|
||||||
|
|
||||||
export async function bootstrap() {
|
export async function bootstrap() {
|
||||||
const { telemetry } = new ConfigRepository().getEnv();
|
const { telemetry } = new ConfigRepository().getEnv();
|
||||||
if (telemetry.enabled) {
|
if (telemetry.metrics.size > 0) {
|
||||||
bootstrapTelemetry(telemetry.microservicesPort);
|
bootstrapTelemetry(telemetry.microservicesPort);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -73,11 +73,7 @@ const envData: EnvData = {
|
||||||
telemetry: {
|
telemetry: {
|
||||||
apiPort: 8081,
|
apiPort: 8081,
|
||||||
microservicesPort: 8082,
|
microservicesPort: 8082,
|
||||||
enabled: false,
|
metrics: new Set(),
|
||||||
hostMetrics: false,
|
|
||||||
apiMetrics: false,
|
|
||||||
jobMetrics: false,
|
|
||||||
repoMetrics: false,
|
|
||||||
},
|
},
|
||||||
|
|
||||||
workers: [ImmichWorker.API, ImmichWorker.MICROSERVICES],
|
workers: [ImmichWorker.API, ImmichWorker.MICROSERVICES],
|
||||||
|
|
Loading…
Reference in a new issue