diff --git a/docs/reference.cue b/docs/reference.cue index 36ae0bac0342a..e728bbe86f597 100644 --- a/docs/reference.cue +++ b/docs/reference.cue @@ -44,7 +44,7 @@ _values: { // * `sidecar` - Vector is installed alongside each process it is // monitoring. Therefore, there might be multiple Vector processes // on the host. -// * `service` - Vector receives data from one or more upstream +// * `aggregator` - Vector receives data from one or more upstream // sources, typically over a network protocol. #DeploymentRole: "aggregator" | "daemon" | "sidecar" diff --git a/docs/reference/components.cue b/docs/reference/components.cue index 779b77d1ecfca..93b562fb56e1f 100644 --- a/docs/reference/components.cue +++ b/docs/reference/components.cue @@ -354,11 +354,12 @@ components: { } #MetricOutput: [Name=string]: close({ - description: string - relevant_when?: string - tags: #MetricTags - name: Name - type: #MetricType + description: string + relevant_when?: string + tags: #MetricTags + name: Name + type: #MetricType + default_namespace: string }) #Output: { @@ -833,7 +834,8 @@ components: { required: false } } - type: "counter" + type: "counter" + default_namespace: "vector" } _passthrough_distribution: { @@ -845,7 +847,8 @@ components: { required: false } } - type: "distribution" + type: "distribution" + default_namespace: "vector" } _passthrough_gauge: { @@ -857,7 +860,8 @@ components: { required: false } } - type: "gauge" + type: "gauge" + default_namespace: "vector" } _passthrough_histogram: { @@ -869,7 +873,8 @@ components: { required: false } } - type: "gauge" + type: "gauge" + default_namespace: "vector" } _passthrough_set: { @@ -881,7 +886,8 @@ components: { required: false } } - type: "gauge" + type: "gauge" + default_namespace: "vector" } _passthrough_summary: { @@ -893,14 +899,16 @@ components: { required: false } } - type: "gauge" + type: "gauge" + default_namespace: "vector" } } } telemetry: metrics: { // Default metrics for each component - 
vector_events_processed_total: _vector_events_processed_total + events_processed_total: components.sources.internal_metrics.output.metrics.events_processed_total + processed_bytes_total: components.sources.internal_metrics.output.metrics.processed_bytes_total } }} } diff --git a/docs/reference/components/kafka.cue b/docs/reference/components/kafka.cue index af955ab2edc1e..64adb233a5fe7 100644 --- a/docs/reference/components/kafka.cue +++ b/docs/reference/components/kafka.cue @@ -88,4 +88,9 @@ components: _kafka: { """ } } + + telemetry: metrics: { + consumer_offset_updates_failed_total: components.sources.internal_metrics.output.metrics.consumer_offset_updates_failed_total + events_failed_total: components.sources.internal_metrics.output.metrics.events_failed_total + } } diff --git a/docs/reference/components/sinks/aws_cloudwatch_logs.cue b/docs/reference/components/sinks/aws_cloudwatch_logs.cue index 403172e824e1d..5c27382889ad7 100644 --- a/docs/reference/components/sinks/aws_cloudwatch_logs.cue +++ b/docs/reference/components/sinks/aws_cloudwatch_logs.cue @@ -119,4 +119,8 @@ components: sinks: aws_cloudwatch_logs: { logs: true metrics: null } + + telemetry: metrics: { + processing_errors_total: components.sources.internal_metrics.output.metrics.processing_errors_total + } } diff --git a/docs/reference/components/sinks/console.cue b/docs/reference/components/sinks/console.cue index 2f53183d3a54b..579a9c15ebc4b 100644 --- a/docs/reference/components/sinks/console.cue +++ b/docs/reference/components/sinks/console.cue @@ -81,7 +81,6 @@ components: sinks: console: { } telemetry: metrics: { - vector_processed_bytes_total: _vector_processed_bytes_total - vector_processing_errors_total: _vector_processing_errors_total + processing_errors_total: components.sources.internal_metrics.output.metrics.processing_errors_total } } diff --git a/docs/reference/components/sinks/elasticsearch.cue b/docs/reference/components/sinks/elasticsearch.cue index 49bf461eed3bb..f4ac3bdce9a9c 
100644 --- a/docs/reference/components/sinks/elasticsearch.cue +++ b/docs/reference/components/sinks/elasticsearch.cue @@ -239,4 +239,8 @@ components: sinks: elasticsearch: { """ } } + + telemetry: metrics: { + missing_keys_total: components.sources.internal_metrics.output.metrics.missing_keys_total + } } diff --git a/docs/reference/components/sinks/http.cue b/docs/reference/components/sinks/http.cue index e35add2c1dc39..cbd63dd251aae 100644 --- a/docs/reference/components/sinks/http.cue +++ b/docs/reference/components/sinks/http.cue @@ -119,4 +119,8 @@ components: sinks: http: { logs: true metrics: null } + + telemetry: metrics: { + http_bad_requests_total: components.sources.internal_metrics.output.metrics.http_bad_requests_total + } } diff --git a/docs/reference/components/sinks/sematext_metrics.cue b/docs/reference/components/sinks/sematext_metrics.cue index 3bde057adb960..380bb16e0703a 100644 --- a/docs/reference/components/sinks/sematext_metrics.cue +++ b/docs/reference/components/sinks/sematext_metrics.cue @@ -78,4 +78,8 @@ components: sinks: sematext_metrics: { summary: false } } + + telemetry: metrics: { + processing_errors_total: components.sources.internal_metrics.output.metrics.processing_errors_total + } } diff --git a/docs/reference/components/sinks/splunk_hec.cue b/docs/reference/components/sinks/splunk_hec.cue index 6c5a3271b05d4..4350a6924b262 100644 --- a/docs/reference/components/sinks/splunk_hec.cue +++ b/docs/reference/components/sinks/splunk_hec.cue @@ -165,4 +165,9 @@ components: sinks: splunk_hec: { logs: true metrics: null } + + telemetry: metrics: { + http_request_errors_total: components.sources.internal_metrics.output.metrics.http_request_errors_total + http_requests_total: components.sources.internal_metrics.output.metrics.http_requests_total + } } diff --git a/docs/reference/components/sinks/statsd.cue b/docs/reference/components/sinks/statsd.cue index 3f2c4ca305f00..1e5b6678e90e1 100644 --- a/docs/reference/components/sinks/statsd.cue 
+++ b/docs/reference/components/sinks/statsd.cue @@ -63,4 +63,8 @@ components: sinks: statsd: { } } } + + telemetry: metrics: { + processing_errors_total: components.sources.internal_metrics.output.metrics.processing_errors_total + } } diff --git a/docs/reference/components/sinks/vector.cue b/docs/reference/components/sinks/vector.cue index e8b9d81fff732..801c9bd426099 100644 --- a/docs/reference/components/sinks/vector.cue +++ b/docs/reference/components/sinks/vector.cue @@ -84,4 +84,8 @@ components: sinks: vector: { } how_it_works: components.sources.vector.how_it_works + + telemetry: metrics: { + protobuf_decode_errors_total: components.sources.internal_metrics.output.metrics.protobuf_decode_errors_total + } } diff --git a/docs/reference/components/sources/apache_metrics.cue b/docs/reference/components/sources/apache_metrics.cue index 1e2cff445ea1c..a5b3dcc350380 100644 --- a/docs/reference/components/sources/apache_metrics.cue +++ b/docs/reference/components/sources/apache_metrics.cue @@ -112,31 +112,32 @@ components: sources: apache_metrics: { } output: metrics: { - _endpoint: { - description: "The absolute path of originating file." - required: true - examples: ["http://localhost:8080/server-status?auto"] - } - _host: { - description: "The hostname of the Apache HTTP server" - required: true - examples: [_values.local_host] + // Default Apache metrics tags + _apache_metrics_tags: { + endpoint: { + description: "The absolute path of originating file." + required: true + examples: ["http://localhost:8080/server-status?auto"] + } + host: { + description: "The hostname of the Apache HTTP server." + required: true + examples: [_values.local_host] + } } + access_total: { - description: "The total number of time the Apache server has been accessed." - relevant_when: "`ExtendedStatus On`" - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The total number of time the Apache server has been accessed." 
+ relevant_when: "`ExtendedStatus On`" + type: "counter" + default_namespace: "apache" + tags: _apache_metrics_tags } connections: { - description: "The total number of time the Apache server has been accessed." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "The number of connections to the Apache server, by connection state." + type: "gauge" + default_namespace: "apache" + tags: _apache_metrics_tags & { state: { description: "The state of the connection" required: true @@ -145,22 +146,19 @@ components: sources: apache_metrics: { } } cpu_load: { - description: "The current CPU of the Apache server." - relevant_when: "`ExtendedStatus On`" - type: "gauge" - tags: { - endpoint: _endpoint - host: _host - } + description: "The current CPU of the Apache server." + relevant_when: "`ExtendedStatus On`" + type: "gauge" + default_namespace: "apache" + tags: _apache_metrics_tags } cpu_seconds_total: { - description: "The CPU time of various Apache processes." - relevant_when: "`ExtendedStatus On`" - type: "counter" - tags: { - endpoint: _endpoint - host: _host - type: { + description: "The CPU time of various Apache processes." + relevant_when: "`ExtendedStatus On`" + type: "counter" + default_namespace: "apache" + tags: _apache_metrics_tags & { + type: { description: "The state of the connection" required: true examples: ["children_system", "children_user", "system", "user"] @@ -168,20 +166,17 @@ components: sources: apache_metrics: { } } duration_seconds_total: { - description: "The amount of time the Apache server has been running." - relevant_when: "`ExtendedStatus On`" - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The amount of time the Apache server has been running." + relevant_when: "`ExtendedStatus On`" + type: "counter" + default_namespace: "apache" + tags: _apache_metrics_tags } scoreboard: { - description: "The amount of times various Apache server tasks have been run." 
- type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "The amount of times various Apache server tasks have been run." + type: "gauge" + default_namespace: "apache" + tags: _apache_metrics_tags & { state: { description: "The connect state" required: true @@ -190,28 +185,29 @@ components: sources: apache_metrics: { } } sent_bytes_total: { - description: "The amount of bytes sent by the Apache server." - relevant_when: "`ExtendedStatus On`" - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The amount of bytes sent by the Apache server." + relevant_when: "`ExtendedStatus On`" + type: "counter" + default_namespace: "apache" + tags: _apache_metrics_tags + } + up: { + description: "If the Apache server is up or not." + type: "gauge" + default_namespace: "apache" + tags: _apache_metrics_tags } uptime_seconds_total: { - description: "The amount of time the Apache server has been running." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The amount of time the Apache server has been running." + type: "counter" + default_namespace: "apache" + tags: _apache_metrics_tags } workers: { - description: "Apache worker statuses." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "Apache worker statuses." + type: "gauge" + default_namespace: "apache" + tags: _apache_metrics_tags & { state: { description: "The state of the worker" required: true @@ -219,14 +215,6 @@ components: sources: apache_metrics: { } } } - up: { - description: "If the Apache server is up or not." 
- type: "gauge" - tags: { - endpoint: _endpoint - host: _host - } - } } how_it_works: {} diff --git a/docs/reference/components/sources/aws_ecs_metrics.cue b/docs/reference/components/sources/aws_ecs_metrics.cue index 85d494377c351..5984950b4e2c8 100644 --- a/docs/reference/components/sources/aws_ecs_metrics.cue +++ b/docs/reference/components/sources/aws_ecs_metrics.cue @@ -103,6 +103,10 @@ components: sources: aws_ecs_metrics: { } output: metrics: { + _awsecs: { + default_namespace: "awsecs" + } + _tags: { container_id: { description: "The identifier of the ECS container." @@ -142,25 +146,25 @@ components: sources: aws_ecs_metrics: { } } - blkio_recursive_io_merged_total: _blkio_counter & {description: "Total number of bios/requests merged into requests."} - blkio_recursive_io_queued_total: _blkio_counter & {description: "Total number of requests queued up at any given instant."} - blkio_recursive_io_service_bytes_total: _blkio_counter & {description: "Number of bytes transferred to/from the disk."} - blkio_recursive_io_service_time_seconds_total: _blkio_counter & {description: "Total amount of time in seconds between request dispatch and request completion for the IOs done."} - blkio_recursive_io_serviced_total: _blkio_counter & {description: "Number of IOs completed to/from the disk."} - blkio_recursive_io_time_seconds_total: _blkio_counter & {description: "Disk time allocated per device in seconds."} - blkio_recursive_io_wait_time_seconds_total: _blkio_counter & {description: "Total amount of time in seconds the IOs spent waiting in the scheduler queues for service."} - blkio_recursive_sectors_total: _blkio_counter & {description: "Number of sectors transferred to/from disk."} - - cpu_online_cpus: _gauge & {description: "Number of CPU cores."} - cpu_usage_system_jiffies_total: _counter & {description: "Jiffies of CPU time used by the system."} - cpu_usage_usermode_jiffies_total: _counter & {description: "Jiffies of CPU time spent in user mode by the 
container."} - cpu_usage_kernelmode_jiffies_total: _counter & {description: "Jiffies of CPU time spent in kernel mode by the container."} - cpu_usage_total_jiffies_total: _counter & {description: "Jiffies of CPU time used by the container."} - cpu_throttling_periods_total: _counter & {description: "Number of periods."} - cpu_throttled_periods_total: _counter & {description: "Number of periods throttled."} - cpu_throttled_time_seconds_total: _counter & {description: "Throttling time in seconds."} - - cpu_usage_percpu_jiffies_total: { + blkio_recursive_io_merged_total: _awsecs & _blkio_counter & {description: "Total number of bios/requests merged into requests."} + blkio_recursive_io_queued_total: _awsecs & _blkio_counter & {description: "Total number of requests queued up at any given instant."} + blkio_recursive_io_service_bytes_total: _awsecs & _blkio_counter & {description: "Number of bytes transferred to/from the disk."} + blkio_recursive_io_service_time_seconds_total: _awsecs & _blkio_counter & {description: "Total amount of time in seconds between request dispatch and request completion for the IOs done."} + blkio_recursive_io_serviced_total: _awsecs & _blkio_counter & {description: "Number of IOs completed to/from the disk."} + blkio_recursive_io_time_seconds_total: _awsecs & _blkio_counter & {description: "Disk time allocated per device in seconds."} + blkio_recursive_io_wait_time_seconds_total: _awsecs & _blkio_counter & {description: "Total amount of time in seconds the IOs spent waiting in the scheduler queues for service."} + blkio_recursive_sectors_total: _awsecs & _blkio_counter & {description: "Number of sectors transferred to/from disk."} + + cpu_online_cpus: _awsecs & _gauge & {description: "Number of CPU cores."} + cpu_usage_system_jiffies_total: _awsecs & _counter & {description: "Jiffies of CPU time used by the system."} + cpu_usage_usermode_jiffies_total: _awsecs & _counter & {description: "Jiffies of CPU time spent in user mode by the 
container."} + cpu_usage_kernelmode_jiffies_total: _awsecs & _counter & {description: "Jiffies of CPU time spent in kernel mode by the container."} + cpu_usage_total_jiffies_total: _awsecs & _counter & {description: "Jiffies of CPU time used by the container."} + cpu_throttling_periods_total: _awsecs & _counter & {description: "Number of periods."} + cpu_throttled_periods_total: _awsecs & _counter & {description: "Number of periods throttled."} + cpu_throttled_time_seconds_total: _awsecs & _counter & {description: "Throttling time in seconds."} + + cpu_usage_percpu_jiffies_total: _awsecs & { description: "Jiffies of CPU time used by the container, per CPU core." type: "counter" tags: _tags & { @@ -172,43 +176,43 @@ components: sources: aws_ecs_metrics: { } } - memory_used_bytes: _gauge & {description: "Memory used by the container, in bytes."} - memory_max_used_bytes: _gauge & {description: "Maximum measured memory usage of the container, in bytes."} - memory_limit_bytes: _gauge & {description: "Memory usage limit of the container, in bytes."} - memory_active_anonymous_bytes: _gauge & {description: "Amount of memory that has been identified as active by the kernel. Anonymous memory is memory that is not linked to disk pages."} - memory_active_file_bytes: _gauge & {description: "Amount of active file cache memory. Cache memory = active_file + inactive_file + tmpfs."} - memory_cache_bytes: _gauge & {description: "The amount of memory used by the processes of this cgroup that can be associated with a block on a block device. 
Also accounts for memory used by tmpfs."} - memory_dirty_bytes: _gauge & {description: "The amount of memory waiting to get written to disk."} - memory_inactive_anonymous_bytes: _gauge & {description: "Amount of memory that has been identified as inactive by the kernel."} - memory_inactive_file_bytes: _gauge & {description: "Amount of inactive file cache memory."} - memory_mapped_file_bytes: _gauge & {description: "Indicates the amount of memory mapped by the processes in the cgroup. It doesn’t give you information about how much memory is used; it rather tells you how it is used."} - memory_page_faults_total: _counter & {description: "Number of times that a process of the cgroup triggered a page fault."} - memory_major_faults_total: _counter & {description: "Number of times that a process of the cgroup triggered a major page fault."} - memory_page_charged_total: _counter & {description: "Number of charging events to the memory cgroup. Charging events happen each time a page is accounted as either mapped anon page(RSS) or cache page to the cgroup."} - memory_page_uncharged_total: _counter & {description: "Number of uncharging events to the memory cgroup. 
Uncharging events happen each time a page is unaccounted from the cgroup."} - memory_rss_bytes: _gauge & {description: "The amount of memory that doesn’t correspond to anything on disk: stacks, heaps, and anonymous memory maps."} - memory_rss_hugepages_bytes: _gauge & {description: "Amount of memory due to anonymous transparent hugepages."} - memory_unevictable_bytes: _gauge & {description: "The amount of memory that cannot be reclaimed."} - memory_writeback_bytes: _gauge & {description: "The amount of memory from file/anon cache that are queued for syncing to the disk."} - memory_total_active_anonymous_bytes: _gauge & {description: "Total amount of memory that has been identified as active by the kernel."} - memory_total_active_file_bytes: _gauge & {description: "Total amount of active file cache memory."} - memory_total_cache_bytes: _gauge & {description: "Total amount of memory used by the processes of this cgroup that can be associated with a block on a block device."} - memory_total_dirty_bytes: _gauge & {description: "Total amount of memory waiting to get written to disk."} - memory_total_inactive_anonymous_bytes: _gauge & {description: "Total amount of memory that has been identified as inactive by the kernel."} - memory_total_inactive_file_bytes: _gauge & {description: "Total amount of inactive file cache memory."} - memory_total_mapped_file_bytes: _gauge & {description: "Total amount of memory mapped by the processes in the cgroup."} - memory_total_page_faults_total: _counter & {description: "Total number of page faults."} - memory_total_major_faults_total: _counter & {description: "Total number of major page faults."} - memory_total_page_charged_total: _counter & {description: "Total number of charging events."} - memory_total_page_uncharged_total: _counter & {description: "Total number of uncharging events."} - memory_total_rss_bytes: _gauge & {description: "Total amount of memory that doesn’t correspond to anything on disk: stacks, heaps, and anonymous 
memory maps."} - memory_total_rss_hugepages_bytes: _gauge & {description: "Total amount of memory due to anonymous transparent hugepages."} - memory_total_unevictable_bytes: _gauge & {description: "Total amount of memory that can not be reclaimed."} - memory_total_writeback_bytes: _gauge & {description: "Total amount of memory from file/anon cache that are queued for syncing to the disk."} - memory_hierarchical_memory_limit_bytes: _gauge & {description: "The memory limit in place by the hierarchy cgroup."} - memory_hierarchical_memsw_limit_bytes: _gauge & {description: "The memory + swap limit in place by the hierarchy cgroup."} - - _network_counter: { + memory_used_bytes: _awsecs & _gauge & {description: "Memory used by the container, in bytes."} + memory_max_used_bytes: _awsecs & _gauge & {description: "Maximum measured memory usage of the container, in bytes."} + memory_limit_bytes: _awsecs & _gauge & {description: "Memory usage limit of the container, in bytes."} + memory_active_anonymous_bytes: _awsecs & _gauge & {description: "Amount of memory that has been identified as active by the kernel. Anonymous memory is memory that is not linked to disk pages."} + memory_active_file_bytes: _awsecs & _gauge & {description: "Amount of active file cache memory. Cache memory = active_file + inactive_file + tmpfs."} + memory_cache_bytes: _awsecs & _gauge & {description: "The amount of memory used by the processes of this cgroup that can be associated with a block on a block device. 
Also accounts for memory used by tmpfs."} + memory_dirty_bytes: _awsecs & _gauge & {description: "The amount of memory waiting to get written to disk."} + memory_inactive_anonymous_bytes: _awsecs & _gauge & {description: "Amount of memory that has been identified as inactive by the kernel."} + memory_inactive_file_bytes: _awsecs & _gauge & {description: "Amount of inactive file cache memory."} + memory_mapped_file_bytes: _awsecs & _gauge & {description: "Indicates the amount of memory mapped by the processes in the cgroup. It doesn’t give you information about how much memory is used; it rather tells you how it is used."} + memory_page_faults_total: _awsecs & _counter & {description: "Number of times that a process of the cgroup triggered a page fault."} + memory_major_faults_total: _awsecs & _counter & {description: "Number of times that a process of the cgroup triggered a major page fault."} + memory_page_charged_total: _awsecs & _counter & {description: "Number of charging events to the memory cgroup. Charging events happen each time a page is accounted as either mapped anon page(RSS) or cache page to the cgroup."} + memory_page_uncharged_total: _awsecs & _counter & {description: "Number of uncharging events to the memory cgroup. 
Uncharging events happen each time a page is unaccounted from the cgroup."} + memory_rss_bytes: _awsecs & _gauge & {description: "The amount of memory that doesn’t correspond to anything on disk: stacks, heaps, and anonymous memory maps."} + memory_rss_hugepages_bytes: _awsecs & _gauge & {description: "Amount of memory due to anonymous transparent hugepages."} + memory_unevictable_bytes: _awsecs & _gauge & {description: "The amount of memory that cannot be reclaimed."} + memory_writeback_bytes: _awsecs & _gauge & {description: "The amount of memory from file/anon cache that are queued for syncing to the disk."} + memory_total_active_anonymous_bytes: _awsecs & _gauge & {description: "Total amount of memory that has been identified as active by the kernel."} + memory_total_active_file_bytes: _awsecs & _gauge & {description: "Total amount of active file cache memory."} + memory_total_cache_bytes: _awsecs & _gauge & {description: "Total amount of memory used by the processes of this cgroup that can be associated with a block on a block device."} + memory_total_dirty_bytes: _awsecs & _gauge & {description: "Total amount of memory waiting to get written to disk."} + memory_total_inactive_anonymous_bytes: _awsecs & _gauge & {description: "Total amount of memory that has been identified as inactive by the kernel."} + memory_total_inactive_file_bytes: _awsecs & _gauge & {description: "Total amount of inactive file cache memory."} + memory_total_mapped_file_bytes: _awsecs & _gauge & {description: "Total amount of memory mapped by the processes in the cgroup."} + memory_total_page_faults_total: _awsecs & _counter & {description: "Total number of page faults."} + memory_total_major_faults_total: _awsecs & _counter & {description: "Total number of major page faults."} + memory_total_page_charged_total: _awsecs & _counter & {description: "Total number of charging events."} + memory_total_page_uncharged_total: _awsecs & _counter & {description: "Total number of uncharging 
events."} + memory_total_rss_bytes: _awsecs & _gauge & {description: "Total amount of memory that doesn’t correspond to anything on disk: stacks, heaps, and anonymous memory maps."} + memory_total_rss_hugepages_bytes: _awsecs & _gauge & {description: "Total amount of memory due to anonymous transparent hugepages."} + memory_total_unevictable_bytes: _awsecs & _gauge & {description: "Total amount of memory that can not be reclaimed."} + memory_total_writeback_bytes: _awsecs & _gauge & {description: "Total amount of memory from file/anon cache that are queued for syncing to the disk."} + memory_hierarchical_memory_limit_bytes: _awsecs & _gauge & {description: "The memory limit in place by the hierarchy cgroup."} + memory_hierarchical_memsw_limit_bytes: _awsecs & _gauge & {description: "The memory + swap limit in place by the hierarchy cgroup."} + + _network_counter: _awsecs & { type: "counter" tags: _tags & { device: { @@ -219,13 +223,13 @@ components: sources: aws_ecs_metrics: { } } - network_receive_bytes_total: _network_counter & {description: "Bytes received by the container via the network interface."} - network_receive_packets_total: _network_counter & {description: "Number of packets received by the container via the network interface."} - network_receive_packets_drop_total: _network_counter & {description: "Number of inbound packets dropped by the container."} - network_receive_errs_total: _network_counter & {description: "Errors receiving packets."} - network_transmit_bytes_total: _network_counter & {description: "Bytes sent by the container via the network interface."} - network_transmit_packets_total: _network_counter & {description: "Number of packets sent by the container via the network interface."} - network_transmit_packets_drop_total: _network_counter & {description: "Number of outbound packets dropped by the container."} - network_transmit_errs_total: _network_counter & {description: "Errors sending packets."} + network_receive_bytes_total: _awsecs & 
_network_counter & {description: "Bytes received by the container via the network interface."} + network_receive_packets_total: _awsecs & _network_counter & {description: "Number of packets received by the container via the network interface."} + network_receive_packets_drop_total: _awsecs & _network_counter & {description: "Number of inbound packets dropped by the container."} + network_receive_errs_total: _awsecs & _network_counter & {description: "Errors receiving packets."} + network_transmit_bytes_total: _awsecs & _network_counter & {description: "Bytes sent by the container via the network interface."} + network_transmit_packets_total: _awsecs & _network_counter & {description: "Number of packets sent by the container via the network interface."} + network_transmit_packets_drop_total: _awsecs & _network_counter & {description: "Number of outbound packets dropped by the container."} + network_transmit_errs_total: _awsecs & _network_counter & {description: "Errors sending packets."} } } diff --git a/docs/reference/components/sources/aws_kinesis_firehose.cue b/docs/reference/components/sources/aws_kinesis_firehose.cue index 1e72ae5b3a9c2..891cab7bbd278 100644 --- a/docs/reference/components/sources/aws_kinesis_firehose.cue +++ b/docs/reference/components/sources/aws_kinesis_firehose.cue @@ -187,4 +187,9 @@ components: sources: aws_kinesis_firehose: { """ } } + + telemetry: metrics: { + request_read_errors_total: components.sources.internal_metrics.output.metrics.request_read_errors_total + requests_received_total: components.sources.internal_metrics.output.metrics.requests_received_total + } } diff --git a/docs/reference/components/sources/aws_s3.cue b/docs/reference/components/sources/aws_s3.cue index f869292a21a58..a5502fdd10808 100644 --- a/docs/reference/components/sources/aws_s3.cue +++ b/docs/reference/components/sources/aws_s3.cue @@ -239,4 +239,15 @@ components: sources: aws_s3: { """ } } + + telemetry: metrics: { + sqs_message_delete_failed_total: 
components.sources.internal_metrics.output.metrics.sqs_message_delete_failed_total + sqs_message_delete_succeeded_total: components.sources.internal_metrics.output.metrics.sqs_message_delete_succeeded_total + sqs_message_processing_failed_total: components.sources.internal_metrics.output.metrics.sqs_message_processing_failed_total + sqs_message_processing_succeeded_total: components.sources.internal_metrics.output.metrics.sqs_message_processing_succeeded_total + sqs_message_receive_failed_total: components.sources.internal_metrics.output.metrics.sqs_message_receive_failed_total + sqs_message_receive_succeeded_total: components.sources.internal_metrics.output.metrics.sqs_message_receive_succeeded_total + sqs_message_received_messages_total: components.sources.internal_metrics.output.metrics.sqs_message_received_messages_total + sqs_s3_event_record_ignored_total: components.sources.internal_metrics.output.metrics.sqs_s3_event_record_ignored_total + } } diff --git a/docs/reference/components/sources/docker_logs.cue b/docs/reference/components/sources/docker_logs.cue index f8fd9c258a5f0..260e146cac84c 100644 --- a/docs/reference/components/sources/docker_logs.cue +++ b/docs/reference/components/sources/docker_logs.cue @@ -265,4 +265,13 @@ components: sources: docker_logs: { """ } } + + telemetry: metrics: { + communication_errors_total: components.sources.internal_metrics.output.metrics.communication_errors_total + container_events_processed_total: components.sources.internal_metrics.output.metrics.container_events_processed_total + container_metadata_fetch_errors_total: components.sources.internal_metrics.output.metrics.container_metadata_fetch_errors_total + containers_unwatched_total: components.sources.internal_metrics.output.metrics.containers_unwatched_total + containers_watched_total: components.sources.internal_metrics.output.metrics.containers_watched_total + logging_driver_errors_total: 
components.sources.internal_metrics.output.metrics.logging_driver_errors_total + } } diff --git a/docs/reference/components/sources/file.cue b/docs/reference/components/sources/file.cue index 670c8e9ccbbf6..6678f41c36a7e 100644 --- a/docs/reference/components/sources/file.cue +++ b/docs/reference/components/sources/file.cue @@ -515,4 +515,17 @@ components: sources: file: { """ } } + + telemetry: metrics: { + checkpoint_write_errors_total: components.sources.internal_metrics.output.metrics.checkpoint_write_errors_total + checkpoints_total: components.sources.internal_metrics.output.metrics.checkpoints_total + checksum_errors: components.sources.internal_metrics.output.metrics.checksum_errors + file_delete_errors: components.sources.internal_metrics.output.metrics.file_delete_errors + file_watch_errors: components.sources.internal_metrics.output.metrics.file_watch_errors + files_added: components.sources.internal_metrics.output.metrics.files_added + files_deleted: components.sources.internal_metrics.output.metrics.files_deleted + files_resumed: components.sources.internal_metrics.output.metrics.files_resumed + files_unwatched: components.sources.internal_metrics.output.metrics.files_unwatched + fingerprint_read_errors: components.sources.internal_metrics.output.metrics.fingerprint_read_errors + } } diff --git a/docs/reference/components/sources/host_metrics.cue b/docs/reference/components/sources/host_metrics.cue index b2d6f78fb1b80..f4cd1a1306372 100644 --- a/docs/reference/components/sources/host_metrics.cue +++ b/docs/reference/components/sources/host_metrics.cue @@ -261,22 +261,23 @@ components: sources: host_metrics: { } output: metrics: { - _tags: { + _host_metrics_tags: { + collector: { + description: "Which collector this metric comes from." + required: true + } host: { description: "The hostname of the originating system." required: true examples: [_values.local_host] } - collector: { - description: "Which collector this metric comes from." 
- required: true - } } - cpu_seconds_total: { + // Host CPU + host_cpu_seconds_total: _host & { description: "The number of CPU seconds accumulated in different operating modes." type: "counter" - tags: _tags & { + tags: _host_metrics_tags & { collector: examples: ["cpu"] cpu: { description: "The index of the CPU core or socket." @@ -291,6 +292,57 @@ components: sources: host_metrics: { } } + // Host disk + host_disk_read_bytes_total: _host & _disk_counter & {description: "The accumulated number of bytes read in."} + host_disk_reads_completed_total: _host & _disk_counter & {description: "The accumulated number of read operations completed."} + host_disk_written_bytes_total: _host & _disk_counter & {description: "The accumulated number of bytes written out."} + host_disk_writes_completed_total: _host & _disk_counter & {description: "The accumulated number of write operations completed."} + + // Host filesystem + host_filesystem_free_bytes: _host & _filesystem_bytes & {description: "The number of bytes free on the named filesystem."} + host_filesystem_total_bytes: _host & _filesystem_bytes & {description: "The total number of bytes in the named filesystem."} + host_filesystem_used_bytes: _host & _filesystem_bytes & {description: "The number of bytes used on the named filesystem."} + + // Host load + host_load1: _host & _loadavg & {description: "System load averaged over the last 1 minute."} + host_load5: _host & _loadavg & {description: "System load averaged over the last 5 minutes."} + host_load15: _host & _loadavg & {description: "System load averaged over the last 15 minutes."} + + // Host memory + host_memory_active_bytes: _host & _memory_gauge & _memory_nowin & {description: "The number of bytes of active main memory."} + host_memory_available_bytes: _host & _memory_gauge & {description: "The number of bytes of main memory available."} + host_memory_buffers_bytes: _host & _memory_linux & {description: "The number of bytes of main memory used by buffers."} +
host_memory_cached_bytes: _host & _memory_linux & {description: "The number of bytes of main memory used by cached blocks."} + host_memory_free_bytes: _host & _memory_gauge & {description: "The number of bytes of main memory not used."} + host_memory_inactive_bytes: _host & _memory_macos & {description: "The number of bytes of main memory that is not active."} + host_memory_shared_bytes: _host & _memory_linux & {description: "The number of bytes of main memory shared between processes."} + host_memory_swap_free_bytes: _host & _memory_gauge & {description: "The number of free bytes of swap space."} + host_memory_swapped_in_bytes_total: _host & _memory_counter & _memory_nowin & { + description: "The number of bytes that have been swapped in to main memory." + } + host_memory_swapped_out_bytes_total: _host & _memory_counter & _memory_nowin & { + description: "The number of bytes that have been swapped out from main memory." + } + host_memory_swap_total_bytes: _host & _memory_gauge & {description: "The total number of bytes of swap space."} + host_memory_swap_used_bytes: _host & _memory_gauge & {description: "The number of used bytes of swap space."} + host_memory_total_bytes: _host & _memory_gauge & {description: "The total number of bytes of main memory."} + host_memory_used_bytes: _host & _memory_linux & {description: "The number of bytes of main memory used by programs or caches."} + host_memory_wired_bytes: _host & _memory_macos & {description: "The number of wired bytes of main memory."} + + // Host network + host_network_receive_bytes_total: _host & _network_gauge & {description: "The number of bytes received on this interface."} + host_network_receive_errs_total: _host & _network_gauge & {description: "The number of errors encountered during receives on this interface."} + host_network_receive_packets_total: _host & _network_gauge & {description: "The number of packets received on this interface."} + host_network_transmit_bytes_total: _host & _network_gauge & 
{description: "The number of bytes transmitted on this interface."} + host_network_transmit_errs_total: _host & _network_gauge & {description: "The number of errors encountered during transmits on this interface."} + host_network_transmit_packets_drop_total: _host & _network_nomac & {description: "The number of packets dropped during transmits on this interface."} + host_network_transmit_packets_total: _host & _network_nomac & {description: "The number of packets transmitted on this interface."} + + // Helpers + _host: { + default_namespace: "host" + } + _disk_device: { description: "The disk device name." required: true @@ -298,19 +350,14 @@ components: sources: host_metrics: { } _disk_counter: { type: "counter" - tags: _tags & { + tags: _host_metrics_tags & { collector: examples: ["disk"] device: _disk_device } } - disk_read_bytes_total: _disk_counter & {description: "The accumulated number of bytes read in."} - disk_reads_completed_total: _disk_counter & {description: "The accumulated number of read operations completed."} - disk_written_bytes_total: _disk_counter & {description: "The accumulated number of bytes written out."} - disk_writes_completed_total: _disk_counter & {description: "The accumulated number of write operations completed."} - _filesystem_bytes: { type: "gauge" - tags: _tags & { + tags: _host_metrics_tags & { collector: examples: ["filesystem"] device: _disk_device filesystem: { @@ -320,59 +367,31 @@ components: sources: host_metrics: { } } } - filesystem_free_bytes: _filesystem_bytes & {description: "The number of bytes free on the named filesystem."} - filesystem_total_bytes: _filesystem_bytes & {description: "The total number of bytes in the named filesystem."} - filesystem_used_bytes: _filesystem_bytes & {description: "The number of bytes used on the named filesystem."} - - _memory_gauge: { + _loadavg: { type: "gauge" - tags: _tags & { - collector: examples: ["memory"] + tags: _host_metrics_tags & { + collector: examples: ["loadavg"] } + 
relevant_when: "OS is not Windows" } _memory_counter: { type: "counter" - tags: _tags & { + tags: _host_metrics_tags & { collector: examples: ["memory"] } } - _memory_linux: _memory_gauge & {relevant_when: "OS is Linux"} - _memory_macos: _memory_gauge & {relevant_when: "OS is MacOS X"} - _memory_nowin: {relevant_when: "OS is not Windows"} - memory_free_bytes: _memory_gauge & {description: "The number of bytes of main memory not used."} - memory_available_bytes: _memory_gauge & {description: "The number of bytes of main memory available."} - memory_swap_free_bytes: _memory_gauge & {description: "The number of free bytes of swap space."} - memory_swap_total_bytes: _memory_gauge & {description: "The total number of bytes of swap space."} - memory_swap_used_bytes: _memory_gauge & {description: "The number of used bytes of swap space."} - memory_total_bytes: _memory_gauge & {description: "The total number of bytes of main memory."} - memory_active_bytes: _memory_gauge & _memory_nowin & {description: "The number of bytes of active main memory."} - memory_buffers_bytes: _memory_linux & {description: "The number of bytes of main memory used by buffers."} - memory_cached_bytes: _memory_linux & {description: "The number of bytes of main memory used by cached blocks."} - memory_shared_bytes: _memory_linux & {description: "The number of bytes of main memory shared between processes."} - memory_used_bytes: _memory_linux & {description: "The number of bytes of main memory used by programs or caches."} - memory_inactive_bytes: _memory_macos & {description: "The number of bytes of main memory that is not active."} - memory_swapped_in_bytes_total: _memory_counter & _memory_nowin & { - description: "The number of bytes that have been swapped in to main memory." - } - memory_swapped_out_bytes_total: _memory_counter & _memory_nowin & { - description: "The number of bytes that have been swapped out from main memory." 
- } - memory_wired_bytes: _memory_macos & {description: "The number of wired bytes of main memory."} - - _loadavg: { + _memory_gauge: { type: "gauge" - tags: _tags & { - collector: examples: ["loadavg"] + tags: _host_metrics_tags & { + collector: examples: ["memory"] } - relevant_when: "OS is not Windows" } - load1: _loadavg & {description: "System load averaged over the last 1 second."} - load5: _loadavg & {description: "System load averaged over the last 5 seconds."} - load15: _loadavg & {description: "System load averaged over the last 15 seconds."} - + _memory_linux: _memory_gauge & {relevant_when: "OS is Linux"} + _memory_macos: _memory_gauge & {relevant_when: "OS is MacOS X"} + _memory_nowin: {relevant_when: "OS is not Windows"} _network_gauge: { type: "gauge" - tags: _tags & { + tags: _host_metrics_tags & { collector: examples: ["network"] device: { description: "The network interface device name." @@ -381,13 +400,6 @@ components: sources: host_metrics: { } } } - _network_nomac: _network_gauge & {relevant_when: "OS is not MacOS"} - network_receive_bytes_total: _network_gauge & {description: "The number of bytes received on this interface."} - network_receive_errs_total: _network_gauge & {description: "The number of errors encountered during receives on this interface."} - network_receive_packets_total: _network_gauge & {description: "The number of packets received on this interface."} - network_transmit_bytes_total: _network_gauge & {description: "The number of bytes transmitted on this interface."} - network_transmit_errs_total: _network_gauge & {description: "The number of errors encountered during transmits on this interface."} - network_transmit_packets_drop_total: _network_nomac & {description: "The number of packets dropped during transmits on this interface."} - network_transmit_packets_total: _network_nomac & {description: "The number of packets transmitted on this interface."} + _network_nomac: _network_gauge & {relevant_when: "OS is not MacOS"} } } 
diff --git a/docs/reference/components/sources/http.cue b/docs/reference/components/sources/http.cue index 7367d7fdb9f7a..97f5773777040 100644 --- a/docs/reference/components/sources/http.cue +++ b/docs/reference/components/sources/http.cue @@ -206,4 +206,8 @@ components: sources: http: { }] }, ] + + telemetry: metrics: { + http_bad_requests_total: components.sources.internal_metrics.output.metrics.http_bad_requests_total + } } diff --git a/docs/reference/components/sources/internal_metrics.cue b/docs/reference/components/sources/internal_metrics.cue new file mode 100644 index 0000000000000..ac7367ff8cf0c --- /dev/null +++ b/docs/reference/components/sources/internal_metrics.cue @@ -0,0 +1,680 @@ +package metadata + +components: sources: internal_metrics: { + title: "Internal Metrics" + description: "The internal metrics source exposes metrics emitted by the running Vector instance (as opposed to components in its topology)." + + classes: { + commonly_used: true + delivery: "at_least_once" + deployment_roles: ["aggregator", "daemon", "sidecar"] + development: "beta" + egress_method: "batch" + } + + features: { + collect: { + checkpoint: enabled: false + from: { + name: "Vector instance" + thing: "a \(name)" + url: urls.vector_docs + versions: ">= 0.11.0" + } + } + multiline: enabled: false + } + + support: { + platforms: { + "aarch64-unknown-linux-gnu": true + "aarch64-unknown-linux-musl": true + "x86_64-apple-darwin": true + "x86_64-pc-windows-msv": true + "x86_64-unknown-linux-gnu": true + "x86_64-unknown-linux-musl": true + } + + notices: [] + requirements: [] + warnings: [] + } + + output: metrics: { + // Default internal metrics tags + _internal_metrics_tags: { + instance: { + description: "The Vector instance identified by host and port." + required: true + examples: [_values.instance] + } + job: { + description: "The name of the job producing Vector metrics." 
+ required: true + default: "vector" + } + } + + // Instance-level "process" metrics + api_started_total: { + description: "The number of times the Vector GraphQL API has been started." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + config_load_errors_total: { + description: "The total number of errors loading the Vector configuration." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + connection_errors_total: { + description: "The total number of connection errors for this Vector instance." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + quit_total: { + description: "The total number of times the Vector instance has quit." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + recover_errors_total: { + description: "The total number of errors caused by Vector failing to recover from a failed reload." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + reload_errors_total: { + description: "The total number of errors encountered when reloading Vector." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + reloaded_total: { + description: "The total number of times the Vector instance has been reloaded." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + started_total: { + description: "The total number of times the Vector instance has been started." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + stopped_total: { + description: "The total number of times the Vector instance has been stopped." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + + // Metrics emitted by one or more components + // Reusable metric definitions + auto_concurrency_averaged_rtt: { + description: "The average round-trip time (RTT) from the HTTP sink across the current window." 
+ type: "histogram" + default_namespace: "vector" + tags: _internal_metrics_tags + } + auto_concurrency_in_flight: { + description: "The number of outbound requests from the HTTP sink currently awaiting a response." + type: "histogram" + default_namespace: "vector" + tags: _internal_metrics_tags + } + auto_concurrency_limit: { + description: "The concurrency limit that the auto-concurrency feature has decided on for this current window." + type: "histogram" + default_namespace: "vector" + tags: _internal_metrics_tags + } + auto_concurrency_observed_rtt: { + description: "The observed round-trip time (RTT) for requests from this HTTP sink." + type: "histogram" + default_namespace: "vector" + tags: _internal_metrics_tags + } + checkpoint_write_errors_total: { + description: "The total number of errors writing checkpoints." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + checkpoints_total: { + description: "The total number of files checkpointed." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + checksum_errors: { + description: "The total number of errors identifying files via checksum." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags & { + file: _file + } + } + collect_completed_total: { + description: "The total number of MongoDB metrics collections completed." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + collect_duration_nanoseconds: { + description: "The duration spent collecting MongoDB metrics." + type: "histogram" + default_namespace: "vector" + tags: _internal_metrics_tags + } + communication_errors_total: { + description: "The total number of errors stemming from communication with the Docker daemon." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + connection_read_errors_total: { + description: "The total number of errors reading datagram." 
+ type: "counter" + default_namespace: "vector" + tags: _component_tags & { + mode: { + description: "The connection mode used by the component." + required: true + options: { + udp: "User Datagram Protocol" + } + } + } + } + consumer_offset_updates_failed_total: { + description: "The total number of failures to update a Kafka consumer offset." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + container_events_processed_total: { + description: "The total number of container events processed." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + container_metadata_fetch_errors_total: { + description: "The total number of errors encountered when fetching container metadata." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + containers_unwatched_total: { + description: "The total number of times Vector stopped watching for container logs." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + containers_watched_total: { + description: "The total number of times Vector started watching for container logs." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + docker_format_parse_failures_total: { + description: "The total number of failures to parse a message as a JSON object." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + event_annotation_failures_total: { + description: "The total number of failures to annotate Vector events with Kubernetes Pod metadata." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + events_discarded_total: { + description: "The total number of events discarded by this component." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + events_failed_total: { + description: "The total number of failures to read a Kafka message."
+ type: "counter" + default_namespace: "vector" + tags: _component_tags + } + events_processed_total: { + description: "The total number of events processed by this component." + type: "counter" + default_namespace: "vector" + tags: _component_tags & { + file: _file + } + } + file_delete_errors: { + description: "The total number of failures to delete a file." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags & { + file: _file + } + } + file_watch_errors: { + description: "The total number of errors encountered when watching files." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags & { + file: _file + } + } + files_added: { + description: "The total number of files Vector has found to watch." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags & { + file: _file + } + } + files_deleted: { + description: "The total number of files deleted." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags & { + file: _file + } + } + files_resumed: { + description: "The total number of times Vector has resumed watching a file." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags & { + file: _file + } + } + files_unwatched: { + description: "The total number of times Vector has stopped watching a file." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags & { + file: _file + } + } + fingerprint_read_errors: { + description: "The total number of times Vector failed to read a file for fingerprinting." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags & { + file: _file + } + } + http_bad_requests_total: { + description: "The total number of HTTP `400 Bad Request` errors encountered." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + http_error_response_total: { + description: "The total number of HTTP error responses for this component." 
+ type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + http_request_errors_total: { + description: "The total number of HTTP request errors for this component." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + http_requests_total: { + description: "The total number of HTTP requests issued by this component." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + invalid_record_total: { + description: "The total number of invalid records that have been discarded." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + invalid_record_bytes_total: { + description: "The total number of bytes from invalid records that have been discarded." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + logging_driver_errors_total: { + description: """ + The total number of logging driver errors encountered caused by not using either + the `jsonfile` or `journald` driver. + """ + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + memory_used: { + description: "The total memory currently being used by Vector (in bytes)." + type: "gauge" + default_namespace: "vector" + tags: _internal_metrics_tags + } + metadata_refresh_failed_total: { + description: "The total number of failed efforts to refresh AWS EC2 metadata." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + metadata_refresh_successful_total: { + description: "The total number of AWS EC2 metadata refreshes." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + missing_keys_total: { + description: "The total number of events dropped due to keys missing from the event." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + open_connections: { + description: "The number of current open connections to Vector." 
+ type: "gauge" + default_namespace: "vector" + tags: _internal_metrics_tags + } + parse_errors_total: { + description: "The total number of errors parsing Prometheus metrics." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + processed_bytes_total: { + description: "The total number of bytes processed by the component." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + processing_errors_total: { + description: "The total number of processing errors encountered by this component." + type: "counter" + default_namespace: "vector" + tags: _component_tags & { + error_type: _error_type + } + } + protobuf_decode_errors_total: { + description: "The total number of [Protocol Buffers](\(urls.protobuf)) errors thrown during communication between Vector instances." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + request_duration_nanoseconds: { + description: "The request duration for this component (in nanoseconds)." + type: "histogram" + default_namespace: "vector" + tags: _component_tags + } + request_error_total: { + description: "The total number of MongoDB request errors." + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + request_read_errors_total: { + description: "The total number of request read errors for this component." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + requests_completed_total: { + description: "The total number of requests completed by this component." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + requests_received_total: { + description: "The total number of requests received by this component." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + sqs_message_delete_failed_total: { + description: "The total number of failures to delete SQS messages." 
+ type: "counter" + default_namespace: "vector" + tags: _component_tags + } + sqs_message_delete_succeeded_total: { + description: "The total number of successful deletions of SQS messages." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + sqs_message_processing_failed_total: { + description: "The total number of failures to process SQS messages." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + sqs_message_processing_succeeded_total: { + description: "The total number of SQS messages successfully processed." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + + sqs_message_receive_failed_total: { + description: "The total number of failures to receive SQS messages." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + sqs_message_receive_succeeded_total: { + description: "The total number of times successfully receiving SQS messages." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + sqs_message_received_messages_total: { + description: "The total number of received SQS messages." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + sqs_s3_event_record_ignored_total: { + description: "The total number of times an S3 record in an SQS message was ignored (for an event that was not `ObjectCreated`)." + type: "counter" + default_namespace: "vector" + + tags: _component_tags & { + ignore_type: { + description: "The reason for ignoring the S3 record" + required: true + options: [ + "invalid_event_kind", + ] + } + } + } + stale_events_flushed_total: { + description: "The number of stale events that Vector has flushed." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + stdin_reads_failed_total: { + description: "The total number of errors reading from stdin." 
+ type: "counter" + default_namespace: "vector" + tags: _component_tags + } + tag_value_limit_exceeded_total: { + description: """ + The total number of events discarded because the tag has been rejected after + hitting the configured `value_limit`. + """ + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + timestamp_parse_errors_total: { + description: "The total number of errors encountered parsing [RFC3339](\(urls.rfc_3339)) timestamps." + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + uptime_seconds: { + description: "The total number of seconds the Vector instance has been up." + type: "gauge" + default_namespace: "vector" + tags: _component_tags + } + utf8_convert_errors_total: { + description: "The total number of errors converting bytes to a UTF-8 string in UDP mode." + type: "counter" + default_namespace: "vector" + tags: _component_tags & { + mode: { + description: "The connection mode used by the component." + required: true + options: { + udp: "User Datagram Protocol" + } + } + } + } + value_limit_reached_total: { + description: """ + The total number of times new values for a key have been rejected because the + value limit has been reached. + """ + type: "counter" + default_namespace: "vector" + tags: _component_tags + } + + // Windows metrics + windows_service_does_not_exist_total: { + description: """ + The total number of errors raised due to the Windows service not + existing. + """ + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + windows_service_install_total: { + description: """ + The total number of times the Windows service has been installed. + """ + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + windows_service_restart_total: { + description: """ + The total number of times the Windows service has been restarted. 
+ """ + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + windows_service_start_total: { + description: """ + The total number of times the Windows service has been started. + """ + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + windows_service_stop_total: { + description: """ + The total number of times the Windows service has been stopped. + """ + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + windows_service_uninstall_total: { + description: """ + The total number of times the Windows service has been uninstalled. + """ + type: "counter" + default_namespace: "vector" + tags: _internal_metrics_tags + } + + // Helpful tag groupings + _component_tags: _internal_metrics_tags & { + component_kind: _component_kind + component_name: _component_name + component_type: _component_type + } + + _internal_metrics_tags: { + instance: _instance + job: _job + } + + // All available tags + _collector: { + description: "Which collector this metric comes from." + required: true + } + _component_kind: { + description: "The component's kind (options are `source`, `sink`, or `transform`)." + required: true + options: ["sink", "source", "transform"] + } + _component_name: { + description: "The name of the component as specified in the Vector configuration." + required: true + examples: ["file_source", "splunk_sink"] + } + _component_type: { + description: "The type of component (source, transform, or sink)." + required: true + examples: ["file", "http", "honeycomb", "splunk_hec"] + } + _endpoint: { + description: "The absolute path of originating file." 
+ required: true + examples: ["http://localhost:8080/server-status?auto"] + } + _error_type: { + description: "The type of the error" + required: true + options: [ + "field_missing", + "invalid_metric", + "mapping_failed", + "match_failed", + "parse_failed", + "render_error", + "type_conversion_failed", + "type_field_does_not_exist", + "type_ip_address_parse_error", + "value_invalid", + ] + } + _file: { + description: "The file that produced the error" + required: false + } + _host: { + description: "The hostname of the originating system." + required: true + examples: [_values.local_host] + } + _instance: { + description: "The Vector instance identified by host and port." + required: true + examples: [_values.instance] + } + _job: { + description: "The name of the job producing Vector metrics." + required: true + default: "vector" + } + } +} diff --git a/docs/reference/components/sources/journald.cue b/docs/reference/components/sources/journald.cue index 1344b9de4b552..01f1da261f4e4 100644 --- a/docs/reference/components/sources/journald.cue +++ b/docs/reference/components/sources/journald.cue @@ -189,4 +189,9 @@ components: sources: journald: { """ } } + + telemetry: metrics: { + invalid_record_total: components.sources.internal_metrics.output.metrics.invalid_record_total + invalid_record_bytes_total: components.sources.internal_metrics.output.metrics.invalid_record_bytes_total + } } diff --git a/docs/reference/components/sources/kubernetes_logs.cue b/docs/reference/components/sources/kubernetes_logs.cue index 9fd9ffb100b6f..ca6e848ca2306 100644 --- a/docs/reference/components/sources/kubernetes_logs.cue +++ b/docs/reference/components/sources/kubernetes_logs.cue @@ -299,4 +299,9 @@ components: sources: kubernetes_logs: { """ } } + + telemetry: metrics: { + docker_format_parse_failures_total: components.sources.internal_metrics.output.metrics.docker_format_parse_failures_total + event_annotation_failures_total: 
components.sources.internal_metrics.output.metrics.event_annotation_failures_total + } } diff --git a/docs/reference/components/sources/logplex.cue b/docs/reference/components/sources/logplex.cue index 43178d79387ae..03dd32bc6cf72 100644 --- a/docs/reference/components/sources/logplex.cue +++ b/docs/reference/components/sources/logplex.cue @@ -97,4 +97,9 @@ components: sources: logplex: { timestamp: fields._current_timestamp } } + + telemetry: metrics: { + request_read_errors_total: components.sources.internal_metrics.output.metrics.request_read_errors_total + requests_received_total: components.sources.internal_metrics.output.metrics.requests_received_total + } } diff --git a/docs/reference/components/sources/mongodb_metrics.cue b/docs/reference/components/sources/mongodb_metrics.cue index 48250358e2ab5..7d8b514231574 100644 --- a/docs/reference/components/sources/mongodb_metrics.cue +++ b/docs/reference/components/sources/mongodb_metrics.cue @@ -80,31 +80,46 @@ components: sources: mongodb_metrics: { } } - output: metrics: { - _endpoint: { - description: "The absolute path of originating file." - required: true - examples: ["mongodb://localhost:27017"] - } - _host: { - description: "The hostname of the MongoDB server" - required: true - examples: [_values.local_host] + how_it_works: { + mod_status: { + title: "MongoDB `serverStatus` command" + body: """ + The [serverStatus][urls.mongodb_command_server_status] command + returns a document that provides an overview of the database’s + state. The output fields vary depending on the version of + MongoDB, underlying operating system platform, the storage + engine, and the kind of node, including `mongos`, `mongod` or + `replica set` member. + """ } - up: { - description: "If the MongoDB server is up or not." 
- type: "gauge" - tags: { - endpoint: _endpoint - host: _host + } + + telemetry: metrics: { + collect_duration_nanoseconds: components.sources.internal_metrics.output.metrics.collect_duration_nanoseconds + collect_completed_total: components.sources.internal_metrics.output.metrics.collect_completed_total + request_error_total: components.sources.internal_metrics.output.metrics.request_error_total + } + + output: metrics: { + // Default MongoDB tags + _mongodb_metrics_tags: { + endpoint: { + description: "The MongoDB endpoint that the metric originated from." + required: true + examples: ["mongodb://localhost:27017"] + } + host: { + description: "The hostname of the MongoDB server." + required: true + examples: [_values.local_host] } } + assets_total: { - description: "Number of assertions raised since the MongoDB process started." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "Number of assertions raised since the MongoDB process started." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "The assertion type" required: true @@ -112,12 +127,17 @@ components: sources: mongodb_metrics: { } } } + bson_parse_error_total: { + description: "The total number of BSON parsing errors." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags + } connections: { - description: "Number of connections in some state." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "Number of connections in some state." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { state: { description: "The connection state" required: true @@ -126,52 +146,41 @@ components: sources: mongodb_metrics: { } } extra_info_heap_usage_bytes: { - description: "The total size in bytes of heap space used by the database process."
- relevant_when: "Unix/Linux" - type: "gauge" - tags: { - endpoint: _endpoint - host: _host - } + description: "The total size in bytes of heap space used by the database process." + relevant_when: "Unix/Linux" + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } extra_info_page_faults: { - description: "The total number of page faults." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host - } + description: "The total number of page faults." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } instance_local_time: { - description: "The ISODate representing the current time, according to the server, in UTC." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host - } + description: "The ISODate representing the current time, according to the server, in UTC." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } instance_uptime_estimate_seconds_total: { - description: "The uptime in seconds as calculated from MongoDB’s internal course-grained time keeping system." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host - } + description: "The uptime in seconds as calculated from MongoDB’s internal coarse-grained time keeping system." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } instance_uptime_seconds_total: { - description: "The number of seconds that the current MongoDB process has been active." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host - } + description: "The number of seconds that the current MongoDB process has been active." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } memory: { - description: "Current memory unsage." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "Current memory usage."
+ type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Memory type" required: true @@ -179,20 +188,11 @@ components: sources: mongodb_metrics: { } } } - mongod_global_lock_total_time_seconds: { - description: "The time since the database last started and created the globalLock. This is roughly equivalent to total server uptime." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } - } mongod_global_lock_active_clients: { - description: "Number of connected clients and the read and write operations performed by these clients." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "Number of connected clients and the read and write operations performed by these clients." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Number type." required: true @@ -201,11 +201,10 @@ components: sources: mongodb_metrics: { } } mongod_global_lock_current_queue: { - description: "Number of operations queued because of a lock." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "Number of operations queued because of a lock." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Number type." required: true @@ -213,12 +212,17 @@ components: sources: mongodb_metrics: { } } } + mongod_global_lock_total_time_seconds: { + description: "The time since the database last started and created the globalLock. This is roughly equivalent to total server uptime." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags + } mongod_locks_time_acquiring_global_seconds_total: { - description: "Amount of time that any database has spent waiting for the global lock." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "Amount of time that any database has spent waiting for the global lock." 
+ type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Lock type." required: true @@ -231,20 +235,11 @@ components: sources: mongodb_metrics: { } } } - mongod_metrics_cursor_timed_out_total: { - description: "The total number of cursors that have timed out since the server process started." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } - } mongod_metrics_cursor_open: { - description: "Number of cursors." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "Number of cursors." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { state: { description: "Cursor state." required: true @@ -252,12 +247,17 @@ components: sources: mongodb_metrics: { } } } + mongod_metrics_cursor_timed_out_total: { + description: "The total number of cursors that have timed out since the server process started." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags + } mongod_metrics_document_total: { - description: "Document access and modification patterns." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "Document access and modification patterns." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { state: { description: "Document state." required: true @@ -266,35 +266,28 @@ components: sources: mongodb_metrics: { } } mongod_metrics_get_last_error_wtime_num: { - description: "The total number of getLastError operations with a specified write concern." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host - } + description: "The total number of getLastError operations with a specified write concern." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_get_last_error_wtime_seconds_total: { - description: "The total amount of time that the mongod has spent performing getLastError operations." 
- type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The total amount of time that the mongod has spent performing getLastError operations." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_get_last_error_wtimeouts_total: { - description: "The number of times that write concern operations have timed out as a result of the wtimeout threshold to getLastError." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The number of times that write concern operations have timed out as a result of the wtimeout threshold to getLastError." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_operation_total: { - description: "Update and query operations that MongoDB handles using special operation types." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "Update and query operations that MongoDB handles using special operation types." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Operation type." required: true @@ -303,11 +296,10 @@ components: sources: mongodb_metrics: { } } mongod_metrics_query_executor_total: { - description: "Data from query execution system." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "Data from query execution system." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { state: { description: "Query state." required: true @@ -316,67 +308,52 @@ components: sources: mongodb_metrics: { } } mongod_metrics_record_moves_total: { - description: "Moves reports the total number of times documents move within the on-disk representation of the MongoDB data set. Documents move as a result of operations that increase the size of the document beyond their allocated record size." 
- type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "Moves reports the total number of times documents move within the on-disk representation of the MongoDB data set. Documents move as a result of operations that increase the size of the document beyond their allocated record size." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_repl_apply_batches_num_total: { - description: "The total number of batches applied across all databases." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The total number of batches applied across all databases." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_repl_apply_batches_seconds_total: { - description: "The total amount of time the mongod has spent applying operations from the oplog." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The total amount of time the mongod has spent applying operations from the oplog." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_repl_apply_ops_total: { - description: "The total number of oplog operations applied." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The total number of oplog operations applied." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_repl_buffer_count: { - description: "The current number of operations in the oplog buffer." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The current number of operations in the oplog buffer." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_repl_buffer_max_size_bytes_total: { - description: "The maximum size of the buffer." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The maximum size of the buffer." 
+ type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_repl_buffer_size_bytes: { - description: "The current size of the contents of the oplog buffer." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The current size of the contents of the oplog buffer." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_repl_executor_queue: { - description: "Number of queued operations in the replication executor." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "Number of queued operations in the replication executor." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Queue type." required: true @@ -385,75 +362,58 @@ components: sources: mongodb_metrics: { } } mongod_metrics_repl_executor_unsignaled_events: { - description: "Number of unsignaled events in the replication executor." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host - } + description: "Number of unsignaled events in the replication executor." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_repl_network_bytes_total: { - description: "The total amount of data read from the replication sync source." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The total amount of data read from the replication sync source." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_repl_network_getmores_num_total: { - description: "The total number of getmore operations, which are operations that request an additional set of operations from the replication sync source." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The total number of getmore operations, which are operations that request an additional set of operations from the replication sync source." 
+ type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_repl_network_getmores_seconds_total: { - description: "The total amount of time required to collect data from getmore operations." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The total amount of time required to collect data from getmore operations." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_repl_network_ops_total: { - description: "The total number of operations read from the replication source." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The total number of operations read from the replication source." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_repl_network_readers_created_total: { - description: "The total number of oplog query processes created." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The total number of oplog query processes created." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_ttl_deleted_documents_total: { - description: "The total number of documents deleted from collections with a ttl index." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The total number of documents deleted from collections with a ttl index." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_metrics_ttl_passes_total: { - description: "The number of times the background process removes documents from collections with a ttl index." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "The number of times the background process removes documents from collections with a ttl index." 
+ type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_op_latencies_histogram: { - description: "Latency statistics." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "Latency statistics." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Latency type." required: true @@ -467,11 +427,10 @@ components: sources: mongodb_metrics: { } } mongod_op_latencies_latency: { - description: "A 64-bit integer giving the total combined latency in microseconds." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "A 64-bit integer giving the total combined latency in microseconds." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Latency type." required: true @@ -480,11 +439,10 @@ components: sources: mongodb_metrics: { } } mongod_op_latencies_ops_total: { - description: "A 64-bit integer giving the total number of operations performed on the collection since startup." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "A 64-bit integer giving the total number of operations performed on the collection since startup." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Latency type." required: true @@ -493,11 +451,10 @@ components: sources: mongodb_metrics: { } } mongod_storage_engine: { - description: "The name of the current storage engine." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "The name of the current storage engine." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { engine: { description: "Engine name." required: true @@ -506,12 +463,11 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_blockmanager_blocks_total: { - description: "Statistics on the block manager operations." - relevant_when: "Storage engine is `wiredTiger`." 
- type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "Statistics on the block manager operations." + relevant_when: "Storage engine is `wiredTiger`." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Operation type." required: true @@ -520,12 +476,11 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_blockmanager_bytes_total: { - description: "Statistics on the block manager operations." - relevant_when: "Storage engine is `wiredTiger`." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "Statistics on the block manager operations." + relevant_when: "Storage engine is `wiredTiger`." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Operation type." required: true @@ -534,12 +489,11 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_cache_bytes: { - description: "Statistics on the cache and page evictions from the cache." - relevant_when: "Storage engine is `wiredTiger`." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "Statistics on the cache and page evictions from the cache." + relevant_when: "Storage engine is `wiredTiger`." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Statistics type." required: true @@ -548,12 +502,11 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_cache_bytes_total: { - description: "Statistics on the cache and page evictions from the cache." - relevant_when: "Storage engine is `wiredTiger`." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "Statistics on the cache and page evictions from the cache." + relevant_when: "Storage engine is `wiredTiger`." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Statistics type." 
required: true @@ -562,12 +515,11 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_cache_evicted_total: { - description: "Statistics on the cache and page evictions from the cache." - relevant_when: "Storage engine is `wiredTiger`." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "Statistics on the cache and page evictions from the cache." + relevant_when: "Storage engine is `wiredTiger`." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Statistics type." required: true @@ -576,28 +528,23 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_cache_max_bytes: { - description: "Maximum cache size." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host - } + description: "Maximum cache size." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_wiredtiger_cache_overhead_percent: { - description: "Percentage overhead." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host - } + description: "Percentage overhead." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_wiredtiger_cache_pages: { - description: "Pages in the cache." - relevant_when: "Storage engine is `wiredTiger`." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "Pages in the cache." + relevant_when: "Storage engine is `wiredTiger`." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Pages type." required: true @@ -606,12 +553,11 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_cache_pages_total: { - description: "Pages in the cache." - relevant_when: "Storage engine is `wiredTiger`." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "Pages in the cache." + relevant_when: "Storage engine is `wiredTiger`." 
+ type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Pages type." required: true @@ -620,12 +566,11 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_concurrent_transactions_available_tickets: { - description: "Information on the number of concurrent of read and write transactions allowed into the WiredTiger storage engine" - relevant_when: "Storage engine is `wiredTiger`." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "Information on the number of concurrent read and write transactions allowed into the WiredTiger storage engine." + relevant_when: "Storage engine is `wiredTiger`." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Transactions type." required: true @@ -634,12 +579,11 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_concurrent_transactions_out_tickets: { - description: "Information on the number of concurrent of read and write transactions allowed into the WiredTiger storage engine" - relevant_when: "Storage engine is `wiredTiger`." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "Information on the number of concurrent read and write transactions allowed into the WiredTiger storage engine." + relevant_when: "Storage engine is `wiredTiger`." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Transactions type." required: true @@ -648,12 +592,11 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_concurrent_transactions_total_tickets: { - description: "Information on the number of concurrent of read and write transactions allowed into the WiredTiger storage engine" - relevant_when: "Storage engine is `wiredTiger`."
- type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "Information on the number of concurrent read and write transactions allowed into the WiredTiger storage engine." + relevant_when: "Storage engine is `wiredTiger`." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Transactions type." required: true @@ -662,12 +605,11 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_log_bytes_total: { - description: "Statistics on WiredTiger’s write ahead log (i.e. the journal)." - relevant_when: "Storage engine is `wiredTiger`." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "Statistics on WiredTiger’s write ahead log (i.e. the journal)." + relevant_when: "Storage engine is `wiredTiger`." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Bytes type." required: true @@ -676,12 +618,11 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_log_operations_total: { - description: "Statistics on WiredTiger’s write ahead log (i.e. the journal)." - relevant_when: "Storage engine is `wiredTiger`." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "Statistics on WiredTiger’s write ahead log (i.e. the journal)." + relevant_when: "Storage engine is `wiredTiger`." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Operations type." required: true @@ -690,12 +631,11 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_log_records_scanned_total: { - description: "Statistics on WiredTiger’s write ahead log (i.e. the journal)." - relevant_when: "Storage engine is `wiredTiger`." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "Statistics on WiredTiger’s write ahead log (i.e. the journal)." + relevant_when: "Storage engine is `wiredTiger`."
+ type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Scanned records type." required: true @@ -704,30 +644,25 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_log_records_total: { - description: "Statistics on WiredTiger’s write ahead log (i.e. the journal)." - relevant_when: "Storage engine is `wiredTiger`." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "Statistics on WiredTiger’s write ahead log (i.e. the journal)." + relevant_when: "Storage engine is `wiredTiger`." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_wiredtiger_session_open_sessions: { - description: "Open session count." - relevant_when: "Storage engine is `wiredTiger`." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } + description: "Open session count." + relevant_when: "Storage engine is `wiredTiger`." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_wiredtiger_transactions_checkpoint_seconds: { - description: "Statistics on transaction checkpoints and operations." - relevant_when: "Storage engine is `wiredTiger`." - type: "gauge" - tags: { - endpoint: _endpoint - host: _host + description: "Statistics on transaction checkpoints and operations." + relevant_when: "Storage engine is `wiredTiger`." + type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Checkpoint type." required: true @@ -736,22 +671,25 @@ components: sources: mongodb_metrics: { } } mongod_wiredtiger_transactions_checkpoint_seconds_total: { - description: "Statistics on transaction checkpoints and operations." - relevant_when: "Storage engine is `wiredTiger`." - type: "counter" + description: "Statistics on transaction checkpoints and operations." + relevant_when: "Storage engine is `wiredTiger`." 
+ type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_wiredtiger_transactions_running_checkpoints: { - description: "Statistics on transaction checkpoints and operations." - relevant_when: "Storage engine is `wiredTiger`." - type: "counter" + description: "Statistics on transaction checkpoints and operations." + relevant_when: "Storage engine is `wiredTiger`." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } mongod_wiredtiger_transactions_total: { - description: "Statistics on transaction checkpoints and operations." - relevant_when: "Storage engine is `wiredTiger`." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "Statistics on transaction checkpoints and operations." + relevant_when: "Storage engine is `wiredTiger`." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Transactions type." required: true @@ -760,11 +698,10 @@ components: sources: mongodb_metrics: { } } network_bytes_total: { - description: "The number of bytes that reflects the amount of network traffic." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "The number of bytes that reflects the amount of network traffic." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { state: { description: "Bytes state." required: true @@ -773,19 +710,16 @@ components: sources: mongodb_metrics: { } } network_metrics_num_requests_total: { - description: "The total number of distinct requests that the server has received." - type: "counter" - tags: { - endpoint: _endpoint - host: _host - } - } - op_counters_repl_total: { - description: "Database replication operations by type since the mongod instance last started." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + description: "The total number of distinct requests that the server has received." 
+ type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags + } + mongodb_op_counters_repl_total: { + description: "Database replication operations by type since the mongod instance last started." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Counter type." required: true @@ -793,12 +727,11 @@ components: sources: mongodb_metrics: { } } } - op_counters_total: { - description: "Database operations by type since the mongod instance last started." - type: "counter" - tags: { - endpoint: _endpoint - host: _host + mongodb_op_counters_total: { + description: "Database operations by type since the mongod instance last started." + type: "counter" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags & { type: { description: "Counter type." required: true @@ -806,19 +739,11 @@ components: sources: mongodb_metrics: { } } } - } - - how_it_works: { - mod_status: { - title: "MongoDB `serverStatus` command" - body: """ - The [serverStatus][urls.mongodb_command_server_status] command - returns a document that provides an overview of the database’s - state. The output fields vary depending on the version of - MongoDB, underlying operating system platform, the storage - engine, and the kind of node, including `mongos`, `mongod` or - `replica set` member. - """ + up: { + description: "If the MongoDB server is up or not." 
+ type: "gauge" + default_namespace: "mongodb" + tags: _mongodb_metrics_tags } } } diff --git a/docs/reference/components/sources/socket.cue b/docs/reference/components/sources/socket.cue index 54b6b9629c76b..2e7d220488ce3 100644 --- a/docs/reference/components/sources/socket.cue +++ b/docs/reference/components/sources/socket.cue @@ -147,5 +147,10 @@ components: sources: socket: { message: _line host: _values.local_host } - }] + }, + ] + + telemetry: metrics: { + connection_errors_total: components.sources.internal_metrics.output.metrics.connection_errors_total + } } diff --git a/docs/reference/components/sources/splunk_hec.cue b/docs/reference/components/sources/splunk_hec.cue index 1e92294a52836..c4d60938e42a3 100644 --- a/docs/reference/components/sources/splunk_hec.cue +++ b/docs/reference/components/sources/splunk_hec.cue @@ -92,4 +92,9 @@ components: sources: splunk_hec: { timestamp: fields._current_timestamp } } + + telemetry: metrics: { + http_request_errors_total: components.sources.internal_metrics.output.metrics.http_request_errors_total + requests_received_total: components.sources.internal_metrics.output.metrics.requests_received_total + } } diff --git a/docs/reference/components/sources/statsd.cue b/docs/reference/components/sources/statsd.cue index 54746f750db11..8ae463bc6aaab 100644 --- a/docs/reference/components/sources/statsd.cue +++ b/docs/reference/components/sources/statsd.cue @@ -120,4 +120,10 @@ components: sources: statsd: { """ } } + + telemetry: metrics: { + connection_errors_total: components.sources.internal_metrics.output.metrics.connection_errors_total + invalid_record_total: components.sources.internal_metrics.output.metrics.invalid_record_total + invalid_record_bytes_total: components.sources.internal_metrics.output.metrics.invalid_record_bytes_total + } } diff --git a/docs/reference/components/sources/stdin.cue b/docs/reference/components/sources/stdin.cue index 22fa8c3041cd9..a9568b2beefff 100644 --- 
a/docs/reference/components/sources/stdin.cue +++ b/docs/reference/components/sources/stdin.cue @@ -100,4 +100,8 @@ components: sources: stdin: { """ } } + + telemetry: metrics: { + stdin_reads_failed_total: components.sources.internal_metrics.output.metrics.stdin_reads_failed_total + } } diff --git a/docs/reference/components/sources/syslog.cue b/docs/reference/components/sources/syslog.cue index 6fba35e8eed00..e313900d79bab 100644 --- a/docs/reference/components/sources/syslog.cue +++ b/docs/reference/components/sources/syslog.cue @@ -182,4 +182,9 @@ components: sources: syslog: { """ } } + + telemetry: metrics: { + connection_read_errors_total: components.sources.internal_metrics.output.metrics.connection_read_errors_total + utf8_convert_errors_total: components.sources.internal_metrics.output.metrics.utf8_convert_errors_total + } } diff --git a/docs/reference/components/sources/vector.cue b/docs/reference/components/sources/vector.cue index b64c8c92633ab..3ff70bdcf4932 100644 --- a/docs/reference/components/sources/vector.cue +++ b/docs/reference/components/sources/vector.cue @@ -110,4 +110,8 @@ components: sources: vector: { } } + + telemetry: metrics: { + protobuf_decode_errors_total: components.sources.internal_metrics.output.metrics.protobuf_decode_errors_total + } } diff --git a/docs/reference/components/splunk.cue b/docs/reference/components/splunk.cue new file mode 100644 index 0000000000000..83c5bb6bc0f15 --- /dev/null +++ b/docs/reference/components/splunk.cue @@ -0,0 +1,27 @@ +package metadata + +components: _splunk: { + telemetry: metrics: { + encode_errors_total: { + description: """ + The total number of errors encoding [Splunk HEC](\(urls.splunk_hec_protocol)) events + to JSON for this `splunk_hec` sink. + """ + type: "counter" + default_namespace: "vector" + tags: telemetry.metrics._component_tags + } + source_missing_keys_total: { + description: "The total number of errors rendering the template for this source." 
+ type: "counter" + default_namespace: "vector" + tags: telemetry.metrics._component_tags + } + sourcetype_missing_keys_total: { + description: "The total number of errors rendering the template for this sourcetype." + type: "counter" + default_namespace: "vector" + tags: telemetry.metrics._component_tags + } + } +} diff --git a/docs/reference/components/transforms/ansi_stripper.cue b/docs/reference/components/transforms/ansi_stripper.cue index 99617617760b3..690f2250d17f7 100644 --- a/docs/reference/components/transforms/ansi_stripper.cue +++ b/docs/reference/components/transforms/ansi_stripper.cue @@ -45,4 +45,8 @@ components: transforms: ansi_stripper: { logs: true metrics: null } + + telemetry: metrics: { + processing_errors_total: components.sources.internal_metrics.output.metrics.processing_errors_total + } } diff --git a/docs/reference/components/transforms/aws_cloudwatch_logs_subscription_parser.cue b/docs/reference/components/transforms/aws_cloudwatch_logs_subscription_parser.cue index 3923e2fa5fc1f..6489d0baaab68 100644 --- a/docs/reference/components/transforms/aws_cloudwatch_logs_subscription_parser.cue +++ b/docs/reference/components/transforms/aws_cloudwatch_logs_subscription_parser.cue @@ -142,4 +142,8 @@ components: transforms: aws_cloudwatch_logs_subscription_parser: { body: "Note that the events themselves are not parsed. If they are structured data, you will typically want to pass them through a [parsing transform](\(urls.vector_parsing_transforms))." 
} } + + telemetry: metrics: { + processing_errors_total: components.sources.internal_metrics.output.metrics.processing_errors_total + } } diff --git a/docs/reference/components/transforms/aws_ec2_metadata.cue b/docs/reference/components/transforms/aws_ec2_metadata.cue index d4ef44f7b1b75..7b4f9e83480c9 100644 --- a/docs/reference/components/transforms/aws_ec2_metadata.cue +++ b/docs/reference/components/transforms/aws_ec2_metadata.cue @@ -170,4 +170,9 @@ components: transforms: aws_ec2_metadata: { } } } + + telemetry: metrics: { + metadata_refresh_failed_total: components.sources.internal_metrics.output.metrics.metadata_refresh_failed_total + metadata_refresh_successful_total: components.sources.internal_metrics.output.metrics.metadata_refresh_successful_total + } } diff --git a/docs/reference/components/transforms/dedupe.cue b/docs/reference/components/transforms/dedupe.cue index 3612228bab056..3b53bf7938ccc 100644 --- a/docs/reference/components/transforms/dedupe.cue +++ b/docs/reference/components/transforms/dedupe.cue @@ -146,4 +146,8 @@ components: transforms: dedupe: { """ } } + + telemetry: metrics: { + events_discarded_total: components.sources.internal_metrics.output.metrics.events_discarded_total + } } diff --git a/docs/reference/components/transforms/grok_parser.cue b/docs/reference/components/transforms/grok_parser.cue index b7070265f1521..2f99ea2e096fd 100644 --- a/docs/reference/components/transforms/grok_parser.cue +++ b/docs/reference/components/transforms/grok_parser.cue @@ -95,4 +95,8 @@ components: transforms: grok_parser: { """ } } + + telemetry: metrics: { + processing_errors_total: components.sources.internal_metrics.output.metrics.processing_errors_total + } } diff --git a/docs/reference/components/transforms/logfmt_parser.cue b/docs/reference/components/transforms/logfmt_parser.cue index 28d978f6b299c..06e5eb0abdb0b 100644 --- a/docs/reference/components/transforms/logfmt_parser.cue +++ 
b/docs/reference/components/transforms/logfmt_parser.cue @@ -178,4 +178,8 @@ components: transforms: logfmt_parser: { """ } } + + telemetry: metrics: { + processing_errors_total: components.sources.internal_metrics.output.metrics.processing_errors_total + } } diff --git a/docs/reference/components/transforms/lua.cue b/docs/reference/components/transforms/lua.cue index f73491ad01b7e..07ad1fca20e46 100644 --- a/docs/reference/components/transforms/lua.cue +++ b/docs/reference/components/transforms/lua.cue @@ -470,4 +470,9 @@ components: transforms: lua: { """ } } + + telemetry: metrics: { + memory_used: components.sources.internal_metrics.output.metrics.memory_used + processing_errors_total: components.sources.internal_metrics.output.metrics.processing_errors_total + } } diff --git a/docs/reference/components/transforms/metric_to_log.cue b/docs/reference/components/transforms/metric_to_log.cue index 54051a696075d..d494446ed82d6 100644 --- a/docs/reference/components/transforms/metric_to_log.cue +++ b/docs/reference/components/transforms/metric_to_log.cue @@ -93,4 +93,8 @@ components: transforms: metric_to_log: { ] how_it_works: {} + + telemetry: metrics: { + processing_errors_total: components.sources.internal_metrics.output.metrics.processing_errors_total + } } diff --git a/docs/reference/components/transforms/reduce.cue b/docs/reference/components/transforms/reduce.cue index fe9971cc211f9..5bae46c028409 100644 --- a/docs/reference/components/transforms/reduce.cue +++ b/docs/reference/components/transforms/reduce.cue @@ -144,4 +144,8 @@ components: transforms: reduce: { } }, ] + + telemetry: metrics: { + stale_events_flushed_total: components.sources.internal_metrics.output.metrics.stale_events_flushed_total + } } diff --git a/docs/reference/components/transforms/regex_parser.cue b/docs/reference/components/transforms/regex_parser.cue index 5c4cb7fcc256b..a44ee53f137ba 100644 --- a/docs/reference/components/transforms/regex_parser.cue +++ 
b/docs/reference/components/transforms/regex_parser.cue @@ -178,4 +178,8 @@ components: transforms: regex_parser: { """ } } + + telemetry: metrics: { + processing_errors_total: components.sources.internal_metrics.output.metrics.processing_errors_total + } } diff --git a/docs/reference/components/transforms/remap.cue b/docs/reference/components/transforms/remap.cue index 5e3c3cc9f3279..91197d70045b3 100644 --- a/docs/reference/components/transforms/remap.cue +++ b/docs/reference/components/transforms/remap.cue @@ -130,4 +130,8 @@ components: transforms: remap: { """# } } + + telemetry: metrics: { + processing_errors_total: components.sources.internal_metrics.output.metrics.processing_errors_total + } } diff --git a/docs/reference/components/transforms/sampler.cue b/docs/reference/components/transforms/sampler.cue index 3b86d481c0192..0614a2aeef2ba 100644 --- a/docs/reference/components/transforms/sampler.cue +++ b/docs/reference/components/transforms/sampler.cue @@ -64,4 +64,8 @@ components: transforms: sampler: { logs: true metrics: null } + + telemetry: metrics: { + events_discarded_total: components.sources.internal_metrics.output.metrics.events_discarded_total + } } diff --git a/docs/reference/components/transforms/split.cue b/docs/reference/components/transforms/split.cue index 4de8c9156fee8..366a5003393a7 100644 --- a/docs/reference/components/transforms/split.cue +++ b/docs/reference/components/transforms/split.cue @@ -95,4 +95,8 @@ components: transforms: split: { } }, ] + + telemetry: metrics: { + processing_errors_total: components.sources.internal_metrics.output.metrics.processing_errors_total + } } diff --git a/docs/reference/components/transforms/swimlanes.cue b/docs/reference/components/transforms/swimlanes.cue index 55c8878f48283..3079c9c22c895 100644 --- a/docs/reference/components/transforms/swimlanes.cue +++ b/docs/reference/components/transforms/swimlanes.cue @@ -70,4 +70,8 @@ components: transforms: swimlanes: { } }, ] + + telemetry: metrics: { + 
events_discarded_total: components.sources.internal_metrics.output.metrics.events_discarded_total + } } diff --git a/docs/reference/components/transforms/tag_cardinality_limit.cue b/docs/reference/components/transforms/tag_cardinality_limit.cue index 943785d1af791..766f525b57beb 100644 --- a/docs/reference/components/transforms/tag_cardinality_limit.cue +++ b/docs/reference/components/transforms/tag_cardinality_limit.cue @@ -218,4 +218,9 @@ components: transforms: tag_cardinality_limit: { """ } } + + telemetry: metrics: { + tag_value_limit_exceeded_total: components.sources.internal_metrics.output.metrics.tag_value_limit_exceeded_total + value_limit_reached_total: components.sources.internal_metrics.output.metrics.value_limit_reached_total + } } diff --git a/docs/reference/components/transforms/tokenizer.cue b/docs/reference/components/transforms/tokenizer.cue index 9f0481a8d494b..3ba7aac2ecb81 100644 --- a/docs/reference/components/transforms/tokenizer.cue +++ b/docs/reference/components/transforms/tokenizer.cue @@ -114,4 +114,8 @@ components: transforms: tokenizer: { """# } } + + telemetry: metrics: { + processing_errors_total: components.sources.internal_metrics.output.metrics.processing_errors_total + } } diff --git a/docs/reference/metrics.cue b/docs/reference/metrics.cue deleted file mode 100644 index d015180291973..0000000000000 --- a/docs/reference/metrics.cue +++ /dev/null @@ -1,74 +0,0 @@ -package metadata - -// All available metrics -_vector_events_processed_total: { - type: "counter" - description: "The total number of events processed by this component." - tags: _component_tags -} -_vector_processed_bytes_total: { - description: "The total number of bytes processed by the component." - type: "counter" - tags: _component_tags -} -_vector_processing_errors_total: { - description: "The total number of processing errors encountered by the component." 
- type: "counter" - tags: _component_tags & { - error_type: _error_type - } -} - -// Convenient groupings of tags -_component_tags: { - component_kind: _component_kind - component_name: _component_name - component_type: _component_type - instance: _instance - job: _job -} - -// All available tags -_component_kind: { - description: "The component's kind (options are `source`, `sink`, or `transform`)." - required: true - options: { - sink: "Sink component." - source: "Source component." - transform: "Transform component." - } -} -_component_name: { - description: "The name of the component as specified in the Vector configuration." - required: true - examples: ["file_source", "splunk_sink"] -} -_component_type: { - description: "The type of component (source, transform, or sink)." - required: true - examples: ["file", "http", "honeycomb", "splunk_hec"] -} -_error_type: { - description: "The type of the error" - required: true - options: [ - "field_missing", - "invalid_metric", - "mapping_failed", - "match_failed", - "parse_failed", - "render_error", - "type_conversion_failed", - "value_invalid", - ] -} -_instance: { - description: "The Vector instance identified by host and port." - required: true - examples: [_values.instance] -} -_job: { - description: "The name of the job producing Vector metrics." 
- required: true - default: "vector" -} diff --git a/docs/reference/urls.cue b/docs/reference/urls.cue index b425a89249ef7..76b616dcbfa63 100644 --- a/docs/reference/urls.cue +++ b/docs/reference/urls.cue @@ -263,12 +263,14 @@ urls: { prometheus_metric_naming: "https://prometheus.io/docs/practices/naming/#metric-names" prometheus_remote_integrations: "https://prometheus.io/docs/operating/integrations/#remote-endpoints-and-storage" prometheus_remote_write: "https://prometheus.io/docs/prometheus/latest/configuration/configuration/#remote_write" + protobuf: "https://developers.google.com/protocol-buffers" pulsar: "https://pulsar.apache.org/" pulsar_protocol: "https://pulsar.apache.org/docs/en/develop-binary-protocol/" rdkafka: "https://github.com/edenhill/librdkafka" regex: "https://en.wikipedia.org/wiki/Regular_expression" regex_grouping_and_flags: "https://docs.rs/regex/1.3.9/regex/#grouping-and-flags" regex_tester: "https://rustexp.lpil.uk/" + rfc_3339: "https://tools.ietf.org/html/rfc3339" rfc_4180: "https://tools.ietf.org/html/rfc4180" rlua: "https://github.com/kyren/rlua" rpm: "https://rpm.org/"