Files

155 lines
6.7 KiB
Makefile
Raw Permalink Normal View History

# Time Series Benchmark Suite (TSBS) for VictoriaMetrics. This command runs a
# complete benchmark cycle:
#
# 1. Builds TSBS tools
# 2. Generates sample time series data
# 3. Loads data into VictoriaMetrics
# 4. Generates benchmark queries
# 5. Runs benchmark queries against VictoriaMetrics
#
# The default parameters below are chosen based on the desired scale and time
# range. With these parameters, the benchmark will generate 1 billion samples:
#
# - There are 100K instances. Each instance emits 10 unique metrics. Therefore,
# and 100K instances emit 1M unique metrics.
# - Within the data file, each line contains 10 samples from one instance
# - Metrics are emitted every 10s interval and there are 3600*24 / 80 = ~1K
# 10s intervals within 24 hours
# - Total number of lines, therefore: 100K machines × ~1K intervals = ~100M
# - And total number of samples: 1M metrics × ~1K intervals = ~1B
#
# The command expects a VictoriaMetrics instance running at
# http://localhost:8428. Use TSBS_WRITE_URL and TSBS_READ_URL to override the
# address.
#
# Adjust TSBS_SCALE to increase/decrease both ingestion and query load.
# Adjust TSBS_WORKERS to control concurrency. It should ideally match the
# number of CPU cores on your VM instance for optimal performance
#
# For accurate benchmark results, run this command on a separate machine from
# VictoriaMetrics since gunzipping and query processing are CPU-intensive
# operations that can impact results when run on the same machine
#
# See https://github.com/timescale/tsbs/blob/master/docs/victoriametrics.md
# for details
tsbs: tsbs-build tsbs-generate-data tsbs-load-data tsbs-generate-queries-all tsbs-run-queries-all
TSBS_SCALE ?= 100000
TSBS_END ?= $(shell date -u +%Y-%m-%dT00:00:00Z)
TSBS_START ?= $(shell \
NOW=$$(date -u +%s); \
START=$$((NOW - 86400)); \
date -u -d "@$$START" +%Y-%m-%dT00:00:00Z 2>/dev/null || \
date -u -r $$START +%Y-%m-%dT00:00:00Z 2>/dev/null \
)
TSBS_STEP ?= 80s
TSBS_QUERIES ?= 1000
TSBS_WORKERS ?= 4
TSBS_QUERY_TYPE := cpu-max-all-8
TSBS_DATA_FILE := /tmp/tsbs-data-$(TSBS_SCALE)-$(TSBS_START)-$(TSBS_END)-$(TSBS_STEP).gz
TSBS_QUERY_FILE := /tmp/tsbs-queries-$(TSBS_QUERY_TYPE)-$(TSBS_SCALE)-$(TSBS_START)-$(TSBS_END)-$(TSBS_QUERIES).gz
benchmark: add gnuplot to show write speed (#9490) ### Describe Your Changes Implemented the script that generates graphs using `gnuplot`. Those graphs show the write speed to the db. How to use it: 1. From the root run `make tsbs`; 2. The file will be generated automatically `/tmp/tsbs-load-100000-2025-07-22T00:00:00Z-2025-07-23T00:00:00Z-80s.csv` 4. From the root run `make tsbs-plot-load` and observe the result 5. If you have two files with the `tsbs_load_victoriametrics` output, just define the second in the `TSBS_LOAD_RESULT_CSV_FILE_COMPARE=/tmp/tsbs-load-10 0000-2025-07-22T01:00:00Z-2025-07-23T01:00:00Z-80s.csv ` To plot the measurements from some other benchmark, run `make tsbs-plot-load TSBS_LOAD_RESULT_CSV_FILE=/path/to/file.csv` To plot the measurements from two benchmarks, run `make tsbs-plot-load TSBS_LOAD_RESULT_CSV_FILE=/path/to/file1.csv TSBS_LOAD_RESULT_CSV_FILE_COMPARE=/path/to/file2.csv` This command should generate a graph like described in the picture <img width="638" height="578" alt="Screenshot 2025-07-25 at 15 35 42" src="https://github.com/user-attachments/assets/900b05ab-0b98-4f7f-8f2c-18d28ad2eab6" /> ### Checklist The following checks are **mandatory**: - [x] My change adheres to [VictoriaMetrics contributing guidelines](https://docs.victoriametrics.com/victoriametrics/contributing/#pull-request-checklist). - [x] My change adheres to [VictoriaMetrics development goals](https://docs.victoriametrics.com/victoriametrics/goals/). --------- Signed-off-by: Artem Fetishev <rtm@victoriametrics.com> Co-authored-by: Artem Fetishev <rtm@victoriametrics.com> Co-authored-by: Artem Fetishev <149964189+rtm0@users.noreply.github.com>
2025-09-02 14:37:18 +02:00
TSBS_LOAD_RESULT_CSV_FILE := /tmp/tsbs-load-$(TSBS_SCALE)-$(TSBS_START)-$(TSBS_END)-$(TSBS_STEP).csv
TSBS_LOAD_RESULT_CSV_FILE_COMPARE ?=
TSBS_PLOT_SCRIPT := $(shell pwd)/benchmarks/plot-load.sh
# For cluster setup use http://vminsert:8480/insert/0/influx/write
TSBS_WRITE_URLS ?= http://localhost:8428/write
# For cluster setup use http://vmselect:8481/select/0/prometheus
TSBS_READ_URLS ?= http://localhost:8428
TSBS_METRICS_URL ?= http://localhost:8428/metrics
# Build TSBS tools
tsbs-build:
test -d /tmp/tsbs/cmd/tsbs_run_queries_victoriametrics || (git clone https://github.com/timescale/tsbs.git /tmp/tsbs && \
cd /tmp/tsbs/cmd/tsbs_generate_data && GOBIN=/tmp/tsbs/bin go install && \
cd /tmp/tsbs/cmd/tsbs_generate_queries && GOBIN=/tmp/tsbs/bin go install && \
cd /tmp/tsbs/cmd/tsbs_load_victoriametrics && GOBIN=/tmp/tsbs/bin go install && \
cd /tmp/tsbs/cmd/tsbs_run_queries_victoriametrics && GOBIN=/tmp/tsbs/bin go install)
# Generate sample time series data
tsbs-generate-data:
test -f $(TSBS_DATA_FILE) || /tmp/tsbs/bin/tsbs_generate_data \
--format=victoriametrics \
--use-case=cpu-only \
--seed=8428 \
--scale=$(TSBS_SCALE) \
--timestamp-start=$(TSBS_START) \
--timestamp-end=$(TSBS_END) \
--log-interval=$(TSBS_STEP) \
| gzip > $(TSBS_DATA_FILE)
# Load data into VictoriaMetrics
tsbs-load-data:
benchmark: add gnuplot to show write speed (#9490) ### Describe Your Changes Implemented the script that generates graphs using `gnuplot`. Those graphs show the write speed to the db. How to use it: 1. From the root run `make tsbs`; 2. The file will be generated automatically `/tmp/tsbs-load-100000-2025-07-22T00:00:00Z-2025-07-23T00:00:00Z-80s.csv` 4. From the root run `make tsbs-plot-load` and observe the result 5. If you have two files with the `tsbs_load_victoriametrics` output, just define the second in the `TSBS_LOAD_RESULT_CSV_FILE_COMPARE=/tmp/tsbs-load-10 0000-2025-07-22T01:00:00Z-2025-07-23T01:00:00Z-80s.csv ` To plot the measurements from some other benchmark, run `make tsbs-plot-load TSBS_LOAD_RESULT_CSV_FILE=/path/to/file.csv` To plot the measurements from two benchmarks, run `make tsbs-plot-load TSBS_LOAD_RESULT_CSV_FILE=/path/to/file1.csv TSBS_LOAD_RESULT_CSV_FILE_COMPARE=/path/to/file2.csv` This command should generate a graph like described in the picture <img width="638" height="578" alt="Screenshot 2025-07-25 at 15 35 42" src="https://github.com/user-attachments/assets/900b05ab-0b98-4f7f-8f2c-18d28ad2eab6" /> ### Checklist The following checks are **mandatory**: - [x] My change adheres to [VictoriaMetrics contributing guidelines](https://docs.victoriametrics.com/victoriametrics/contributing/#pull-request-checklist). - [x] My change adheres to [VictoriaMetrics development goals](https://docs.victoriametrics.com/victoriametrics/goals/). --------- Signed-off-by: Artem Fetishev <rtm@victoriametrics.com> Co-authored-by: Artem Fetishev <rtm@victoriametrics.com> Co-authored-by: Artem Fetishev <149964189+rtm0@users.noreply.github.com>
2025-09-02 14:37:18 +02:00
cat $(TSBS_DATA_FILE) | gunzip | /tmp/tsbs/bin/tsbs_load_victoriametrics \
--workers=$(TSBS_WORKERS) \
--urls=$(TSBS_WRITE_URLS) \
2>/dev/tty | tee $(TSBS_LOAD_RESULT_CSV_FILE)
curl -s $(TSBS_METRICS_URL) | grep \
-e process_cpu_seconds_user_total \
-e process_cpu_seconds_system_total \
-e process_cpu_seconds_total \
-e process_resident_memory_peak_bytes \
-e process_resident_memory_bytes \
-e process_io_read_bytes_total \
-e process_io_written_bytes_total || true
# Generate benchmark queries of a given type
tsbs-generate-queries:
test -f $(TSBS_QUERY_FILE) || /tmp/tsbs/bin/tsbs_generate_queries \
--format=victoriametrics \
--use-case=cpu-only \
--seed=8428 \
--scale=$(TSBS_SCALE) \
--timestamp-start=$(TSBS_START) \
--timestamp-end=$(TSBS_END) \
--query-type=$(TSBS_QUERY_TYPE) \
--queries=1000 \
| gzip > $(TSBS_QUERY_FILE)
# Generate all types of benchmark queries
tsbs-generate-queries-all:
$(MAKE) tsbs-generate-queries TSBS_QUERY_TYPE=single-groupby-1-1-1
$(MAKE) tsbs-generate-queries TSBS_QUERY_TYPE=single-groupby-1-1-12
$(MAKE) tsbs-generate-queries TSBS_QUERY_TYPE=single-groupby-1-8-1
$(MAKE) tsbs-generate-queries TSBS_QUERY_TYPE=single-groupby-5-1-1
$(MAKE) tsbs-generate-queries TSBS_QUERY_TYPE=single-groupby-5-1-12
$(MAKE) tsbs-generate-queries TSBS_QUERY_TYPE=single-groupby-5-8-1
$(MAKE) tsbs-generate-queries TSBS_QUERY_TYPE=cpu-max-all-1
$(MAKE) tsbs-generate-queries TSBS_QUERY_TYPE=cpu-max-all-8
$(MAKE) tsbs-generate-queries TSBS_QUERY_TYPE=double-groupby-1
$(MAKE) tsbs-generate-queries TSBS_QUERY_TYPE=double-groupby-5
$(MAKE) tsbs-generate-queries TSBS_QUERY_TYPE=double-groupby-all
# Run benchmark queries of a given type against VictoriaMetrics
tsbs-run-queries:
cat $(TSBS_QUERY_FILE) | gunzip | /tmp/tsbs/bin/tsbs_run_queries_victoriametrics --workers=$(TSBS_WORKERS) --urls=$(TSBS_READ_URLS)
# Run all types of benchmark queries against VictoriaMetrics
tsbs-run-queries-all:
$(MAKE) tsbs-run-queries TSBS_QUERY_TYPE=single-groupby-1-1-1
$(MAKE) tsbs-run-queries TSBS_QUERY_TYPE=single-groupby-1-1-12
$(MAKE) tsbs-run-queries TSBS_QUERY_TYPE=single-groupby-1-8-1
$(MAKE) tsbs-run-queries TSBS_QUERY_TYPE=single-groupby-5-1-1
$(MAKE) tsbs-run-queries TSBS_QUERY_TYPE=single-groupby-5-1-12
$(MAKE) tsbs-run-queries TSBS_QUERY_TYPE=single-groupby-5-8-1
$(MAKE) tsbs-run-queries TSBS_QUERY_TYPE=cpu-max-all-1
$(MAKE) tsbs-run-queries TSBS_QUERY_TYPE=cpu-max-all-8
$(MAKE) tsbs-run-queries TSBS_QUERY_TYPE=double-groupby-1
$(MAKE) tsbs-run-queries TSBS_QUERY_TYPE=double-groupby-5
# Too heavy: retrieves 1B samples
# $(MAKE) tsbs-run-queries TSBS_QUERY_TYPE=double-groupby-all
benchmark: add gnuplot to show write speed (#9490) ### Describe Your Changes Implemented the script that generates graphs using `gnuplot`. Those graphs show the write speed to the db. How to use it: 1. From the root run `make tsbs`; 2. The file will be generated automatically `/tmp/tsbs-load-100000-2025-07-22T00:00:00Z-2025-07-23T00:00:00Z-80s.csv` 4. From the root run `make tsbs-plot-load` and observe the result 5. If you have two files with the `tsbs_load_victoriametrics` output, just define the second in the `TSBS_LOAD_RESULT_CSV_FILE_COMPARE=/tmp/tsbs-load-10 0000-2025-07-22T01:00:00Z-2025-07-23T01:00:00Z-80s.csv ` To plot the measurements from some other benchmark, run `make tsbs-plot-load TSBS_LOAD_RESULT_CSV_FILE=/path/to/file.csv` To plot the measurements from two benchmarks, run `make tsbs-plot-load TSBS_LOAD_RESULT_CSV_FILE=/path/to/file1.csv TSBS_LOAD_RESULT_CSV_FILE_COMPARE=/path/to/file2.csv` This command should generate a graph like described in the picture <img width="638" height="578" alt="Screenshot 2025-07-25 at 15 35 42" src="https://github.com/user-attachments/assets/900b05ab-0b98-4f7f-8f2c-18d28ad2eab6" /> ### Checklist The following checks are **mandatory**: - [x] My change adheres to [VictoriaMetrics contributing guidelines](https://docs.victoriametrics.com/victoriametrics/contributing/#pull-request-checklist). - [x] My change adheres to [VictoriaMetrics development goals](https://docs.victoriametrics.com/victoriametrics/goals/). --------- Signed-off-by: Artem Fetishev <rtm@victoriametrics.com> Co-authored-by: Artem Fetishev <rtm@victoriametrics.com> Co-authored-by: Artem Fetishev <149964189+rtm0@users.noreply.github.com>
2025-09-02 14:37:18 +02:00
# Plot the data load `per interval metrics/s` measurements
#
# To plot measurements collected during the recent benchmark, run
# make tsbs-plot-load
#
# To plot the measurements from some other benchmark, run
# make tsbs-plot-load TSBS_LOAD_RESULT_CSV_FILE=/path/to/file.csv
#
# To plot the measurements from two benchmarks, run
# make tsbs-plot-load TSBS_LOAD_RESULT_CSV_FILE=/path/to/file1.csv TSBS_LOAD_RESULT_CSV_FILE_COMPARE=/path/to/file2.csv
tsbs-plot-load:
$(TSBS_PLOT_SCRIPT) $(TSBS_LOAD_RESULT_CSV_FILE) $(TSBS_LOAD_RESULT_CSV_FILE_COMPARE)