Skip to content

Commit 54a91c1

Browse files
committed
drtprod: archive previous 300 node runs
Epic: None Release note: None
1 parent 5e92542 commit 54a91c1

File tree

2 files changed

+171
-0
lines changed

2 files changed

+171
-0
lines changed
Lines changed: 171 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,171 @@
1+
# YAML for creating and configuring the drt-scale-300 cluster and its workload cluster. This also configures Datadog.
2+
# Build the roachprod and roachtest binaries (using --cross) before running this script
3+
# Environment variables for this configuration. The targets reference
# CLUSTER, WORKLOAD_CLUSTER, CLUSTER_NODES and WORKLOAD_NODES as $VAR.
environment:
  # GCE service account, DNS settings and project used by roachprod.
  ROACHPROD_GCE_DEFAULT_SERVICE_ACCOUNT: 622274581499-compute@developer.gserviceaccount.com
  ROACHPROD_DNS: drt.crdb.io
  ROACHPROD_GCE_DNS_DOMAIN: drt.crdb.io
  ROACHPROD_GCE_DNS_ZONE: drt
  ROACHPROD_GCE_DEFAULT_PROJECT: cockroach-drt
  # Cluster names.
  CLUSTER: drt-scale-300
  WORKLOAD_CLUSTER: workload-scale-300
  # Sizes. Quoted so they stay strings rather than being typed as integers
  # by the YAML parser; environment variables are strings.
  CLUSTER_NODES: "300"
  # NOTE(review): TOTAL_PARTITIONS is not referenced by any target in this
  # file; presumably it is read by one of the scripts — confirm.
  TOTAL_PARTITIONS: "15"
  WORKLOAD_NODES: "15"
14+
15+
# Files this configuration depends on: the scripts run by `script:` steps
# and the artifacts uploaded by `put` steps.
dependent_file_locations:
# Scripts referenced by `script:` steps in the targets.
- pkg/cmd/drtprod/scripts/setup_datadog_cluster
- pkg/cmd/drtprod/scripts/setup_datadog_workload
- pkg/cmd/drtprod/scripts/tpcc_init.sh
- pkg/cmd/drtprod/scripts/generate_tpcc_run.sh
# NOTE(review): populate_workload_keys.sh is run by the post_tasks target
# but was missing from this list; added so that every script used by a
# `script:` step is declared here — confirm.
- pkg/cmd/drtprod/scripts/populate_workload_keys.sh
# Artifacts uploaded to the workload cluster by `put` steps.
- artifacts/roachtest
- artifacts/drtprod
22+
23+
targets:
24+
# crdb cluster specs
25+
# Target that creates, stages, starts and configures the CockroachDB cluster.
- target_name: $CLUSTER
  steps:
  # Create the cluster VMs on GCE.
  # NOTE(review): unlike the workload cluster's create step, this step has no
  # on_rollback — confirm that is intentional.
  - command: create
    args:
    - $CLUSTER
    flags:
      clouds: gce
      gce-managed: true
      gce-enable-multiple-stores: true
      # NOTE(review): the per-zone counts sum to 90 while nodes is
      # $CLUSTER_NODES (300) — confirm the intended zone placement.
      gce-zones: "us-central1-a:30,us-central1-b:30,us-central1-c:30"
      nodes: $CLUSTER_NODES
      gce-machine-type: n2-standard-16
      # Persistent SSD disks instead of local SSDs: two 2048 volumes per node,
      # matching store-count: 2 on the start step.
      local-ssd: false
      gce-pd-volume-size: 2048
      gce-pd-volume-type: pd-ssd
      gce-pd-volume-count: 2
      os-volume-size: 100
      username: drt
      lifetime: 8760h
      gce-image: "ubuntu-2204-jammy-v20250112"
  - command: sync
    flags:
      clouds: gce
  # Stage a release build first (for libgeos), then the cockroach binary
  # that is actually started below.
  - command: stage
    args:
    - $CLUSTER
    - release
    - v25.2.0-rc.1  # for libgeos
  - command: stage
    args:
    - $CLUSTER
    - cockroach
    - release-25.2.1-rc
  - script: "pkg/cmd/drtprod/scripts/setup_datadog_cluster"
  - command: start
    args:
    - $CLUSTER
    - "--binary"
    - "./cockroach"
    flags:
      # TODO: add a flag to set provisioned throughput on each store
      # according to the cloud provider's limits.
      enable-fluent-sink: true
      store-count: 2
      args: --wal-failover=among-stores
      restart: false
      sql-port: 26257
  # Unmask and enable cron, then install an @reboot crontab entry that runs
  # ~/cockroach.sh after a 100 second sleep. The folded scalar below yields
  # the same single-line command string as before.
  # NOTE(review): in the generated t.sh only the echo is piped into
  # `crontab -`; the output of `crontab -l` is not, so existing crontab
  # entries are not preserved — confirm that is intended.
  - command: run
    args:
    - $CLUSTER
    - "--"
    - >-
      sudo systemctl unmask cron.service ;
      sudo systemctl enable cron.service ;
      echo "crontab -l ; echo '@reboot sleep 100 && ~/cockroach.sh' | crontab -" > t.sh ;
      sh t.sh ;
      rm t.sh
  # Set the snapshot rebalance rate cluster setting via $CLUSTER:1.
  - command: sql
    args:
    - $CLUSTER:1
    - "--"
    - "-e"
    - "SET CLUSTER SETTING kv.snapshot_rebalance.max_rate='256 MB'"
82+
# workload cluster specs
83+
# Target that creates the workload cluster and uploads the binaries it needs.
- target_name: $WORKLOAD_CLUSTER
  steps:
  # Create the workload VMs in a single zone; destroy them on rollback.
  - command: create
    args:
    - $WORKLOAD_CLUSTER
    flags:
      clouds: gce
      gce-zones: "us-central1-a"
      nodes: $WORKLOAD_NODES
      gce-machine-type: n2-standard-8
      os-volume-size: 100
      username: workload
      lifetime: 8760h
      gce-image: "ubuntu-2204-jammy-v20250112"
    on_rollback:
    - command: destroy
      args:
      - $WORKLOAD_CLUSTER
  - command: sync
    flags:
      clouds: gce
  # NOTE(review): no version is given for this stage step, unlike the
  # cockroach stage step on the main cluster — confirm the default is wanted.
  - command: stage
    args:
    - $WORKLOAD_CLUSTER
    - cockroach
  # Upload the roachtest artifact under the name roachtest-operations.
  - command: put
    args:
    - $WORKLOAD_CLUSTER
    - artifacts/roachtest
    - roachtest-operations
  # Upload the drtprod artifact (no destination name given).
  - command: put
    args:
    - $WORKLOAD_CLUSTER
    - artifacts/drtprod
  - script: "pkg/cmd/drtprod/scripts/setup_datadog_workload"
118+
# Target that runs after both clusters: copies certs to the workload
# cluster, initializes TPC-C and runs populate_workload_keys.sh.
- target_name: post_tasks
  dependent_targets:
  - $CLUSTER
  - $WORKLOAD_CLUSTER
  steps:
  # Remove any existing certs-$CLUSTER before fetching a fresh copy.
  - script: rm
    args:
    - "-rf"
    - certs-$CLUSTER
  # Fetch `certs` from $CLUSTER:1 into certs-$CLUSTER.
  - command: get
    args:
    - $CLUSTER:1
    - certs
    - certs-$CLUSTER
  # Upload certs-$CLUSTER to the workload cluster as `certs`.
  - command: put
    args:
    - $WORKLOAD_CLUSTER
    - certs-$CLUSTER
    - certs
  # Restrict permissions on the uploaded cert files. "600" is quoted so it is
  # passed as a string argument rather than typed as an integer.
  - command: ssh
    args:
    - $WORKLOAD_CLUSTER
    - "--"
    - chmod
    - "600"
    - './certs/*'
  # "false" is quoted so it is passed as a string argument rather than typed
  # as a boolean.
  - script: "pkg/cmd/drtprod/scripts/tpcc_init.sh"
    args:
    - cct_tpcc
    - "false"
    flags:
      warehouses: 4000000
      db: cct_tpcc
  - script: pkg/cmd/drtprod/scripts/populate_workload_keys.sh
152+
# Target that runs generate_tpcc_run.sh with the TPC-C run parameters.
- target_name: tpcc_run
  dependent_targets:
  - $CLUSTER
  - $WORKLOAD_CLUSTER
  steps:
  # "false" is quoted so it is passed as a string argument rather than typed
  # as a boolean.
  - script: "pkg/cmd/drtprod/scripts/generate_tpcc_run.sh"
    args:
    - cct_tpcc
    - "false"
    flags:
      # db and warehouses match the values given to tpcc_init.sh in the
      # post_tasks target.
      db: cct_tpcc
      warehouses: 4000000
      active-warehouses: 500000
      active-workers: 2000
      conns: 2000
      max-rate: 2500
      workers: 500000
      duration: 12h
      ramp: 1h
      wait: 0

pkg/cmd/drtprod/configs/drt_scale_300_bench.yaml renamed to pkg/cmd/drtprod/configs/archived/2025_07_drt_scale_300_bench.yaml

File renamed without changes.

0 commit comments

Comments
 (0)