Skip to content

Commit 7e7aab2

Browse files
committed
remove old naming scheme and use DD where appropriate
1 parent 00ac55a commit 7e7aab2

21 files changed

+180
-351
lines changed

k8s/cluster.yaml

Lines changed: 25 additions & 29 deletions
Original file line numberDiff line numberDiff line change
@@ -1,34 +1,34 @@
11
apiVersion: v1
22
kind: Service
33
metadata:
4-
name: service-dfray-proxy
4+
name: service-dd-proxy
55
labels:
6-
app: dfray-proxy
6+
app: dd-proxy
77
spec:
88
type: ClusterIP
99
ports:
10-
- name: dfray-proxy
10+
- name: dd-proxy
1111
port: 20200
1212
targetPort: 20200
1313
selector:
14-
app: dfray-proxy
14+
app: dd-proxy
1515
---
1616
apiVersion: apps/v1
1717
kind: Deployment
1818
metadata:
19-
name: deployment-dfray-proxy
19+
name: deployment-dd-proxy
2020
labels:
21-
app: dfray-proxy
21+
app: dd-proxy
2222
spec:
2323
replicas: 2
2424
selector:
2525
matchLabels:
26-
app: dfray-proxy
26+
app: dd-proxy
2727
template:
2828
metadata:
2929
labels:
30-
app: dfray-proxy
31-
service: dfray-proxy
30+
app: dd-proxy
31+
service: dd-proxy
3232
team: mint
3333
admission.datadoghq.com/enabled: "true"
3434
annotations:
@@ -52,16 +52,14 @@ spec:
5252
- key: "node-role.kubernetes.io/nodeless"
5353
operator: Exists
5454
containers:
55-
- name: dfray-proxy
56-
image: registry.ddbuild.io/dfray-amd64:2025-06-17-b
55+
- name: dd-proxy
56+
image: registry.ddbuild.io/dd-amd64:2025-06-17-b
5757
env:
58-
- name: DATAFUSION_RAY_LOG_LEVEL
59-
value: trace
60-
- name: DFRAY_WORKER_DEPLOYMENT
61-
value: deployment-dfray-worker
62-
- name: DFRAY_WORKER_DEPLOYMENT_PORT
58+
- name: dd_WORKER_DEPLOYMENT
59+
value: deployment-dd-worker
60+
- name: dd_WORKER_DEPLOYMENT_PORT
6361
value: "20201"
64-
- name: DFRAY_WORKER_DEPLOYMENT_NAMESPACE
62+
- name: dd_WORKER_DEPLOYMENT_NAMESPACE
6563
valueFrom:
6664
fieldRef:
6765
fieldPath: metadata.namespace
@@ -76,7 +74,7 @@ spec:
7674
command:
7775
- sh
7876
- "-c"
79-
- "/dfray --mode proxy --port 20200"
77+
- "/dd --mode proxy --port 20200"
8078
ports:
8179
- containerPort: 20200
8280
resources:
@@ -90,19 +88,19 @@ spec:
9088
apiVersion: apps/v1
9189
kind: Deployment
9290
metadata:
93-
name: deployment-dfray-worker
91+
name: deployment-dd-worker
9492
labels:
95-
app: dfray-worker
93+
app: dd-worker
9694
spec:
9795
replicas: 2
9896
selector:
9997
matchLabels:
100-
app: dfray-worker
98+
app: dd-worker
10199
template:
102100
metadata:
103101
labels:
104-
app: dfray-worker
105-
service: service-dfray-worker
102+
app: dd-worker
103+
service: service-dd-worker
106104
team: mint
107105
admission.datadoghq.com/enabled: "true"
108106
annotations:
@@ -126,13 +124,11 @@ spec:
126124
- key: "node-role.kubernetes.io/nodeless"
127125
operator: Exists
128126
containers:
129-
- name: dfray-worker
130-
image: registry.ddbuild.io/dfray-amd64:2025-06-17-b
127+
- name: dd-worker
128+
image: registry.ddbuild.io/dd-amd64:2025-06-17-b
131129
env:
132-
- name: DATAFUSION_RAY_LOG_LEVEL
133-
value: trace
134130
- name: RUST_LOG
135-
value: datafusion_bindings=info,cs3_query=info
131+
value: distributed_datafusion=trace,datafusion_bindings=info,cs3_query=info
136132
- name: HDQ_URL
137133
value: http://hdq-creed.data-eng.all-clusters.local-dc.fabric.dog:6420
138134
- name: MEM_THRESHOLD
@@ -142,7 +138,7 @@ spec:
142138
command:
143139
- sh
144140
- "-c"
145-
- "/dfray --mode worker --port 20201"
141+
- "/dd --mode worker --port 20201"
146142
ports:
147143
- containerPort: 20201
148144
resources:

k8s/dev_cluster.yaml

Lines changed: 26 additions & 30 deletions
Original file line numberDiff line numberDiff line change
@@ -1,51 +1,49 @@
11
apiVersion: v1
22
kind: Service
33
metadata:
4-
name: service-dfray-proxy
4+
name: service-dd-proxy
55
labels:
6-
app: dfray-proxy
6+
app: dd-proxy
77
spec:
88
type: ClusterIP
99
ports:
10-
- name: dfray-proxy
10+
- name: dd-proxy
1111
port: 20200
1212
targetPort: 20200
1313
selector:
14-
app: dfray-proxy
14+
app: dd-proxy
1515
---
1616
apiVersion: apps/v1
1717
kind: Deployment
1818
metadata:
19-
name: deployment-dfray-proxy
19+
name: deployment-dd-proxy
2020
labels:
21-
app: dfray-proxy
21+
app: dd-proxy
2222
spec:
2323
replicas: 1
2424
selector:
2525
matchLabels:
26-
app: dfray-proxy
26+
app: dd-proxy
2727
template:
2828
metadata:
2929
labels:
30-
app: dfray-proxy
31-
service: dfray-proxy
30+
app: dd-proxy
31+
service: dd-proxy
3232
spec:
3333
containers:
34-
- name: dfray-proxy
35-
image: registry.ddbuild.io/dfray:2025-06-16-e
34+
- name: dd-proxy
35+
image: registry.ddbuild.io/dd:2025-06-16-e
3636
env:
37-
- name: DATAFUSION_RAY_LOG_LEVEL
38-
value: debug
39-
- name: DFRAY_WORKER_DEPLOYMENT
40-
value: deployment-dfray-worker
41-
- name: DFRAY_WORKER_DEPLOYMENT_PORT
37+
- name: dd_WORKER_DEPLOYMENT
38+
value: deployment-dd-worker
39+
- name: dd_WORKER_DEPLOYMENT_PORT
4240
value: "20201"
43-
- name: DFRAY_WORKER_DEPLOYMENT_NAMESPACE
41+
- name: dd_WORKER_DEPLOYMENT_NAMESPACE
4442
valueFrom:
4543
fieldRef:
4644
fieldPath: metadata.namespace
4745
- name: RUST_LOG
48-
value: datafusion_bindings=info,cs3_query=info
46+
value: datafusion_bindings=info,cs3_query=info,distributed_datafusion=debug
4947
- name: HDQ_URL
5048
value: http://hdq-creed.data-eng.all-clusters.local-dc.fabric.dog:6420
5149
- name: MEM_THRESHOLD
@@ -55,35 +53,33 @@ spec:
5553
command:
5654
- sh
5755
- "-c"
58-
- "/dfray --mode proxy --port 20200"
56+
- "/dd --mode proxy --port 20200"
5957
ports:
6058
- containerPort: 20200
6159
---
6260
apiVersion: apps/v1
6361
kind: Deployment
6462
metadata:
65-
name: deployment-dfray-worker
63+
name: deployment-dd-worker
6664
labels:
67-
app: dfray-worker
65+
app: dd-worker
6866
spec:
6967
replicas: 2
7068
selector:
7169
matchLabels:
72-
app: dfray-worker
70+
app: dd-worker
7371
template:
7472
metadata:
7573
labels:
76-
app: dfray-worker
77-
service: service-dfray-worker
74+
app: dd-worker
75+
service: service-dd-worker
7876
spec:
7977
containers:
80-
- name: dfray-worker
81-
image: registry.ddbuild.io/dfray:2025-06-16-e
78+
- name: dd-worker
79+
image: registry.ddbuild.io/dd:2025-06-16-e
8280
env:
83-
- name: DATAFUSION_RAY_LOG_LEVEL
84-
value: debug
8581
- name: RUST_LOG
86-
value: datafusion_bindings=info,cs3_query=info
82+
value: datafusion_bindings=info,cs3_query=info,distributed_datafusion=debug
8783
- name: HDQ_URL
8884
value: http://hdq-creed.data-eng.all-clusters.local-dc.fabric.dog:6420
8985
- name: MEM_THRESHOLD
@@ -93,7 +89,7 @@ spec:
9389
command:
9490
- sh
9591
- "-c"
96-
- "/dfray --mode worker --port 20201"
92+
- "/dd --mode worker --port 20201"
9793
ports:
9894
- containerPort: 20201
9995
---

scripts/build_and_push_docker.sh

Lines changed: 0 additions & 39 deletions
This file was deleted.

scripts/launch_tpch_cluster.sh

Lines changed: 4 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -59,6 +59,7 @@ done
5959
NUM_WORKERS=${NUM_WORKERS:-$DEFAULT_NUM_WORKERS}
6060
TPCH_DATA_DIR=${TPCH_DATA_DIR:-$DEFAULT_TPCH_PATH}
6161
LOG_DIR=${LOG_DIR:-$DEFAULT_LOG_PATH}
62+
RUST_LOG=${RUST_LOG:-"info,distributed_datafusion=debug"}
6263

6364
# Validate inputs
6465
if [ "$NUM_WORKERS" -lt 1 ]; then
@@ -116,8 +117,7 @@ echo " - Log Directory: $LOG_DIR"
116117
echo
117118

118119
# Define environment variables
119-
export DATAFUSION_RAY_LOG_LEVEL=trace
120-
export DFRAY_TABLES="customer:parquet:${TPCH_DATA_DIR}/customer.parquet,\
120+
export DD_TABLES="customer:parquet:${TPCH_DATA_DIR}/customer.parquet,\
121121
lineitem:parquet:${TPCH_DATA_DIR}/lineitem.parquet,\
122122
nation:parquet:${TPCH_DATA_DIR}/nation.parquet,\
123123
orders:parquet:${TPCH_DATA_DIR}/orders.parquet,\
@@ -147,8 +147,7 @@ for ((i = 0; i < NUM_WORKERS; i++)); do
147147
WORKER_NAME="worker$((i + 1))"
148148
LOG_FILE="${LOG_DIR}/${WORKER_NAME}.log"
149149
echo " Starting $WORKER_NAME on port $PORT..."
150-
#env DATAFUSION_RAY_LOG_LEVEL="$DATAFUSION_RAY_LOG_LEVEL" DFRAY_TABLES="$DFRAY_TABLES" ./target/release/distributed-datafusion --mode worker --port $PORT >"$LOG_FILE" 2>&1 &
151-
env RUST_BACKTRACE=1 DATAFUSION_RAY_LOG_LEVEL="$DATAFUSION_RAY_LOG_LEVEL" DFRAY_TABLES="$DFRAY_TABLES" ./target/debug/distributed-datafusion --mode worker --port $PORT >"$LOG_FILE" 2>&1 &
150+
env RUST_LOG="$RUST_LOG" RUST_BACKTRACE=1 DD_TABLES="$DD_TABLES" ./target/debug/distributed-datafusion --mode worker --port $PORT >"$LOG_FILE" 2>&1 &
152151
WORKER_PIDS[$i]=$!
153152
WORKER_ADDRESSES[$i]="localhost:${PORT}"
154153
done
@@ -167,8 +166,7 @@ WORKER_ADDRESSES_STR=$(
167166
echo "Starting proxy on port 20200..."
168167
echo "Connecting to workers: $WORKER_ADDRESSES_STR"
169168
PROXY_LOG="${LOG_DIR}/proxy.log"
170-
#env DATAFUSION_RAY_LOG_LEVEL="$DATAFUSION_RAY_LOG_LEVEL" DFRAY_TABLES="$DFRAY_TABLES" DFRAY_WORKER_ADDRESSES="$WORKER_ADDRESSES_STR" ./target/release/distributed-datafusion --mode proxy --port 20200 >"$PROXY_LOG" 2>&1 &
171-
env RUST_BACKTRACE=1 DATAFUSION_RAY_LOG_LEVEL="$DATAFUSION_RAY_LOG_LEVEL" DFRAY_TABLES="$DFRAY_TABLES" DFRAY_WORKER_ADDRESSES="$WORKER_ADDRESSES_STR" ./target/debug/distributed-datafusion --mode proxy --port 20200 >"$PROXY_LOG" 2>&1 &
169+
env RUST_LOG="$RUST_LOG" RUST_BACKTRACE=1 DD_TABLES="$DD_TABLES" DD_WORKER_ADDRESSES="$WORKER_ADDRESSES_STR" ./target/debug/distributed-datafusion --mode proxy --port 20200 >"$PROXY_LOG" 2>&1 &
172170
PROXY_PID=$!
173171

174172
echo

scripts/python_tests.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -23,4 +23,4 @@ maturin develop
2323

2424
python tpch/make_data.py $TPCH_SCALING_FACTOR $TPCH_DATA_PATH
2525

26-
DATAFUSION_RAY_LOG_LEVEL=debug RAY_COLOR_PREFIX=1 RAY_DEDUP_LOGS=0 python tpch/tpcbench.py --data=file:///$TPCH_DATA_PATH/ --concurrency 3 --partitions-per-processor 2 --batch-size=8192 --worker-pool-min=20 --validate
26+
RUST_LOG=distributed_datafusion=debug python tpch/tpcbench.py --data=file:///$TPCH_DATA_PATH/ --concurrency 3 --partitions-per-processor 2 --batch-size=8192 --worker-pool-min=20 --validate

0 commit comments

Comments
 (0)