Skip to content
This repository was archived by the owner on Aug 8, 2025. It is now read-only.

Commit 67d02f0

Browse files
committed
Update to 0.14.2, use method helpers for message and http, ask for user and token when running plan
1 parent 94fffcc commit 67d02f0

27 files changed

Lines changed: 274 additions & 271 deletions

Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
-FROM datacatering/data-caterer:0.14.0
+FROM datacatering/data-caterer:0.14.2
 
 COPY --chown=app:app build/libs/data-caterer-example-0.1.0.jar /opt/app/job.jar

benchmark/run_benchmark.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@ case "${uname_out}" in
 *) sed_option="-r";;
 esac
 data_sizes=(10000 100000 1000000)
-job_names=("BenchmarkForeignKeyPlanRun" "BenchmarkJsonPlanRun" "BenchmarkParquetPlanRun") #"BenchmarkAdvancedKafkaPlanRun"
+job_names=("BenchmarkForeignKeyPlanRun" "BenchmarkJsonPlanRun" "BenchmarkParquetPlanRun")
 
 spark_query_execution_engines=("default" "blaze" "comet" "gluten")
 gluten_spark_conf="--conf \"spark.plugins=io.glutenproject.GlutenPlugin\" --conf \"spark.memory.offHeap.enabled=true\" --conf \"spark.memory.offHeap.size=1024mb\" --conf \"spark.shuffle.manager=org.apache.spark.shuffle.sort.ColumnarShuffleManager\""

docker/data/custom/task/http/http-account-task-simple.yaml

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -14,26 +14,26 @@ steps:
 fields:
 - name: "id"
 options:
-sql: "bodyContent.account_id"
+sql: "body.account_id"
 - name: "queryParam"
 fields:
 - name: "limit"
 type: "integer"
 options:
-oneOf:
-- 10
-- 5
+min: 1
+max: 10
 - name: "httpHeaders"
 fields:
 - name: "Content-Type"
 static: "application/json"
+- name: "Content-Length"
 - name: "X-Account-Id"
 options:
-sql: "bodyContent.account_id"
+sql: "body.account_id"
 - name: "X-Updated"
 type: "timestamp"
 options:
-sql: "bodyContent.details.updated_by.time"
+sql: "body.details.updated_by.time"
 - name: "httpBody"
 fields:
 - name: "account_id"

docker/data/custom/task/kafka/kafka-account-task-simple.yaml

Lines changed: 5 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@ steps:
 - name: "key"
 type: "string"
 options:
-sql: "content.account_id"
+sql: "body.account_id"
 - name: "messageBody"
 fields:
 - name: "account_id"
@@ -27,11 +27,10 @@ steps:
 - name: "details"
 fields:
 - name: "name"
-- name: "txn_date"
+- name: "first_txn_date"
 type: "date"
 options:
-min: "2021-01-01"
-max: "2021-12-31"
+sql: "ELEMENT_AT(SORT_ARRAY(body.transactions.txn_date), 1)"
 - name: "updated_by"
 fields:
 - name: "user"
@@ -48,7 +47,7 @@ steps:
 fields:
 - name: "account-id"
 options:
-sql: "content.account_id"
+sql: "body.account_id"
 - name: "updated"
 options:
-sql: "content.details.update_by.time"
+sql: "body.details.update_by.time"

docker/data/custom/validation/simple-validation.yaml

Lines changed: 14 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,20 @@ dataSources:
 path: "app/src/test/resources/sample/json/txn-gen"
 validations:
 - expr: "amount < 100"
+- field: amount
+validation:
+- type: "null"
+negate: true
+- type: "between"
+min: 1
+max: 10
+description: "hello"
+errorThreshold: 2
+- type: "quantileValuesBetween"
+quantileRanges:
+0.1:
+- - 1.0
+- 10.0
 - expr: "year == 2021"
 errorThreshold: 0.1
 - expr: "regexp_like(name, 'Peter .*')"

gradle.properties

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -8,5 +8,5 @@ version=0.1.0
 
 scalaVersion=2.12
 scalaSpecificVersion=2.12.19
-dataCatererVersion=0.14.1
+dataCatererVersion=0.14.2
 sparkMajorVersion=3.5

helm/data-caterer/values.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@ image:
 repository: "datacatering/data-caterer"
 pullPolicy: "IfNotPresent"
 # Overrides the image tag whose default is the chart appVersion.
-tag: "0.14.0"
+tag: "0.14.2"
 
 imagePullSecrets: []
 nameOverride: ""

run.sh

Lines changed: 18 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -1,19 +1,26 @@
 #!/usr/bin/env bash
 
+DATA_CATERER_ENV_FILE="$HOME/.data-caterer-env"
+
 data_caterer_version=$(grep dataCatererVersion gradle.properties | cut -d= -f2)
 data_caterer_user=${DATA_CATERER_API_USER:-}
 data_caterer_token=${DATA_CATERER_API_TOKEN:-}
 
 echo "Checking for Data Caterer user and token..."
-if [[ -z ${DATA_CATERER_API_USER} ]]; then
-read -p "Data Caterer user: " data_caterer_user
-DATA_CATERER_API_USER=data_caterer_user
-fi
-if [[ -z ${DATA_CATERER_API_TOKEN} ]]; then
-read -p "Data Caterer token: " -s data_caterer_token
-DATA_CATERER_API_TOKEN=data_caterer_token
-echo
+if [[ -f "$DATA_CATERER_ENV_FILE" ]]; then
+source "$DATA_CATERER_ENV_FILE"
+else
+if [[ -z ${DATA_CATERER_API_USER} ]]; then
+read -p "Data Caterer user: " data_caterer_user
+echo "export DATA_CATERER_API_USER=$data_caterer_user" > "$DATA_CATERER_ENV_FILE"
+fi
+if [[ -z ${DATA_CATERER_API_TOKEN} ]]; then
+read -p "Data Caterer token: " -s data_caterer_token
+echo "export DATA_CATERER_API_TOKEN=$data_caterer_token" >> "$DATA_CATERER_ENV_FILE"
+echo
+fi
 fi
+source "$DATA_CATERER_ENV_FILE"
 
 if [[ -s ".tmp_prev_class_name" ]]; then
 prev_class_name=$(cat .tmp_prev_class_name)
@@ -58,9 +65,9 @@ DOCKER_CMD=(
 -e "DEPLOY_MODE=client"
 -e "DRIVER_MEMORY=2g"
 -e "EXECUTOR_MEMORY=2g"
--e "DATA_CATERER_API_USER=$data_caterer_user"
--e "DATA_CATERER_API_TOKEN=$data_caterer_token"
---network "docker_default"
+-e "DATA_CATERER_API_USER=$DATA_CATERER_API_USER"
+-e "DATA_CATERER_API_TOKEN=$DATA_CATERER_API_TOKEN"
+--network "insta-infra_default"
 datacatering/data-caterer:"$data_caterer_version"
 )
 

src/main/java/io/github/datacatering/plan/AdvancedBatchEventJavaPlanRun.java

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@
 
 public class AdvancedBatchEventJavaPlanRun extends PlanRun {
 {
-var kafkaTask = new AdvancedKafkaJavaPlanRun().getKafkaTask();
+var kafkaTask = new KafkaJavaPlanRun().getKafkaTask();
 
 var csvTask = csv("my_csv", "/opt/app/data/csv/account")
 .fields(

src/main/java/io/github/datacatering/plan/AdvancedKafkaJavaPlanRun.java

Lines changed: 0 additions & 63 deletions
This file was deleted.

0 commit comments

Comments
 (0)