File tree Expand file tree Collapse file tree 2 files changed +54
-1
lines changed
Expand file tree Collapse file tree 2 files changed +54
-1
lines changed Original file line number Diff line number Diff line change @@ -17,7 +17,7 @@ services:
1717
1818 stream-collector :
1919 container_name : " snowplow-stream-collector"
20- image : snowplow/scala-stream-collector-kinesis:3.2.0-distroless
20+ image : snowplow/scala-stream-collector-kinesis:3.2.1-distroless
2121 command : ["--config", "/snowplow/collector/config.hocon"]
2222 depends_on :
2323 - localstack
Original file line number Diff line number Diff line change 1+ {
2+ "license" : {
3+ "accept" : ${ACCEPT_LICENSE}
4+ },
5+ "input" : {
6+ "streamName" : "enriched-good"
7+ "appName" : "lake-loader-iceberg"
8+ "customEndpoint" : "http://localhost.localstack.cloud:4566"
9+ "initialPosition" : {
10+ "type" : "LATEST"
11+ }
12+ "retrievalMode" : {
13+ "type" : "FanOut"
14+ }
15+ "workerIdentifier" : ${HOSTNAME}
16+ "leaseDuration" : "10 seconds"
17+ }
18+
19+ "output" : {
20+
21+ "good" : {
22+ "type" : "Iceberg" ,
23+ "database" : "atomic"
24+ "table" : "events"
25+ "location" : "s3a://snowplow-lake-loader/events" # served by LocalStack here (see "fs.s3a.endpoint" below); this can also point at a real S3 bucket
26+ "catalog" : {
27+ "type" : "Hadoop"
28+ }
29+ }
30+
31+ "bad" : {
32+ "streamName" : "bad"
33+ }
34+ }
35+
36+ "spark" : {
37+
38+ # -- How many times a Spark task should be retried in case of failure.
39+ "taskRetries" : 3
40+ # -- Any valid spark configuration key/value.
41+ # -- This can be blank in most setups because the loader already sets sensible defaults.
42+ # https://github.com/apache/iceberg/commit/fa6403b1888847ce04de50c6b159dd43fdcb4590
43+ "conf" : {
44+ "fs.s3a.endpoint" : "http://s3.localhost.localstack.cloud:4566"
45+ }
46+ }
47+
48+ "windowing" : "15 seconds" # deliberately short period for frequent writes
49+ "inMemBatchBytes" : 1000
50+ "telemetry" : {
51+ "disable" : true
52+ }
53+ }
You can’t perform that action at this time.
0 commit comments