-
Notifications
You must be signed in to change notification settings - Fork 89
/
simple-impala-part.conf
53 lines (51 loc) · 1.06 KB
/
simple-impala-part.conf
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
# Application-level settings for this pipeline.
application {
  # Human-readable name of the application.
  name = "Simple Impala Partitioned HDFS Example"
}
include file("env.conf")
# Pipeline steps. Each step lists the steps it depends on in `dependencies`.
#
# NOTE: the `${processing_date}` tokens below sit inside quoted strings, so the
# HOCON parser leaves them as literal text. They are presumably expanded by the
# `loop_dates` step, which declares `processing_date` as its parameter --
# confirm against the loop step documentation.
steps {

  # Loop over the integer range 20190101..20190102, one value at a time
  # (mode = serial), exposing each value as `processing_date`.
  loop_dates {
    type = loop
    mode = serial
    source = range
    range {
      start = 20190101
      end = 20190102
    }
    parameter = processing_date
  }

  # Read the JSON input file whose name carries the current processing date.
  fsInput {
    dependencies = [loop_dates]
    input {
      type = filesystem
      path = "/tmp/example-input/example-input-${processing_date}.json"
      format = json
    }
  }

  # Select the columns of interest from the per-date input and write them as
  # Parquet into the `ymd=<date>` directory, overwriting what is there.
  fsProcess {
    dependencies = [fsInput, loop_dates]
    deriver {
      type = sql
      # The table name is the input step name suffixed with the loop value.
      query.literal = "SELECT id,foo,blah,ymd FROM fsInput_${processing_date}"
    }
    planner {
      type = overwrite
    }
    output {
      type = filesystem
      path = "/tmp/example-output-partitioned/ymd=${processing_date}"
      format = parquet
    }
  }

  # After the data for a date is written, add the matching partition to the
  # `example_output_part` table through an Impala DDL task.
  ddl {
    dependencies = [fsProcess, loop_dates]
    type = task
    # `${env.impala}` is a real HOCON substitution (unquoted); the object that
    # follows is merged on top of it. It is presumably defined in the included
    # env.conf -- verify there.
    task = ${env.impala} {
      type = impala_ddl
      query {
        type = "add_partition"
        table = "example_output_part"
        partition {
          spec = "ymd=${processing_date}"
        }
      }
    }
  }
}