-
Notifications
You must be signed in to change notification settings - Fork 15
/
Copy pathdbt_project.yml
192 lines (183 loc) · 4.86 KB
/
dbt_project.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
# Project identity and the dbt_project.yml schema version.
name: 'calitp_warehouse'
version: '1.0.0'
config-version: 2

# Connection "profile" that dbt uses for this project.
profile: 'calitp_warehouse'

# Where dbt looks for each type of file. For example, `model-paths` says that
# models in this project live in the "models/" directory. You probably won't
# need to change these!
model-paths:
  - "models"
analysis-paths:
  - "analyses"
test-paths:
  - "tests"
seed-paths:
  - "seeds"
macro-paths:
  - "macros"
snapshot-paths:
  - "snapshots"

# Directory which will store compiled SQL files.
target-path: "target"

# Directories to be removed by `dbt clean`.
clean-targets:
  - "target"
  - "dbt_packages"
# Project-wide variables. Every entry must be nested under `vars:`; at column 0
# they would be parsed as (unknown) top-level project keys instead.
vars:
  # Enable legacy behavior for dbt_utils surrogate keys, i.e. coalesce nulls
  # to empty strings.
  surrogate_key_treat_nulls_as_empty_strings: true

  # Dates stay quoted so YAML loads them as strings rather than date objects.
  GTFS_SCHEDULE_START: '2021-04-16'
  PROD_GTFS_RT_START: '2022-09-15'

  # Defaults to the empty string.
  INCREMENTAL_MAX_DT: ''

  # The key contains a colon, so it must remain quoted.
  'dbt_date:time_zone': 'America/Los_Angeles'

  # You can override with DBT_SOURCE_DATABASE env var rather than constantly
  # using --vars.
  SOURCE_DATABASE: cal-itp-data-infra
# Model configuration, applied hierarchically by directory.
#
# Layout: <project> -> <layer> -> <dataset directory> -> configs.
# Keys prefixed with `+` are configs; `schema` is also a config here, written
# without the prefix. Every other key names a directory. Each dataset directory
# carries `domain` / `dataset` labels; mart directories additionally set their
# own `schema`.
models:
  calitp_warehouse:
    # Project-wide defaults.
    schema: staging
    +persist_docs:
      relation: true
      columns: true

    # Staging layer: materialized as views in the `staging` schema.
    staging:
      +materialized: view
      schema: staging
      amplitude:
        +labels:
          domain: staging
          dataset: benefits
      audit:
        +labels:
          domain: staging
          dataset: audit
      gtfs:
        +labels:
          domain: staging
          dataset: gtfs
      gtfs_quality:
        +labels:
          domain: staging
          dataset: gtfs_quality
      ntd:
        +labels:
          domain: staging
          dataset: ntd
      ntd_annual_reporting:
        +labels:
          domain: staging
          dataset: ntd_annual_reporting
      ntd_ridership:
        +labels:
          domain: staging
          dataset: ntd_ridership
      ntd_safety_and_security:
        +labels:
          domain: staging
          dataset: ntd_safety_and_security
      ntd_validation:
        +labels:
          domain: staging
          dataset: ntd_validation
      payments:
        +labels:
          domain: staging
          dataset: payments
      rt:
        +labels:
          domain: staging
          dataset: gtfs
      state_geoportal:
        +labels:
          domain: staging
          dataset: state_geoportal
      transit_database:
        +labels:
          domain: staging
          dataset: transit_database

    # Intermediate layer: sets no schema or materialization of its own, so it
    # inherits the project-wide defaults above.
    intermediate:
      gtfs:
        +labels:
          domain: intermediate
          dataset: gtfs
      gtfs_quality:
        +labels:
          domain: intermediate
          dataset: gtfs_quality
        # NOTE(review): nesting reconstructed on the assumption that
        # guidelines_checks is a subdirectory of gtfs_quality; confirm against
        # the models/ tree.
        guidelines_checks:
          +materialized: table
      ntd:
        +labels:
          domain: intermediate
          dataset: ntd
      ntd_validation:
        +labels:
          domain: intermediate
          dataset: ntd_validation
      payments:
        +labels:
          domain: intermediate
          dataset: payments
      transit_database:
        +labels:
          domain: intermediate
          dataset: transit_database

    # Mart layer: each dataset directory sets its own `mart_<dataset>` schema;
    # some are explicitly materialized as tables.
    mart:
      audit:
        +labels:
          domain: mart
          dataset: audit
        schema: mart_audit
      benefits:
        +labels:
          domain: mart
          dataset: benefits
        schema: mart_benefits
      gtfs:
        +labels:
          domain: mart
          dataset: gtfs
        schema: mart_gtfs
      gtfs_quality:
        +labels:
          domain: mart
          dataset: gtfs_quality
        schema: mart_gtfs_quality
      gtfs_schedule_latest:
        +labels:
          domain: mart
          dataset: gtfs_schedule_latest
        schema: mart_gtfs_schedule_latest
      ntd:
        +labels:
          domain: mart
          dataset: ntd
        schema: mart_ntd
      ntd_annual_reporting:
        +materialized: table
        +labels:
          domain: mart
          dataset: ntd_annual_reporting
        schema: mart_ntd_annual_reporting
      ntd_ridership:
        +materialized: table
        +labels:
          domain: mart
          dataset: ntd_ridership
        schema: mart_ntd_ridership
      ntd_safety_and_security:
        +materialized: table
        +labels:
          domain: mart
          dataset: ntd_safety_and_security
        schema: mart_ntd_safety_and_security
      ntd_validation:
        +labels:
          domain: mart
          dataset: ntd_validation
        schema: mart_ntd_validation
      payments:
        +materialized: table
        +labels:
          domain: mart
          dataset: payments
        schema: mart_payments
      transit_database:
        +labels:
          domain: mart
          dataset: transit_database
        schema: mart_transit_database
      transit_database_latest:
        +labels:
          domain: mart
          dataset: transit_database_latest
        schema: mart_transit_database_latest