# schema.yml - dbt properties file: model descriptions, columns and tests.
# Version of the dbt properties-file format used by this document.
version: 2
# One entry per model; each entry names the model and declares its
# description, columns and tests.
models:
# snowplow_web_events: the user, timestamp and session identifier columns
# are tested for not_null; page_view_id is tested for not_null, unique and
# a relationship to snowplow_web_page_context.
- name: snowplow_web_events
  description: Schema and table for web page context
  columns:
  - name: domain_userid
    tests:
    - not_null

  - name: collector_tstamp
    tests:
    - not_null

  - name: domain_sessionid
    tests:
    - not_null

  - name: page_view_id
    tests:
    - not_null
    - unique
    # Each page_view_id is checked against page_view_id in
    # snowplow_web_page_context.
    # NOTE(review): severity is assumed to sit alongside to/field inside the
    # relationships arguments - confirm against the dbt version in use.
    - relationships:
        to: ref('snowplow_web_page_context')
        field: page_view_id
        severity: warn
# snowplow_web_events_time: only page_view_id is declared; it is tested for
# uniqueness and for a relationship to snowplow_web_page_context.
# NOTE(review): no not_null test is declared on page_view_id here, unlike on
# snowplow_web_events - confirm whether that is intentional.
- name: snowplow_web_events_time
  columns:
  - name: page_view_id
    tests:
    - unique
    # NOTE(review): severity is assumed to sit alongside to/field inside the
    # relationships arguments - confirm against the dbt version in use.
    - relationships:
        to: ref('snowplow_web_page_context')
        field: page_view_id
        severity: warn
# snowplow_web_events_scroll_depth: only page_view_id is declared; it is
# tested for uniqueness and for a relationship to snowplow_web_page_context.
# NOTE(review): no not_null test is declared on page_view_id here, unlike on
# snowplow_web_events - confirm whether that is intentional.
- name: snowplow_web_events_scroll_depth
  columns:
  - name: page_view_id
    tests:
    - unique
    # NOTE(review): severity is assumed to sit alongside to/field inside the
    # relationships arguments - confirm against the dbt version in use.
    - relationships:
        to: ref('snowplow_web_page_context')
        field: page_view_id
        severity: warn
# snowplow_web_page_context: the target of the relationships tests declared
# on the snowplow_web_events* models in this file.
- name: snowplow_web_page_context
  # Model-level test over the column pair (page_view_id, root_id), using the
  # unique_combination_of_columns test from the dbt_utils package.
  tests:
  - dbt_utils.unique_combination_of_columns:
      combination_of_columns:
      - page_view_id
      - root_id
  columns:
  - name: page_view_id
    tests:
    - not_null

  # Declared without a description or column-level tests.
  - name: root_id
# snowplow_page_views: the model description is pulled from the docs block
# named "snowplow_page_views". Columns are grouped below by subject; the
# group headings are comments only and carry no meaning for dbt.
- name: snowplow_page_views
  description: '{{ doc("snowplow_page_views") }}'
  columns:
  # ---- User identifiers ----
  - name: user_custom_id
    description: Unique ID set by business, user_id atomic field
  - name: user_snowplow_domain_id
    description: User ID set by Snowplow using 1st party cookie
    tests:
    - not_null
  - name: user_snowplow_crossdomain_id
    description: User ID set by Snowplow using 3rd party cookie

  # ---- Session ----
  - name: session_id
    description: A visit / session identifier
    tests:
    - not_null
  # NOTE(review): the next four columns are declared without descriptions.
  - name: min_tstamp
  - name: max_tstamp
  - name: max_session_page_view_index
  - name: last_page_view_in_session
  - name: session_index
    description: A visit / session index
    tests:
    - not_null

  # ---- Page view identity and ordering ----
  - name: page_view_id
    description: Universally unique identifier
    tests:
    - unique
    - not_null
  - name: page_view_index
    description: A page view index
  - name: page_view_in_session_index
    description: A page view index within a single session

  # ---- Page view timing ----
  - name: page_view_start
    description: Timestamp for the start of the page view on your preferred clock
  - name: page_view_end
    description: Timestamp for the end of the page view on your preferred clock
  - name: page_view_start_local
    description: Timestamp for the start of the page view on the user's clock
  - name: page_view_end_local
    description: Timestamp for the end of the page view on the user's clock

  # ---- Engagement and scrolling ----
  - name: time_engaged_in_s
    description: Time spent by the user on the page
  - name: time_engaged_in_s_tier
    description: Range of time spent by the user on the page
  - name: horizontal_pixels_scrolled
    description: Distance the user scrolled horizontally in pixels
  - name: vertical_pixels_scrolled
    description: Distance the user scrolled vertically in pixels
  - name: horizontal_percentage_scrolled
    description: Percentage of page scrolled horizontally
  - name: vertical_percentage_scrolled
    description: Percentage of page scrolled vertically
  - name: vertical_percentage_scrolled_tier
    description: Range of percentage of page scrolled vertically
  - name: user_engaged
    description: Did the user engage with the page?

  # ---- Page ----
  - name: page_url
    description: The page URL
  - name: page_url_scheme
    description: Scheme aka protocol
  - name: page_url_host
    description: Host aka domain
  - name: page_url_port
    description: Port if specified, 80 if not
  - name: page_url_path
    description: Path to page
  - name: page_url_query
    description: Querystring
  - name: page_url_fragment
    description: Fragment aka anchor
  - name: page_title
    description: Web page title
  - name: page_width
    description: The page's width in pixels
  - name: page_height
    description: The page's height in pixels

  # ---- Referer ----
  - name: referer_url
    description: The referer URL
  - name: referer_url_scheme
    description: Referer scheme
  - name: referer_url_host
    description: Referer host
  - name: referer_url_port
    description: Referer port
  - name: referer_url_path
    description: Referer page path
  - name: referer_url_query
    description: Referer URL querystring
  - name: referer_url_fragment
    description: Referer URL fragment
  - name: referer_medium
    description: Type of referer
  - name: referer_source
    description: Name of referer if recognised
  - name: referer_term
    description: Keywords if source is a search engine

  # ---- Marketing ----
  - name: marketing_medium
    description: Type of traffic source
  - name: marketing_source
    description: The company / website where the traffic came from
  - name: marketing_term
    description: Any keywords associated with the referer
  - name: marketing_content
    description: The content of the ad. (Or an ID so that it can be looked up.)
  - name: marketing_campaign
    description: The campaign ID
  - name: marketing_click_id
    description: The click ID
  - name: marketing_network
    description: The ad network to which the click ID belongs

  # ---- Geography ----
  - name: geo_country
    description: ISO 3166-1 code for the country the visitor is located in
  - name: geo_region
    description: ISO-3166-2 code for country region the visitor is in
  - name: geo_region_name
    description: Visitor region name
  - name: geo_city
    description: City the visitor is in
  - name: geo_zipcode
    description: Postcode the visitor is in
  - name: geo_latitude
    description: Visitor location latitude
  - name: geo_longitude
    description: Visitor location longitude
  - name: geo_timezone
    description: Visitor timezone name

  # ---- IP ----
  - name: ip_address
    description: The IP address of the visitor
  - name: ip_isp
    description: Visitor's ISP
  - name: ip_organization
    description: Organization associated with the visitor's IP address - defaults to ISP name if none is found
  - name: ip_domain
    description: Second level domain name associated with the visitor's IP address
  - name: ip_net_speed
    description: Visitor's connection type

  # ---- Browser ----
  - name: browser
    description: The name and version of the visitor's browser
  - name: browser_name
    description: The name, or family, of the visitor's browser
  - name: browser_major_version
    description: Browser major version
  - name: browser_minor_version
    description: Browser minor version
  - name: browser_build_version
    description: Browser build version
  - name: browser_engine
    description: Browser rendering engine
  - name: browser_window_width
    description: Viewport width
  - name: browser_window_height
    description: Viewport height
  - name: browser_language
    description: Language the browser is set to

  # ---- Operating system ----
  - name: os
    description: The name and version of the visitor's OS
  - name: os_name
    description: The name of the visitor's OS
  - name: os_major_version
    description: OS major version
  - name: os_minor_version
    description: OS minor version
  - name: os_build_version
    description: OS build version
  - name: os_manufacturer
    description: OS manufacturer
  - name: os_timezone
    description: Time zone the OS is set to

  # ---- Device ----
  - name: device
    description: Device model
  - name: device_type
    description: Type of device
  - name: device_is_mobile
    description: Is the device mobile?

  # ---- Page load timings (milliseconds, per the _in_ms suffix) ----
  - name: redirect_time_in_ms
    description: Time to redirect the visitor
  - name: unload_time_in_ms
    description: Time to complete the unload event
  - name: app_cache_time_in_ms
    description: Time to fetch resource from relevant application cache
  - name: dns_time_in_ms
    description: Time to complete domain lookup
  - name: tcp_time_in_ms
    description: Time to establish connection
  - name: request_time_in_ms
    description: Time between the user agent sending a request and receiving the first byte of the response
  - name: response_time_in_ms
    description: Time to complete the response
  - name: processing_time_in_ms
    description: Processing time
  - name: dom_loading_to_interactive_time_in_ms
    description: Time for the current document readiness to change from 'loading' to 'interactive'
  - name: dom_interactive_to_complete_time_in_ms
    description: Time for the current document readiness to change from 'interactive' to 'complete'
  - name: onload_time_in_ms
    description: Time to complete the load event
  - name: total_time_in_ms
    description: Total time from navigation start to load event completion

  # ---- Application ----
  - name: app_id
    description: Application ID