forked from datacontract/datacontract-specification
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdatacontract.init.yaml
109 lines (91 loc) · 2.08 KB
/
datacontract.init.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
# Starter data contract: fill in the required fields below and uncomment the
# optional ones as needed.
dataContractSpecification: 0.9.3
id: my-data-contract-id
# Contract metadata. `title` and `version` must be nested under `info`;
# at column 0 they would become unrelated top-level keys and leave `info` null.
info:
  title: My Data Contract
  version: 0.0.1
#  description:
#  owner:
#  contact:
#    name:
#    url:
#    email:
### servers
#servers:
#  production:
#    type: s3
#    location: s3://
#    format: parquet
#    delimiter: new_line
### terms
#terms:
#  usage:
#  limitations:
#  billing:
#  noticePeriod:
### models
# models:
#   my_model:
#     description:
#     type:
#     fields:
#       my_field:
#         type:
#         description:
### definitions
# definitions:
#   my_field:
#     domain:
#     name:
#     title:
#     type:
#     description:
#     example:
#     pii:
#     classification:
### examples
#examples:
#  - type: csv
#    model: my_model
#    data: |-
#      id,timestamp,amount
#      "1001","2023-09-09T08:30:00Z",2500
#      "1002","2023-09-08T15:45:00Z",1800
### servicelevels
#servicelevels:
#  availability:
#    description: The server is available during support hours
#    percentage: 99.9%
#  retention:
#    description: Data is retained for one year
#    period: P1Y
#    unlimited: false
#  latency:
#    description: Data is available within 25 hours after the order was placed
#    threshold: 25h
#    sourceTimestampField: orders.order_timestamp
#    processedTimestampField: orders.processed_timestamp
#  freshness:
#    description: The age of the youngest row in a table.
#    threshold: 25h
#    timestampField: orders.order_timestamp
#  frequency:
#    description: Data is delivered once a day
#    type: batch  # or streaming
#    interval: daily  # for batch: set either interval or cron
#    cron: 0 0 * * *  # for batch: set either cron or interval
#  support:
#    description: The data is available during typical business hours at headquarters
#    time: 9am to 5pm in EST on business days
#    responseTime: 1h
#  backup:
#    description: Data is backed up once a week, every Sunday at 0:00 UTC.
#    interval: weekly
#    cron: 0 0 * * 0
#    recoveryTime: 24 hours
#    recoveryPoint: 1 week
### quality
#quality:
#  type: SodaCL
#  specification:
#    checks for my_model: |-
#      - duplicate_count(id) = 0