-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathWastewater SQL Schema.r
395 lines (342 loc) · 7.01 KB
/
Wastewater SQL Schema.r
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
# Databricks notebook source
###### This code contains the up to date version of the ODM schema that is in production.
# COMMAND ----------
###### Aggregate tables - Derived based on ODM table
# COMMAND ----------
# DBTITLE 1,allSites - The table that contains information about ww daily signal average per replicate level assocaited with a given site
allSites {
collDT
name
healthReg
measure
fraction
datasetID
valavg
sampleID
MA7
sd_avg
Tests_performed
siteID
}
# COMMAND ----------
# DBTITLE 1,allSitesAdj- The table that contains information about the adjusted (based on Quality Flag) ww daily signal average per replicate level assocaited with a given site
allSitesAdj {
collDT
name
healthReg
measure
fraction
datasetID
valavg
sampleID
MA7
sd_avg
Tests_performed
siteID
}
# COMMAND ----------
###### ODM tables
# COMMAND ----------
# DBTITLE 1,Dataset - A report table for capturing details about data’s parental data set and data custodians. Supplying attribution for data collectors.
datasets {
parDatasetID
datasetID
name
license
descr
refLink
langID
funderCont
custodyCont
funderID
custodyID
notes
}
# COMMAND ----------
# DBTITLE 1,Infobase - subset of allsite table that is publishing on public health infobase
Infobase {
Date
Location
region
measureid
fractionid
viral_load
seven_day_rolling_avg
pruid
}
# COMMAND ----------
# DBTITLE 1,InfobaseTrend- The table that contains information about the trend flag assocaited with a given site
InfobaseTrend {
Location
measure
latestTrends
pruid
t_low
t_high
LatestLevel
Grouping
City
Province
Country
Viral_Activity_Level
}
# COMMAND ----------
# DBTITLE 1, measures - The table that contains information and details about a given measure adapt from verson 1 documentation
measures {
measureRepID
protocolID
sampleID
purposeID
polygonID
siteID
datasetID
measureSetRepID
compartment
specimenID
fraction
group
class
measure
value
unit
aggregation
nomenclature
index
measureLic
reportable
organizationID
contactID
refLink
}
# COMMAND ----------
# DBTITLE 1,samples - The table that contains information about a sample. A sample is defined as a representative volume of wastewater (or other forms of water or liquid), air, or surface area taken from a site. Samples can be combined, split, stored and reused.
samples {
sampleID
protocolID
organizationID
contactID
siteID
purposeID
saMaterial
datasetID
origin
repType
collType
collPer
collNum
pooled
collDT
collDTStart
collDTEnd
sentDate
recDate
reportable
lastEdited
notes
}
# COMMAND ----------
# DBTITLE 1,qualityReports - The table for recording the various quality metrics and indicators for samples and measures.
qualityReports {
quality
measureRepID
sampleID
measureSetRepID
qualityFlag
severity
notes
}
# COMMAND ----------
# DBTITLE 1,sites - The table that contains information about a site; the location where an environmental sample was taken. The site of an eviromental sample. Information in the site table does not regularly change. Consider using the MeasureReport table if the infomation changes often.
sites {
parSiteID
siteID
datasetID
polygonID
siteType
sampleShed
addressID
organizationID
contactID
name
descr
repOrg1
repOrg2
healthReg
popServ
geoLat
geoLong
geoEPSG
lastEdited
notes
}
# COMMAND ----------
# DBTITLE 1,StandardCurve - Table that contains the std curve information along with Lot number that serve for quantification
StandardCurve {
sampleID
N2_Curve_ID
PMMV_Curve_ID
CDCA_Curve_ID
CDCB_Curve_ID
RSVA_Curve_ID
RSVB_Curve_ID
LotNumber
}
# COMMAND ----------
###### ODM Dictionary tables - Theses tables are pulled from the ODM working group osfhome or page
# COMMAND ----------
# DBTITLE 1,parts - Look up table containing all parts in of the data model. Contains all parts, including self-referential parts.
parts {
partID
partLabel
partType
shortName
partDesc
partInstr
domain
specimenSet
compartmentSet
group
class
nomenclature
ontologyRef
latExp
mmaSet
unitSet
aggreationScale
aggregationSet
qualitySet
missingnessSet
status
changes
protocolSteps
protocolStepsRequired
protocolStepsOrder
protocolRelationships
protocolRelationshipsRequired
protocolRelationshipsOrder
measures
measuresRequired
measuresOrder
measureSets
measureSetsRequired
measureSetsOrder
datasets
datasetsRequired
datasetsOrder
sites
sitesRequired
sitesOrder
samples
samplesRequired
samplesOrder
addresses
addressesRequired
addressesOrder
contacts
contactsRequired
contactsOrder
organizations
organizationsRequired
organizationsOrder
instruments
instrumentsRequired
instrumentsOrder
polygons
polygonsRequired
polygonsOrder
languages
languagesRequired
languagesOrder
translations
translationsRequired
translationsOrder
parts
partsRequired
partsOrder
sets
setsRquired
setsOrder
qualityReports
qualityReportsRequired
qualityReportsOrder
sampleRelationships
sampleRelationshipsRequired
sampleRelationshipsOrder
protocols
protocolsRequired
protocolsOrder
countries
countriesRequired
countriesOrder
zones
zonesRequired
zonesOrder
refLink
dataType
minValue
maxValue
minLength
maxLength
}
# COMMAND ----------
# DBTITLE 1,countries - Look up table for the possible country inputs.
countries {
isoCode
isoCodeX
numCode
tld
nameEngl
nameOffical
sovereignity
countryExonym
capitalExonym
countryEndonym
capitalEndonym
langScript
phone
utc
utcDST
}
# COMMAND ----------
sets {
setID
setType
partID
partLabel
status
changes
notes
}
# COMMAND ----------
# DBTITLE 1,translations - Look up table for translations of the description, label, and instruction for all parts. The default language if a translation is not specified is English.
translations {
lang
part
partLabel
partDesc
partInstr
changes
notes
}
# COMMAND ----------
# DBTITLE 1,zones - Look up table for the possible sub-national region or zone inputs.
zones {
isoCode
isoZone
zoneName
}
# COMMAND ----------
# DBTITLE 1,languages - Look up table for all languages, used to give structure to the translation table.
languages {
lang
langFam
langName
natName
ISO6391
ISO6392B
ISO6392T
ISO6393
ISO6396
changes
notes
}