forked from microbiomedata/nmdc-schema
-
Notifications
You must be signed in to change notification settings - Fork 0
/
nmdc.schema.json
3603 lines (3602 loc) · 147 KB
/
nmdc.schema.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
{
"$defs": {
"Activity": {
"additionalProperties": false,
"description": "a provence-generating activity",
"properties": {
"ended_at_time": {
"format": "date-time",
"type": "string"
},
"id": {
"description": "A unique identifier for a thing. Must be either a CURIE shorthand for a URI or a complete URI",
"type": "string"
},
"name": {
"description": "A human readable label for an entity",
"type": "string"
},
"started_at_time": {
"format": "date-time",
"type": "string"
},
"used": {
"type": "string"
},
"was_associated_with": {
"$ref": "#/$defs/Agent"
},
"was_informed_by": {
"type": "string"
}
},
"required": [
"id"
],
"title": "Activity",
"type": "object"
},
"Agent": {
"additionalProperties": false,
"description": "a provence-generating agent",
"properties": {
"acted_on_behalf_of": {
"$ref": "#/$defs/Agent"
},
"was_informed_by": {
"type": "string"
}
},
"required": [],
"title": "Agent",
"type": "object"
},
"AttributeValue": {
"additionalProperties": false,
"description": "The value for any value of a attribute for a sample. This object can hold both the un-normalized atomic value and the structured value",
"properties": {
"has_raw_value": {
"description": "The value that was specified for an annotation in raw form, i.e. a string. E.g. \"2 cm\" or \"2-4 cm\"",
"type": "string"
},
"type": {
"description": "An optional string that specified the type of object.",
"type": "string"
},
"was_generated_by": {
"type": "string"
}
},
"required": [],
"title": "AttributeValue",
"type": "object"
},
"Biosample": {
"additionalProperties": false,
"description": "A material sample. It may be environmental (encompassing many organisms) or isolate or tissue. An environmental sample containing genetic material from multiple individuals is commonly referred to as a biosample.",
"properties": {
"GOLD_sample_identifiers": {
"description": "identifiers for corresponding sample in GOLD",
"items": {
"type": "string"
},
"pattern": "^GOLD:Gb[0-9]+$",
"type": "array"
},
"INSDC_biosample_identifiers": {
"description": "identifiers for corresponding sample in INSDC",
"items": {
"type": "string"
},
"pattern": "^biosample:SAM[NED]([A-Z])?[0-9]+$",
"type": "array"
},
"INSDC_secondary_sample_identifiers": {
"description": "secondary identifiers for corresponding sample in INSDC",
"items": {
"type": "string"
},
"pattern": "^biosample:(E|D|S)RS[0-9]{6,}$",
"type": "array"
},
"add_date": {
"description": "The date on which the information was added to the database.",
"type": "string"
},
"agrochem_addition": {
"$ref": "#/$defs/QuantityValue",
"description": "Addition of fertilizers, pesticides, etc. - amount and time of applications"
},
"al_sat": {
"$ref": "#/$defs/QuantityValue",
"description": "Aluminum saturation (esp. For tropical soils)",
"pattern": "\\d+[.\\d+] \\S+"
},
"al_sat_meth": {
"$ref": "#/$defs/TextValue",
"description": "Reference or method used in determining Al saturation"
},
"alkalinity": {
"$ref": "#/$defs/QuantityValue",
"description": "Alkalinity, the ability of a solution to neutralize acids to the equivalence point of carbonate or bicarbonate",
"pattern": "\\d+[.\\d+] \\S+"
},
"alkalinity_method": {
"$ref": "#/$defs/TextValue",
"description": "Method used for alkalinity measurement"
},
"alkyl_diethers": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of alkyl diethers ",
"pattern": "\\d+[.\\d+] \\S+"
},
"alt": {
"$ref": "#/$defs/QuantityValue",
"description": "Altitude is a term used to identify heights of objects such as airplanes, space shuttles, rockets, atmospheric balloons and heights of places such as atmospheric layers and clouds. It is used to measure the height of an object which is above the earthbs surface. In this context, the altitude measurement is the vertical distance between the earth's surface above sea level and the sampled position in the air",
"pattern": "\\d+[.\\d+] \\S+"
},
"alternative_identifiers": {
"description": "A list of alternative identifiers for the entity.",
"items": {
"type": "string"
},
"type": "array"
},
"aminopept_act": {
"$ref": "#/$defs/QuantityValue",
"description": "Measurement of aminopeptidase activity",
"pattern": "\\d+[.\\d+] \\S+"
},
"ammonium": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of ammonium in the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"annual_precpt": {
"$ref": "#/$defs/QuantityValue",
"description": "The average of all annual precipitation values known, or an estimated equivalent value derived by such methods as regional indexes or Isohyetal maps.",
"pattern": "\\d+[.\\d+] \\S+"
},
"annual_temp": {
"$ref": "#/$defs/QuantityValue",
"description": "Mean annual temperature",
"pattern": "\\d+[.\\d+] \\S+"
},
"bacteria_carb_prod": {
"$ref": "#/$defs/QuantityValue",
"description": "Measurement of bacterial carbon production",
"pattern": "\\d+[.\\d+] \\S+"
},
"bishomohopanol": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of bishomohopanol ",
"pattern": "\\d+[.\\d+] \\S+"
},
"bromide": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of bromide ",
"pattern": "\\d+[.\\d+] \\S+"
},
"calcium": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of calcium in the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"carb_nitro_ratio": {
"$ref": "#/$defs/QuantityValue",
"description": "Ratio of amount or concentrations of carbon to nitrogen",
"pattern": "\\d+[.\\d+] \\S+"
},
"chem_administration": {
"$ref": "#/$defs/ControlledTermValue",
"description": "List of chemical compounds administered to the host or site where sampling occurred, and when (e.g. Antibiotics, n fertilizer, air filter); can include multiple compounds. For chemical entities of biological interest ontology (chebi) (v 163), http://purl.bioontology.org/ontology/chebi"
},
"chloride": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of chloride in the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"chlorophyll": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of chlorophyll",
"pattern": "\\d+[.\\d+] \\S+"
},
"collection_date": {
"$ref": "#/$defs/TimestampValue",
"description": "The time of sampling, either as an instance (single point in time) or interval. In case no exact time is available, the date/time can be right truncated i.e. all of these are valid times: 2008-01-23T19:23:10+00:00; 2008-01-23T19:23:10; 2008-01-23; 2008-01; 2008; Except: 2008-01; 2008 all are ISO8601 compliant"
},
"community": {
"type": "string"
},
"crop_rotation": {
"$ref": "#/$defs/TextValue",
"description": "Whether or not crop is rotated, and if yes, rotation schedule"
},
"cur_land_use": {
"$ref": "#/$defs/TextValue",
"description": "Present state of sample site",
"pattern": "[cities|farmstead|industrial areas|roads\\/railroads|rock|sand|gravel|mudflats|salt flats|badlands|permanent snow or ice|saline seeps|mines\\/quarries|oil waste areas|small grains|row crops|vegetable crops|horticultural plants (e.g. tulips)|marshlands (grass,sedges,rushes)|tundra (mosses,lichens)|rangeland|pastureland (grasslands used for livestock grazing)|hayland|meadows (grasses,alfalfa,fescue,bromegrass,timothy)|shrub land (e.g. mesquite,sage\\-brush,creosote bush,shrub oak,eucalyptus)|successional shrub land (tree saplings,hazels,sumacs,chokecherry,shrub dogwoods,blackberries)|shrub crops (blueberries,nursery ornamentals,filberts)|vine crops (grapes)|conifers (e.g. pine,spruce,fir,cypress)|hardwoods (e.g. oak,hickory,elm,aspen)|intermixed hardwood and conifers|tropical (e.g. mangrove,palms)|rainforest (evergreen forest receiving >406 cm annual rainfall)|swamp (permanent or semi\\-permanent water body dominated by woody plants)|crop trees (nuts,fruit,christmas trees,nursery trees)]"
},
"cur_vegetation": {
"$ref": "#/$defs/TextValue",
"description": "Vegetation classification from one or more standard classification systems, or agricultural crop"
},
"cur_vegetation_meth": {
"$ref": "#/$defs/TextValue",
"description": "Reference or method used in vegetation classification "
},
"density": {
"$ref": "#/$defs/QuantityValue",
"description": "Density of the sample, which is its mass per unit volume (aka volumetric mass density)",
"pattern": "\\d+[.\\d+] \\S+"
},
"depth": {
"$ref": "#/$defs/QuantityValue",
"description": "Depth is defined as the vertical distance below local surface, e.g. For sediment or soil samples depth is measured from sediment or soil surface, respectively. Depth can be reported as an interval for subsurface samples"
},
"depth2": {
"$ref": "#/$defs/QuantityValue"
},
"description": {
"description": "a human-readable description of a thing",
"type": "string"
},
"diss_carb_dioxide": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of dissolved carbon dioxide in the sample or liquid portion of the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"diss_hydrogen": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of dissolved hydrogen",
"pattern": "\\d+[.\\d+] \\S+"
},
"diss_inorg_carb": {
"$ref": "#/$defs/QuantityValue",
"description": "Dissolved inorganic carbon concentration in the sample, typically measured after filtering the sample using a 0.45 micrometer filter",
"pattern": "\\d+[.\\d+] \\S+"
},
"diss_inorg_phosp": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of dissolved inorganic phosphorus in the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"diss_org_carb": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of dissolved organic carbon in the sample, liquid portion of the sample, or aqueous phase of the fluid",
"pattern": "\\d+[.\\d+] \\S+"
},
"diss_org_nitro": {
"$ref": "#/$defs/QuantityValue",
"description": "Dissolved organic nitrogen concentration measured as; total dissolved nitrogen - NH4 - NO3 - NO2",
"pattern": "\\d+[.\\d+] \\S+"
},
"diss_oxygen": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of dissolved oxygen",
"pattern": "\\d+[.\\d+] \\S+"
},
"drainage_class": {
"$ref": "#/$defs/TextValue",
"description": "Drainage classification from a standard system such as the USDA system",
"pattern": "[very poorly|poorly|somewhat poorly|moderately well|well|excessively drained]"
},
"ecosystem": {
"description": "An ecosystem is a combination of a physical environment (abiotic factors) and all the organisms (biotic factors) that interact with this environment. Ecosystem is in position 1/5 in a GOLD path.",
"type": "string"
},
"ecosystem_category": {
"description": "Ecosystem categories represent divisions within the ecosystem based on specific characteristics of the environment from where an organism or sample is isolated. Ecosystem category is in position 2/5 in a GOLD path.",
"type": "string"
},
"ecosystem_subtype": {
"description": "Ecosystem subtypes represent further subdivision of Ecosystem types into more distinct subtypes. Ecosystem subtype is in position 4/5 in a GOLD path.",
"type": "string"
},
"ecosystem_type": {
"description": "Ecosystem types represent things having common characteristics within the Ecosystem Category. These common characteristics based grouping is still broad but specific to the characteristics of a given environment. Ecosystem type is in position 3/5 in a GOLD path.",
"type": "string"
},
"elev": {
"$ref": "#/$defs/QuantityValue",
"description": "Elevation of the sampling site is its height above a fixed reference point, most commonly the mean sea level. Elevation is mainly used when referring to points on the earth's surface, while altitude is used for points above the surface, such as an aircraft in flight or a spacecraft in orbit",
"pattern": "\\d+[.\\d+] \\S+"
},
"env_broad_scale": {
"$ref": "#/$defs/ControlledTermValue",
"description": "In this field, report which major environmental system your sample or specimen came from. The systems identified should have a coarse spatial grain, to provide the general environmental context of where the sampling was done (e.g. were you in the desert or a rainforest?). We recommend using subclasses of ENVOUs biome class: http://purl.obolibrary.org/obo/ENVO_00000428. Format (one term): termLabel [termID], Format (multiple terms): termLabel [termID]|termLabel [termID]|termLabel [termID]. Example: Annotating a water sample from the photic zone in middle of the Atlantic Ocean, consider: oceanic epipelagic zone biome [ENVO:01000033]. Example: Annotating a sample from the Amazon rainforest consider: tropical moist broadleaf forest biome [ENVO:01000228]. If needed, request new terms on the ENVO tracker, identified here: http://www.obofoundry.org/ontology/envo.html",
"pattern": ".* \\S+:\\S+"
},
"env_local_scale": {
"$ref": "#/$defs/ControlledTermValue",
"description": "In this field, report the entity or entities which are in your sample or specimenUs local vicinity and which you believe have significant causal influences on your sample or specimen. Please use terms that are present in ENVO and which are of smaller spatial grain than your entry for env_broad_scale. Format (one term): termLabel [termID]; Format (multiple terms): termLabel [termID]|termLabel [termID]|termLabel [termID]. Example: Annotating a pooled sample taken from various vegetation layers in a forest consider: canopy [ENVO:00000047]|herb and fern layer [ENVO:01000337]|litter layer [ENVO:01000338]|understory [01000335]|shrub layer [ENVO:01000336]. If needed, request new terms on the ENVO tracker, identified here: http://www.obofoundry.org/ontology/envo.html",
"pattern": ".* \\S+:\\S+"
},
"env_medium": {
"$ref": "#/$defs/ControlledTermValue",
"description": "In this field, report which environmental material or materials (pipe separated) immediately surrounded your sample or specimen prior to sampling, using one or more subclasses of ENVOUs environmental material class: http://purl.obolibrary.org/obo/ENVO_00010483. Format (one term): termLabel [termID]; Format (multiple terms): termLabel [termID]|termLabel [termID]|termLabel [termID]. Example: Annotating a fish swimming in the upper 100 m of the Atlantic Ocean, consider: ocean water [ENVO:00002151]. Example: Annotating a duck on a pond consider: pond water [ENVO:00002228]|air ENVO_00002005. If needed, request new terms on the ENVO tracker, identified here: http://www.obofoundry.org/ontology/envo.html",
"pattern": ".* \\S+:\\S+"
},
"env_package": {
"$ref": "#/$defs/TextValue",
"description": "MIxS extension for reporting of measurements and observations obtained from one or more of the environments where the sample was obtained. All environmental packages listed here are further defined in separate subtables. By giving the name of the environmental package, a selection of fields can be made from the subtables and can be reported",
"pattern": "[air|built environment|host\\-associated|human\\-associated|human\\-skin|human\\-oral|human\\-gut|human\\-vaginal|hydrocarbon resources\\-cores|hydrocarbon resources\\-fluids\\/swabs|microbial mat\\/biofilm|misc environment|plant\\-associated|sediment|soil|wastewater\\/sludge|water]"
},
"extreme_event": {
"$ref": "#/$defs/TimestampValue",
"description": "Unusual physical events that may have affected microbial populations"
},
"fao_class": {
"$ref": "#/$defs/TextValue",
"description": "Soil classification from the FAO World Reference Database for Soil Resources. The list can be found at http://www.fao.org/nr/land/sols/soil/wrb-soil-maps/reference-groups",
"pattern": "[Acrisols|Andosols|Arenosols|Cambisols|Chernozems|Ferralsols|Fluvisols|Gleysols|Greyzems|Gypsisols|Histosols|Kastanozems|Lithosols|Luvisols|Nitosols|Phaeozems|Planosols|Podzols|Podzoluvisols|Rankers|Regosols|Rendzinas|Solonchaks|Solonetz|Vertisols|Yermosols]"
},
"fire": {
"$ref": "#/$defs/TimestampValue",
"description": "Historical and/or physical evidence of fire"
},
"flooding": {
"$ref": "#/$defs/TimestampValue",
"description": "Historical and/or physical evidence of flooding"
},
"geo_loc_name": {
"$ref": "#/$defs/TextValue",
"description": "The geographical origin of the sample as defined by the country or sea name followed by specific region name. Country or sea names should be chosen from the INSDC country list (http://insdc.org/country.html), or the GAZ ontology (v 1.512) (http://purl.bioontology.org/ontology/GAZ)"
},
"glucosidase_act": {
"$ref": "#/$defs/QuantityValue",
"description": "Measurement of glucosidase activity",
"pattern": "\\d+[.\\d+] \\S+"
},
"habitat": {
"type": "string"
},
"heavy_metals": {
"$ref": "#/$defs/QuantityValue",
"description": "Heavy metals present and concentrationsany drug used by subject and the frequency of usage; can include multiple heavy metals and concentrations"
},
"heavy_metals_meth": {
"$ref": "#/$defs/TextValue",
"description": "Reference or method used in determining heavy metals"
},
"horizon": {
"$ref": "#/$defs/TextValue",
"description": "Specific layer in the land area which measures parallel to the soil surface and possesses physical characteristics which differ from the layers above and beneath",
"pattern": "[O horizon|A horizon|E horizon|B horizon|C horizon|R layer|Permafrost]"
},
"horizon_meth": {
"$ref": "#/$defs/TextValue",
"description": "Reference or method used in determining the horizon"
},
"host_name": {
"type": "string"
},
"id": {
"description": "A unique identifier for a thing. Must be either a CURIE shorthand for a URI or a complete URI",
"type": "string"
},
"identifier": {
"type": "string"
},
"lat_lon": {
"$ref": "#/$defs/GeolocationValue",
"description": "This is currently a required field but it's not clear if this should be required for human hosts",
"pattern": "\\d+[.\\d+] \\d+[.\\d+]"
},
"link_addit_analys": {
"$ref": "#/$defs/TextValue",
"description": "Link to additional analysis results performed on the sample"
},
"link_class_info": {
"$ref": "#/$defs/TextValue",
"description": "Link to digitized soil maps or other soil classification information"
},
"link_climate_info": {
"$ref": "#/$defs/TextValue",
"description": "Link to climate resource"
},
"local_class": {
"$ref": "#/$defs/TextValue",
"description": "Soil classification based on local soil classification system"
},
"local_class_meth": {
"$ref": "#/$defs/TextValue",
"description": "Reference or method used in determining the local soil classification "
},
"location": {
"type": "string"
},
"magnesium": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of magnesium in the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"mean_frict_vel": {
"$ref": "#/$defs/QuantityValue",
"description": "Measurement of mean friction velocity",
"pattern": "\\d+[.\\d+] \\S+"
},
"mean_peak_frict_vel": {
"$ref": "#/$defs/QuantityValue",
"description": "Measurement of mean peak friction velocity",
"pattern": "\\d+[.\\d+] \\S+"
},
"microbial_biomass": {
"$ref": "#/$defs/QuantityValue",
"description": "The part of the organic matter in the soil that constitutes living microorganisms smaller than 5-10 micrometer. If you keep this, you would need to have correction factors used for conversion to the final units",
"pattern": "\\d+[.\\d+] \\S+"
},
"microbial_biomass_meth": {
"$ref": "#/$defs/TextValue",
"description": "Reference or method used in determining microbial biomass"
},
"misc_param": {
"$ref": "#/$defs/QuantityValue",
"description": "Any other measurement performed or parameter collected, that is not listed here"
},
"mod_date": {
"description": "The last date on which the database information was modified.",
"type": "string"
},
"n_alkanes": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of n-alkanes; can include multiple n-alkanes"
},
"name": {
"description": "A human readable label for an entity",
"type": "string"
},
"ncbi_taxonomy_name": {
"type": "string"
},
"nitrate": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of nitrate in the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"nitrite": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of nitrite in the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"org_matter": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of organic matter ",
"pattern": "\\d+[.\\d+] \\S+"
},
"org_nitro": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of organic nitrogen",
"pattern": "\\d+[.\\d+] \\S+"
},
"organism_count": {
"$ref": "#/$defs/QuantityValue",
"description": "Total cell count of any organism (or group of organisms) per gram, volume or area of sample, should include name of organism followed by count. The method that was used for the enumeration (e.g. qPCR, atp, mpn, etc.) Should also be provided. (example: total prokaryotes; 3.5e7 cells per ml; qpcr)"
},
"oxy_stat_samp": {
"$ref": "#/$defs/TextValue",
"description": "Oxygenation status of sample",
"pattern": "[aerobic|anaerobic|other]"
},
"part_of": {
"description": "Links a resource to another resource that either logically or physically includes it.",
"items": {
"type": "string"
},
"type": "array"
},
"part_org_carb": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of particulate organic carbon",
"pattern": "\\d+[.\\d+] \\S+"
},
"perturbation": {
"$ref": "#/$defs/TextValue",
"description": "Type of perturbation, e.g. chemical administration, physical disturbance, etc., coupled with perturbation regimen including how many times the perturbation was repeated, how long each perturbation lasted, and the start and end time of the entire perturbation period; can include multiple perturbation types"
},
"petroleum_hydrocarb": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of petroleum hydrocarbon",
"pattern": "\\d+[.\\d+] \\S+"
},
"ph": {
"$ref": "#/$defs/QuantityValue",
"description": "Ph measurement of the sample, or liquid portion of sample, or aqueous phase of the fluid",
"pattern": "\\d+[.\\d+]"
},
"ph_meth": {
"$ref": "#/$defs/TextValue",
"description": "Reference or method used in determining ph"
},
"phaeopigments": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of phaeopigments; can include multiple phaeopigments"
},
"phosplipid_fatt_acid": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of phospholipid fatty acids; can include multiple values"
},
"pool_dna_extracts": {
"$ref": "#/$defs/TextValue",
"description": "Indicate whether multiple DNA extractions were mixed. If the answer yes, the number of extracts that were pooled should be given"
},
"potassium": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of potassium in the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"pressure": {
"$ref": "#/$defs/QuantityValue",
"description": "Pressure to which the sample is subject to, in atmospheres",
"pattern": "\\d+[.\\d+] \\S+"
},
"previous_land_use": {
"$ref": "#/$defs/TextValue",
"description": "Previous land use and dates"
},
"previous_land_use_meth": {
"$ref": "#/$defs/TextValue",
"description": "Reference or method used in determining previous land use and dates"
},
"profile_position": {
"$ref": "#/$defs/TextValue",
"description": "Cross-sectional position in the hillslope where sample was collected.sample area position in relation to surrounding areas",
"pattern": "[summit|shoulder|backslope|footslope|toeslope]"
},
"proport_woa_temperature": {
"type": "string"
},
"redox_potential": {
"$ref": "#/$defs/QuantityValue",
"description": "Redox potential, measured relative to a hydrogen cell, indicating oxidation or reduction potential",
"pattern": "\\d+[.\\d+] \\S+"
},
"salinity": {
"$ref": "#/$defs/QuantityValue",
"description": "Salinity is the total concentration of all dissolved salts in a water sample. While salinity can be measured by a complete chemical analysis, this method is difficult and time consuming. More often, it is instead derived from the conductivity measurement. This is known as practical salinity. These derivations compare the specific conductance of the sample to a salinity standard such as seawater",
"pattern": "\\d+[.\\d+] \\S+"
},
"salinity_category": {
"description": "Categorcial description of the sample's salinity. Examples: halophile, halotolerant, hypersaline, huryhaline",
"type": "string"
},
"salinity_meth": {
"$ref": "#/$defs/TextValue",
"description": "Reference or method used in determining salinity"
},
"samp_collect_device": {
"$ref": "#/$defs/TextValue",
"description": "The method or device employed for collecting the sample"
},
"samp_mat_process": {
"$ref": "#/$defs/ControlledTermValue",
"description": "Any processing applied to the sample during or after retrieving the sample from environment. This field accepts OBI, for a browser of OBI (v 2018-02-12) terms please see http://purl.bioontology.org/ontology/OBI"
},
"samp_store_dur": {
"$ref": "#/$defs/TextValue",
"description": "Duration for which the sample was stored"
},
"samp_store_loc": {
"$ref": "#/$defs/TextValue",
"description": "Location at which sample was stored, usually name of a specific freezer/room"
},
"samp_store_temp": {
"$ref": "#/$defs/QuantityValue",
"description": "Temperature at which sample was stored, e.g. -80 degree Celsius",
"pattern": "\\d+[.\\d+] \\S+"
},
"samp_vol_we_dna_ext": {
"$ref": "#/$defs/QuantityValue",
"description": "Volume (ml), weight (g) of processed sample, or surface area swabbed from sample for DNA extraction",
"pattern": "\\d+[.\\d+] \\S+"
},
"sample_collection_site": {
"type": "string"
},
"season_precpt": {
"$ref": "#/$defs/QuantityValue",
"description": "The average of all seasonal precipitation values known, or an estimated equivalent value derived by such methods as regional indexes or Isohyetal maps.",
"pattern": "\\d+[.\\d+] \\S+"
},
"season_temp": {
"$ref": "#/$defs/QuantityValue",
"description": "Mean seasonal temperature",
"pattern": "\\d+[.\\d+] \\S+"
},
"sieving": {
"$ref": "#/$defs/QuantityValue",
"description": "Collection design of pooled samples and/or sieve size and amount of sample sieved "
},
"size_frac_low": {
"$ref": "#/$defs/QuantityValue",
"description": "Refers to the mesh/pore size used to pre-filter/pre-sort the sample. Materials larger than the size threshold are excluded from the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"size_frac_up": {
"$ref": "#/$defs/QuantityValue",
"description": "Refers to the mesh/pore size used to retain the sample. Materials smaller than the size threshold are excluded from the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"slope_aspect": {
"$ref": "#/$defs/QuantityValue",
"description": "The direction a slope faces. While looking down a slope use a compass to record the direction you are facing (direction or degrees); e.g., nw or 315 degrees. This measure provides an indication of sun and wind exposure that will influence soil temperature and evapotranspiration.",
"pattern": "\\d+[.\\d+] \\S+"
},
"slope_gradient": {
"$ref": "#/$defs/QuantityValue",
"description": "Commonly called 'slope'. The angle between ground surface and a horizontal line (in percent). This is the direction that overland water would flow. This measure is usually taken with a hand level meter or clinometer",
"pattern": "\\d+[.\\d+] \\S+"
},
"sodium": {
"$ref": "#/$defs/QuantityValue",
"description": "Sodium concentration in the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"soil_type": {
"$ref": "#/$defs/TextValue",
"description": "Soil series name or other lower-level classification"
},
"soil_type_meth": {
"$ref": "#/$defs/TextValue",
"description": "Reference or method used in determining soil series name or other lower-level classification"
},
"soluble_iron_micromol": {
"type": "string"
},
"specific_ecosystem": {
"description": "Specific ecosystems represent specific features of the environment like aphotic zone in an ocean or gastric mucosa within a host digestive system. Specific ecosystem is in position 5/5 in a GOLD path.",
"type": "string"
},
"store_cond": {
"$ref": "#/$defs/TextValue",
"description": "Explain how and for how long the soil sample was stored before DNA extraction"
},
"subsurface_depth": {
"$ref": "#/$defs/QuantityValue"
},
"subsurface_depth2": {
"$ref": "#/$defs/QuantityValue"
},
"sulfate": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of sulfate in the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"sulfide": {
"$ref": "#/$defs/QuantityValue",
"description": "Concentration of sulfide in the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"temp": {
"$ref": "#/$defs/QuantityValue",
"description": "Temperature of the sample at the time of sampling",
"pattern": "\\d+[.\\d+] \\S+"
},
"texture": {
"$ref": "#/$defs/QuantityValue",
"description": "The relative proportion of different grain sizes of mineral particles in a soil, as described using a standard system; express as % sand (50 um to 2 mm), silt (2 um to 50 um), and clay (<2 um) with textural name (e.g., silty clay loam) optional.",
"pattern": "\\d+[.\\d+] \\S+"
},
"texture_meth": {
"$ref": "#/$defs/TextValue",
"description": "Reference or method used in determining soil texture"
},
"tidal_stage": {
"$ref": "#/$defs/TextValue",
"description": "Stage of tide",
"pattern": "[low tide|ebb tide|flood tide|high tide]"
},
"tillage": {
"$ref": "#/$defs/TextValue",
"description": "Note method(s) used for tilling",
"pattern": "[drill|cutting disc|ridge till|strip tillage|zonal tillage|chisel|tined|mouldboard|disc plough]"
},
"tot_carb": {
"$ref": "#/$defs/QuantityValue",
"description": "Total carbon content",
"pattern": "\\d+[.\\d+] \\S+"
},
"tot_depth_water_col": {
"$ref": "#/$defs/QuantityValue",
"description": "Measurement of total depth of water column",
"pattern": "\\d+[.\\d+] \\S+"
},
"tot_diss_nitro": {
"$ref": "#/$defs/QuantityValue",
"description": "Total dissolved nitrogen concentration, reported as nitrogen, measured by: total dissolved nitrogen = NH4 + NO3NO2 + dissolved organic nitrogen",
"pattern": "\\d+[.\\d+] \\S+"
},
"tot_nitro_content": {
"$ref": "#/$defs/QuantityValue",
"description": "Total nitrogen content of the sample",
"pattern": "\\d+[.\\d+] \\S+"
},
"tot_nitro_content_meth": {
"$ref": "#/$defs/TextValue",
"description": "Reference or method used in determining the total nitrogen"
},
"tot_org_c_meth": {
"$ref": "#/$defs/TextValue",
"description": "Reference or method used in determining total organic carbon"
},
"tot_org_carb": {
"$ref": "#/$defs/QuantityValue",
"description": "Definition for soil: total organic carbon content of the soil, definition otherwise: total organic carbon content",
"pattern": "\\d+[.\\d+] \\S+"
},
"tot_phosp": {
"$ref": "#/$defs/QuantityValue",
"description": "Total phosphorus concentration in the sample, calculated by: total phosphorus = total dissolved phosphorus + particulate phosphorus",
"pattern": "\\d+[.\\d+] \\S+"
},
"type": {
"description": "An optional string that specifies the type of object. This is used to allow for searches for different kinds of objects.",
"type": "string"
},
"water_content": {
"$ref": "#/$defs/QuantityValue",
"description": "Water content measurement",
"pattern": "\\d+[.\\d+] \\S+"
},
"water_content_soil_meth": {
"$ref": "#/$defs/TextValue",
"description": "Reference or method used in determining the water content of soil"
}
},
"required": [
"id",
"part_of",
"env_broad_scale",
"env_local_scale",
"env_medium"
],
"title": "Biosample",
"type": "object"
},
"BiosampleProcessing": {
"additionalProperties": false,
"description": "A process that takes one or more biosamples as inputs and generates one or more outputs. Examples of outputs include samples cultivated from another sample or data objects created by instrument runs.",
"properties": {
"alternative_identifiers": {
"description": "A list of alternative identifiers for the entity.",
"items": {
"type": "string"
},
"type": "array"
},
"description": {
"description": "a human-readable description of a thing",
"type": "string"
},
"has_input": {
"description": "An input to a process.",
"items": {
"type": "string"
},
"type": "array"
},
"id": {
"description": "A unique identifier for a thing. Must be either a CURIE shorthand for a URI or a complete URI",
"type": "string"
},
"name": {
"description": "A human readable label for an entity",
"type": "string"
}
},
"required": [
"id"
],
"title": "BiosampleProcessing",
"type": "object"
},
"BooleanValue": {
"additionalProperties": false,
"description": "A value that is a boolean",
"properties": {
"has_boolean_value": {
"description": "Links a quantity value to a boolean",
"type": "boolean"
},
"has_raw_value": {
"description": "The value that was specified for an annotation in raw form, i.e. a string. E.g. \"2 cm\" or \"2-4 cm\"",
"type": "string"
},
"type": {
"description": "An optional string that specifies the type of object.",
"type": "string"
},
"was_generated_by": {
"type": "string"
}
},
"required": [],
"title": "BooleanValue",
"type": "object"
},
"ChemicalEntity": {
"additionalProperties": false,
"description": "An atom or molecule that can be represented with a chemical formula. Include lipids, glycans, natural products, drugs. There may be different terms for distinct acid-base forms, protonation states",
"properties": {
"alternative_identifiers": {
"description": "A list of alternative identifiers for the entity.",
"items": {
"type": "string"
},
"type": "array"
},
"chemical_formula": {
"description": "A generic grouping for molecular formulae and empirical formulae",
"type": "string"
},
"description": {
"description": "a human-readable description of a thing",
"type": "string"
},
"id": {
"description": "A unique identifier for a thing. Must be either a CURIE shorthand for a URI or a complete URI",
"type": "string"
},
"inchi": {
"type": "string"
},
"inchi_key": {
"type": "string"
},
"name": {
"description": "A human readable label for an entity",
"type": "string"
},
"smiles": {
"description": "A string encoding of a molecular graph, no chiral or isotopic information. There are usually a large number of valid SMILES which represent a given structure. For example, CCO, OCC and C(O)C all specify the structure of ethanol.",
"items": {
"type": "string"
},
"type": "array"
}
},
"required": [
"id"
],
"title": "ChemicalEntity",
"type": "object"
},
"ControlledTermValue": {
"additionalProperties": false,
"description": "A controlled term or class from an ontology",
"properties": {
"has_raw_value": {
"description": "The value that was specified for an annotation in raw form, i.e. a string. E.g. \"2 cm\" or \"2-4 cm\"",
"type": "string"
},
"term": {
"$ref": "#/$defs/OntologyClass",
"description": "pointer to an ontology class"
},
"type": {
"description": "An optional string that specifies the type of object.",
"type": "string"
},
"was_generated_by": {
"type": "string"
}
},
"required": [],
"title": "ControlledTermValue",
"type": "object"
},
"CreditAssociation": {
"additionalProperties": false,
"description": "This class supports binding associated researchers to studies. There will be at least a slot for a CRediT Contributor Role (https://casrai.org/credit/) and for a person value. Specifically, see the associated researchers tab on the NMDC_SampleMetadata-V4_CommentsForUpdates at https://docs.google.com/spreadsheets/d/1INlBo5eoqn2efn4H2P2i8rwRBtnbDVTqXrochJEAPko/edit#gid=0",
"properties": {
"applied_role": {
"$ref": "#/$defs/CreditEnum"
},
"applied_roles": {
"items": {
"$ref": "#/$defs/CreditEnum"
},
"type": "array"
},
"applies_to_person": {
"$ref": "#/$defs/PersonValue"
},
"type": {
"description": "An optional string that specifies the type of object. This is used to allow for searches for different kinds of objects.",
"type": "string"
}
},
"required": [
"applies_to_person",
"applied_roles"
],
"title": "CreditAssociation",
"type": "object"
},
"CreditEnum": {
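"description": "Contributor roles that can be applied to a person, taken from the CRediT Contributor Role taxonomy (https://casrai.org/credit/), plus Principal Investigator.",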
"enum": [
"Conceptualization",
"Data curation",
"Formal Analysis",
"Funding acquisition",
"Investigation",
"Methodology",
"Project administration",
"Resources",
"Software",
"Supervision",
"Validation",
"Visualization",
"Writing original draft",
"Writing review and editing",
"Principal Investigator"
],
"title": "CreditEnum",
"type": "string"
},
"DataObject": {
"additionalProperties": false,
"description": "An object that primarily consists of symbols that represent information. Files, records, and omics data are examples of data objects.",
"properties": {
"alternative_identifiers": {
"description": "A list of alternative identifiers for the entity.",
"items": {
"type": "string"
},
"type": "array"
},
"compression_type": {
"description": "If provided, specifies the compression type",
"type": "string"
},
"data_object_type": {
"$ref": "#/$defs/FileTypeEnum",
"description": "The type of file represented by the data object."
},
"description": {
"description": "a human-readable description of a thing",
"type": "string"
},
"file_size_bytes": {
"description": "Size of the file in bytes",
"type": "integer"
},
"id": {
"description": "A unique identifier for a thing. Must be either a CURIE shorthand for a URI or a complete URI",
"type": "string"
},
"md5_checksum": {
"description": "MD5 checksum of file (pre-compressed)",
"type": "string"
},
"name": {
"description": "A human readable label for an entity",
"type": "string"
},
"type": {
"description": "An optional string that specifies the type of object. This is used to allow for searches for different kinds of objects.",
"type": "string"
},
"url": {
"type": "string"
},
"was_generated_by": {
"type": "string"
}
},
"required": [
"id",
"name",
"description"
],
"title": "DataObject",
"type": "object"
},
"Database": {
"additionalProperties": false,
"description": "An abstract holder for any set of metadata and data. It does not need to correspond to an actual managed database top level holder class. When translated to JSON-Schema this is the 'root' object. It should contain pointers to other objects of interest",
"properties": {
"activity_set": {