Skip to content

Commit

Permalink
Merge pull request #1248 from snowplow/release/r139
Browse files Browse the repository at this point in the history
Release R139
  • Loading branch information
jbeemster authored Jan 12, 2023
2 parents 812dab5 + e67f4ec commit 1861799
Show file tree
Hide file tree
Showing 2 changed files with 161 additions and 0 deletions.
4 changes: 4 additions & 0 deletions CHANGELOG
Original file line number Diff line number Diff line change
@@ -1,3 +1,7 @@
Release 139 (2023-01-09)
------------------------
Add com.snowplowanalytics.snowplow.storage/shredding_complete/jsonschema/2-0-1 (close #1247)

Release 138 (2022-12-20)
------------------------
Add com.snowplowanalytics.snowplow/consent_preferences/jsonschema/1-0-0 (close #1246)
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,157 @@
{
"$schema": "http://iglucentral.com/schemas/com.snowplowanalytics.self-desc/schema/jsonschema/1-0-0#",
"description": "Message with batch metadata, passed from Shredder to Loader",
"self": {
"vendor": "com.snowplowanalytics.snowplow.storage",
"name": "shredding_complete",
"format": "jsonschema",
"version": "2-0-1"
},
"type": "object",
"properties": {
"base": {
"description": "Blob storage path to the root of the batch",
"type": "string",
"format": "uri",
"maxLength": 1024
},
"compression": {
"description": "File compression type",
"enum": ["GZIP", "NONE"]
},
"typesInfo": {
"description": "Info about schemas used in events and output formats in the respective batch",
"type": "object",
"oneOf": [
{
"properties": {
"transformation": {
"description": "Type of the transformation",
"enum": ["SHREDDED"]
},
"types": {
"description": "Set of Iglu URIs and the format they were shredded into",
"type": "array",
"items": {
"properties": {
"schemaKey": {
"description": "Iglu URI",
"type": "string",
"maxLength": 256
},
"format": {
"description": "File format into which the entities were shredded",
"enum": ["TSV", "JSON"]
},
"snowplowEntity": {
"description": "Type of the self-describing JSONs in the event",
"enum": ["SELF_DESCRIBING_EVENT", "CONTEXT"]
}
},
"required": ["schemaKey", "format", "snowplowEntity"],
"additionalProperties": false
}
}
},
"required": ["transformation", "types"],
"additionalProperties": false
},
{
"properties": {
"transformation": {
"description": "Type of the transformation",
"enum": ["WIDEROW"]
},
"fileFormat": {
"description": "Output file format",
"enum": ["JSON", "PARQUET"]
},
"types": {
"description": "Set of Iglu URIs and the type of Snowplow entity each one was used as",
"type": "array",
"items": {
"properties": {
"schemaKey": {
"description": "Iglu URI",
"type": "string",
"maxLength": 256
},
"snowplowEntity": {
"description": "Type of the self-describing JSONs in the event",
"enum": ["SELF_DESCRIBING_EVENT", "CONTEXT"]
}
},
"required": ["schemaKey", "snowplowEntity"],
"additionalProperties": false
}
}
},
"required": ["transformation", "fileFormat", "types"],
"additionalProperties": false
}
]
},
"timestamps": {
"description": "Set of timestamps associated with the batch",
"type": "object",
"properties": {
"jobStarted": {
"description": "Time when the batch started being shredded",
"type": "string",
"format": "date-time"
},
"jobCompleted": {
"description": "Time when the batch shredding finished (and the message was being prepared)",
"type": "string",
"format": "date-time"
},
"min": {
"description": "The earliest collector_tstamp available in the batch",
"type": ["string", "null"],
"format": "date-time"
},
"max": {
"description": "The latest collector_tstamp available in the batch",
"type": ["string", "null"],
"format": "date-time"
}
},
"required": ["jobStarted", "jobCompleted", "min", "max"]
},
"processor": {
"description": "Identifier of the shredder that sent the message",
"type": "object",
"properties": {
"artifact": {
"description": "Name of the artifact",
"type": "string",
"maxLength": 64
},
"version": {
"description": "Semantic Version of the artifact",
"type": "string",
"maxLength": 16
}
},
"required": ["artifact", "version"]
},
"count": {
"description": "Count of events in the batch, null means the count could not be calculated",
"type": ["object", "null"],
"properties": {
"good": {
"description": "Number of good events in the batch",
"type": "integer",
"minimum": 0
},
"bad": {
"description": "Number of bad events in the batch",
"type": "integer",
"minimum": 0
}
}
}
},
"required": ["base", "compression", "typesInfo", "timestamps", "processor"],
"additionalProperties": false
}

0 comments on commit 1861799

Please sign in to comment.