Skip to content

Commit

Permalink
Merge pull request #308 from georgetown-cset/update-events
Browse files (browse the repository at this point in the history)
Update time interval in `events`
  • Loading branch information
jmelot authored Mar 25, 2024
2 parents f4ad91e + 0aa62e3 commit b427a0f
Showing 1 changed file with 5 additions and 70 deletions.
75 changes: 5 additions & 70 deletions sql/events.sql
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
-- TODO: update this query so we don't have to edit it every time the month changes.
-- This queries over 13 TB of data as of 2022-04-20, so run it judiciously
-- This queries over 23 TB of data as of 2024-03-25, so run it judiciously
WITH
relevant_repos AS (
SELECT DISTINCT repo_name
Expand Down Expand Up @@ -186,7 +186,7 @@ curr_data AS (
id,
other
FROM
`githubarchive.month.202301`
`githubarchive.year.2023`
UNION ALL
SELECT
type,
Expand All @@ -199,7 +199,7 @@ curr_data AS (
id,
other
FROM
`githubarchive.month.202302`
`githubarchive.month.202401`
UNION ALL
SELECT
type,
Expand All @@ -212,7 +212,7 @@ curr_data AS (
id,
other
FROM
`githubarchive.month.202303`
`githubarchive.month.202402`
UNION ALL
SELECT
type,
Expand All @@ -225,72 +225,7 @@ curr_data AS (
id,
other
FROM
`githubarchive.month.202304`
UNION ALL
SELECT
type,
public,
payload,
repo,
actor,
org,
created_at,
id,
other
FROM
`githubarchive.month.202305`
UNION ALL
SELECT
type,
public,
payload,
repo,
actor,
org,
created_at,
id,
other
FROM
`githubarchive.month.202306`
UNION ALL
SELECT
type,
public,
payload,
repo,
actor,
org,
created_at,
id,
other
FROM
`githubarchive.month.202307`
UNION ALL
SELECT
type,
public,
payload,
repo,
actor,
org,
created_at,
id,
other
FROM
`githubarchive.month.202308`
UNION ALL
SELECT
type,
public,
payload,
repo,
actor,
org,
created_at,
id,
other
FROM
`githubarchive.month.202309`
`githubarchive.month.202403`
),

-- needed to allow match to data for old repo names
Expand Down

0 comments on commit b427a0f

Please sign in to comment.