Skip to content

Commit

Permalink
skip snapshots for ublad corpus
Browse files Browse the repository at this point in the history
  • Loading branch information
Meesch committed May 24, 2024
1 parent fb04081 commit e5d8971
Showing 1 changed file with 4 additions and 0 deletions.
4 changes: 4 additions & 0 deletions backend/corpora/ublad/ublad.py
Original file line number Diff line number Diff line change
Expand Up @@ -72,6 +72,10 @@ def es_settings(self):

def sources(self, start=min_date, end=max_date):
for directory, _, filenames in os.walk(self.data_directory):
_body, tail = os.path.split(directory)
if tail.startswith("."):
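# Skip files located directly in hidden directories (name starts with "."), e.g. snapshot directories.
# NOTE(review): os.walk still descends into their subdirectories unless they are pruned from the dirnames list in place - confirm this is intended.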
continue
for filename in filenames:
if filename != '.DS_Store':
full_path = join(directory, filename)
Expand Down

0 comments on commit e5d8971

Please sign in to comment.