Skip to content

Commit

Permalink
Skip .snapshot directories when walking the ublad corpus data directory
Browse files: browse the repository at this point in the history
  • Loading branch information
Meesch committed May 28, 2024
1 parent 633be4d commit c4e1e08
Showing 1 changed file with 4 additions and 0 deletions.
4 changes: 4 additions & 0 deletions backend/corpora/ublad/ublad.py
Original file line number Diff line number Diff line change
Expand Up @@ -72,6 +72,10 @@ def es_settings(self):

def sources(self, start=min_date, end=max_date):
for directory, _, filenames in os.walk(self.data_directory):
_body, tail = os.path.split(directory)
if '.snapshot' in _:
_.remove('.snapshot')
continue
for filename in filenames:
if filename != '.DS_Store':
full_path = join(directory, filename)
Expand Down

0 comments on commit c4e1e08

Please sign in to comment.