Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Update Timezone Offsets #22

Merged
merged 11 commits into from
Sep 10, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
19 changes: 19 additions & 0 deletions .pre-commit-config.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,19 @@
repos:
- repo: https://github.com/ambv/black
rev: 22.3.0
hooks:
- id: black
name: black
entry: black
require_serial: true
language: python
language_version: python3
types_or: [cython, pyi, python]
minimum_pre_commit_version: '2.9.2'
# additional_dependencies: ['black==22.3.0']
- repo: https://github.com/pre-commit/pre-commit-hooks
rev: v2.0.0
hooks:
- id: flake8
exclude: ^test
args: ['--ignore=F841,E722,F821,E711,E231,W503,E501,F401']
166 changes: 137 additions & 29 deletions pypodcastparser/Item.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,9 +13,32 @@
LOGGER = logging.getLogger(__name__)


pytz_timezon_list = [tz for tz in pytz.all_timezones]
pytz_timezone_list = [tz for tz in pytz.all_timezones]

common_timezones = {
"IDLW": "Pacific/Midway",
"NUT": "Pacific/Niue",
"MART": "Pacific/Marquesas",
"AKST": "America/Anchorage",
"MST": "America/Denver",
"EST": "America/New_York",
"VET": "America/Caracas",
"BRT": "America/Sao_Paulo",
"GST": "Asia/Dubai",
"AZOT": "Atlantic/Azores",
"MSK": "Europe/Moscow",
"PKT": "Asia/Karachi",
"NPT": "Asia/Kathmandu",
"MMT": "Asia/Rangoon",
"ICT": "Asia/Bangkok",
"AWST": "Australia/Perth",
"ACWST": "Australia/Eucla",
"GMT": "GMT",
"ACST": "Australia/Adelaide",
"AEDT": "Australia/Sydney",
"CHAST": "Pacific/Chatham",
"NZDT": "Pacific/Auckland",
"LINT": "Pacific/Kiritimati",
"UTC": "UTC",
"CET": "Europe/Berlin",
"EET": "Africa/Cairo",
Expand All @@ -33,6 +56,47 @@
"CAT": "Africa/Maputo",
"AEST": "Australia/Sydney",
"PDT": "America/Los_Angeles",
"NZST": "Pacific/Auckland",
}

# Map of timezone offsets to timezone abbreviations
offset_map = {
"-1200": "IDLW",
"-1100": "NUT",
"-1000": "HST",
"-0930": "MART",
"-0900": "AKST",
"-0800": "PST",
"-0700": "MST",
"-0600": "CST",
"-0500": "EST",
"-0430": "VET",
"-0400": "AST",
"-0330": "NST",
"-0300": "BRT",
"-0200": "GST",
"-0100": "AZOT",
"-0000": "GMT",
"+0100": "CET",
"+0200": "EET",
"+0300": "MSK",
"+0400": "GST",
"+0500": "PKT",
"+0545": "NPT",
"+0600": "BST",
"+0630": "MMT",
"+0700": "ICT",
"+0800": "AWST",
"+0845": "ACWST",
"+0900": "JST",
"+0930": "ACST",
"+1000": "AEST",
"+1030": "ACST",
"+1100": "AEDT",
"+1200": "NZST",
"+1245": "CHAST",
"+1300": "NZDT",
"+1400": "LINT",
}


Expand Down Expand Up @@ -159,7 +223,9 @@ def set_time_published(self):
except (TypeError, ValueError, IndexError):
self.time_published = None
except Exception:
raise InvalidPodcastFeed(f"Invalid Podcast Feed, episode level pubDate: {self.published_date_string}, could not be parsed")
raise InvalidPodcastFeed(
f"Invalid Podcast Feed, episode level pubDate: {self.published_date_string}, could not be parsed"
)

def set_dates_published(self):
if self.time_published is None:
Expand All @@ -170,7 +236,9 @@ def set_dates_published(self):
except ValueError:
self.date_time = None
except Exception:
raise InvalidPodcastFeed(f"Invalid Podcast Feed, episode level pubDate: {self.published_date_string}, could not be parsed")
raise InvalidPodcastFeed(
f"Invalid Podcast Feed, episode level pubDate: {self.published_date_string}, could not be parsed"
)

def to_dict(self):
item = {}
Expand Down Expand Up @@ -203,7 +271,9 @@ def set_author(self, tag):
except AttributeError:
self.author = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level author could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level author could not be parsed"
)

def set_description(self, tag):
"""Parses description and set value."""
Expand All @@ -212,7 +282,9 @@ def set_description(self, tag):
except AttributeError:
self.description = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level description could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level description could not be parsed"
)

def set_content_encoded(self, tag):
"""Parses content_encoded and set value."""
Expand All @@ -223,7 +295,9 @@ def set_content_encoded(self, tag):
except AttributeError:
self.content_encoded = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level content_encoded could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level content_encoded could not be parsed"
)

def set_enclosure(self, tag):
"""Parses enclosure_url, enclosure_type then set values."""
Expand All @@ -248,7 +322,9 @@ def set_guid(self, tag):
except AttributeError:
self.guid = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level guid could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level guid could not be parsed"
)

# TODO convert to one timezone
def set_published_date(self, tag):
Expand All @@ -262,22 +338,28 @@ def set_published_date(self, tag):
raise AttributeError

published_date_timezone = ""
# Check for timezone abbreviation
if re.match("^[a-zA-Z]{3}$", deconstructed_date[-1]):
published_date_timezone = deconstructed_date[-1]
deconstructed_date.pop()
elif "+1000" in self.published_date:
published_date_timezone = "AEST"
deconstructed_date.pop()
else:
# Check for specific timezone offsets
for offset, tz in offset_map.items():
if offset in self.published_date:
published_date_timezone = tz
deconstructed_date.pop()
break
if not published_date_timezone:
published_date_timezone = "EST"

regex_array = [
"^[a-zA-Z]{3},$",
"^\d{1,2}$",
"^[a-zA-Z]{3}$",
"^\d{4}$",
"^\d\d:\d\d",
r"^[a-zA-Z]{3},$", # Raw string, so \ is treated literally
r"^\d{1,2}$",
r"^[a-zA-Z]{3}$",
r"^\d{4}$",
r"^\d\d:\d\d",
]

new_array = []
for array_index, array_value in enumerate(regex_array):
if re.match(deconstructed_date[array_index], array_value):
Expand Down Expand Up @@ -329,7 +411,7 @@ def set_published_date(self, tag):
)

if published_date_timezone not in ["ET", "EST", "EDT"]:
if published_date_timezone in pytz_timezon_list:
if published_date_timezone in pytz_timezone_list:
current_timezone = pytz.timezone(published_date_timezone)
else:
current_timezone = pytz.timezone(
Expand Down Expand Up @@ -360,7 +442,9 @@ def set_title(self, tag):
except AttributeError:
self.title = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level title could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level title could not be parsed"
)

def set_itunes_author_name(self, tag):
"""Parses author name from itunes tags and sets value"""
Expand All @@ -369,7 +453,9 @@ def set_itunes_author_name(self, tag):
except AttributeError:
self.itunes_author_name = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level itunes:author could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level itunes:author could not be parsed"
)

def set_itunes_episode(self, tag):
"""Parses the episode number and sets value"""
Expand All @@ -381,7 +467,9 @@ def set_itunes_episode(self, tag):
except AttributeError:
self.itunes_episode = "0"
except Exception:
raise InvalidPodcastFeed(f"Invalid Podcast Feed, episode level itunes:episode: {tag.string}, could not be parsed")
raise InvalidPodcastFeed(
f"Invalid Podcast Feed, episode level itunes:episode: {tag.string}, could not be parsed"
)

def set_podcast_transcript(self, tag):
"""Parses the episode transcript and sets value
Expand All @@ -399,7 +487,9 @@ def set_podcast_transcript(self, tag):
except AttributeError:
self.podcast_transcript = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode transcription could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode transcription could not be parsed"
)

def set_itunes_season(self, tag):
"""Parses the episode season and sets value"""
Expand All @@ -418,7 +508,9 @@ def set_itunes_episode_type(self, tag):
except AttributeError:
self.itunes_episode_type = None
except Exception:
raise InvalidPodcastFeed(f"Invalid Podcast Feed, episode level itunes:episodeType: {tag.string}, could not be parsed")
raise InvalidPodcastFeed(
f"Invalid Podcast Feed, episode level itunes:episodeType: {tag.string}, could not be parsed"
)

def set_itunes_block(self, tag):
"""Check and see if item is blocked from iTunes and sets value"""
Expand All @@ -427,7 +519,9 @@ def set_itunes_block(self, tag):
except AttributeError:
block = ""
except Exception:
raise InvalidPodcastFeed(f"Invalid Podcast Feed, episode level itunes:block: {tag.string}, could not be parsed")
raise InvalidPodcastFeed(
f"Invalid Podcast Feed, episode level itunes:block: {tag.string}, could not be parsed"
)
if block == "yes":
self.itunes_block = True
else:
Expand Down Expand Up @@ -464,7 +558,9 @@ def set_itunes_duration(self, tag):
except AttributeError:
self.itunes_duration = None
except Exception:
raise InvalidPodcastFeed(f"Invalid Podcast Feed, episode level itunes:duration: {tag.string}, could not be parsed")
raise InvalidPodcastFeed(
f"Invalid Podcast Feed, episode level itunes:duration: {tag.string}, could not be parsed"
)

def set_itunes_explicit(self, tag):
"""Parses explicit from itunes item tags and sets value"""
Expand All @@ -488,7 +584,9 @@ def set_itunes_explicit(self, tag):
except AttributeError:
self.itunes_explicit = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level itunes:explicit could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level itunes:explicit could not be parsed"
)

def set_itunes_image(self, tag):
"""Parses itunes item images and set url as value"""
Expand All @@ -497,7 +595,9 @@ def set_itunes_image(self, tag):
except AttributeError:
self.itunes_image = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level itunes:image could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level itunes:image could not be parsed"
)

def set_itunes_order(self, tag):
"""Parses episode order and set url as value"""
Expand All @@ -507,7 +607,9 @@ def set_itunes_order(self, tag):
except AttributeError:
self.itunes_order = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level itunes:order could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level itunes:order could not be parsed"
)

def set_itunes_subtitle(self, tag):
"""Parses subtitle from itunes tags and sets value"""
Expand All @@ -516,7 +618,9 @@ def set_itunes_subtitle(self, tag):
except AttributeError:
self.itunes_subtitle = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level itunes:subtitle could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level itunes:subtitle could not be parsed"
)

def set_itunes_summary(self, tag):
"""Parses summary from itunes tags and sets value"""
Expand All @@ -525,7 +629,9 @@ def set_itunes_summary(self, tag):
except AttributeError:
self.itunes_summary = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level itunes:summary could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level itunes:summary could not be parsed"
)

def set_interactive(self, tag):
"""Parses author and set value."""
Expand All @@ -536,4 +642,6 @@ def set_interactive(self, tag):
self.interactive = False
self.is_interactive = self.interactive
except Exception:
raise InvalidPodcastFeed(f"Invalid Podcast Feed, episode level ihr:interactive: {tag.string}, could not be parsed")
raise InvalidPodcastFeed(
f"Invalid Podcast Feed, episode level ihr:interactive: {tag.string}, could not be parsed"
)
Loading
Loading