Skip to content

Commit

Permalink
Merge pull request #21 from iheartradio/ihracp-7339/utc-timezone-offsets
Browse files Browse the repository at this point in the history
Adding all timezone offsets
  • Loading branch information
DrewJoseyGit authored Sep 9, 2024
2 parents 0bd1c71 + 4e94438 commit f54a22d
Show file tree
Hide file tree
Showing 5 changed files with 242 additions and 74 deletions.
19 changes: 19 additions & 0 deletions .pre-commit-config.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,19 @@
repos:
- repo: https://github.com/ambv/black
rev: 22.3.0
hooks:
- id: black
name: black
entry: black
require_serial: true
language: python
language_version: python3
types_or: [cython, pyi, python]
minimum_pre_commit_version: '2.9.2'
# additional_dependencies: ['black==22.3.0']
- repo: https://github.com/pre-commit/pre-commit-hooks
rev: v2.0.0
hooks:
- id: flake8
exclude: ^test
args: ['--ignore=F841,E722,F821,E711,E231,W503,E501,F401']
166 changes: 137 additions & 29 deletions pypodcastparser/Item.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,9 +13,32 @@
LOGGER = logging.getLogger(__name__)


pytz_timezon_list = [tz for tz in pytz.all_timezones]
pytz_timezone_list = [tz for tz in pytz.all_timezones]

common_timezones = {
"IDLW": "Pacific/Midway",
"NUT": "Pacific/Niue",
"MART": "Pacific/Marquesas",
"AKST": "America/Anchorage",
"MST": "America/Denver",
"EST": "America/New_York",
"VET": "America/Caracas",
"BRT": "America/Sao_Paulo",
"GST": "Asia/Dubai",
"AZOT": "Atlantic/Azores",
"MSK": "Europe/Moscow",
"PKT": "Asia/Karachi",
"NPT": "Asia/Kathmandu",
"MMT": "Asia/Rangoon",
"ICT": "Asia/Bangkok",
"AWST": "Australia/Perth",
"ACWST": "Australia/Eucla",
"GMT": "GMT",
"ACST": "Australia/Adelaide",
"AEDT": "Australia/Sydney",
"CHAST": "Pacific/Chatham",
"NZDT": "Pacific/Auckland",
"LINT": "Pacific/Kiritimati",
"UTC": "UTC",
"CET": "Europe/Berlin",
"EET": "Africa/Cairo",
Expand All @@ -33,6 +56,47 @@
"CAT": "Africa/Maputo",
"AEST": "Australia/Sydney",
"PDT": "America/Los_Angeles",
"NZST": "Pacific/Auckland",
}

# Map of timezone offsets to timezone abbreviations
offset_map = {
"-1200": "IDLW",
"-1100": "NUT",
"-1000": "HST",
"-0930": "MART",
"-0900": "AKST",
"-0800": "PST",
"-0700": "MST",
"-0600": "CST",
"-0500": "EST",
"-0430": "VET",
"-0400": "AST",
"-0330": "NST",
"-0300": "BRT",
"-0200": "GST",
"-0100": "AZOT",
"-0000": "GMT",
"+0100": "CET",
"+0200": "EET",
"+0300": "MSK",
"+0400": "GST",
"+0500": "PKT",
"+0545": "NPT",
"+0600": "BST",
"+0630": "MMT",
"+0700": "ICT",
"+0800": "AWST",
"+0845": "ACWST",
"+0900": "JST",
"+0930": "ACST",
"+1000": "AEST",
"+1030": "ACST",
"+1100": "AEDT",
"+1200": "NZST",
"+1245": "CHAST",
"+1300": "NZDT",
"+1400": "LINT",
}


Expand Down Expand Up @@ -159,7 +223,9 @@ def set_time_published(self):
except (TypeError, ValueError, IndexError):
self.time_published = None
except Exception:
raise InvalidPodcastFeed(f"Invalid Podcast Feed, episode level pubDate: {self.published_date_string}, could not be parsed")
raise InvalidPodcastFeed(
f"Invalid Podcast Feed, episode level pubDate: {self.published_date_string}, could not be parsed"
)

def set_dates_published(self):
if self.time_published is None:
Expand All @@ -170,7 +236,9 @@ def set_dates_published(self):
except ValueError:
self.date_time = None
except Exception:
raise InvalidPodcastFeed(f"Invalid Podcast Feed, episode level pubDate: {self.published_date_string}, could not be parsed")
raise InvalidPodcastFeed(
f"Invalid Podcast Feed, episode level pubDate: {self.published_date_string}, could not be parsed"
)

def to_dict(self):
item = {}
Expand Down Expand Up @@ -203,7 +271,9 @@ def set_author(self, tag):
except AttributeError:
self.author = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level author could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level author could not be parsed"
)

def set_description(self, tag):
"""Parses description and set value."""
Expand All @@ -212,7 +282,9 @@ def set_description(self, tag):
except AttributeError:
self.description = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level description could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level description could not be parsed"
)

def set_content_encoded(self, tag):
"""Parses content_encoded and set value."""
Expand All @@ -223,7 +295,9 @@ def set_content_encoded(self, tag):
except AttributeError:
self.content_encoded = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level content_encoded could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level content_encoded could not be parsed"
)

def set_enclosure(self, tag):
"""Parses enclosure_url, enclosure_type then set values."""
Expand All @@ -248,7 +322,9 @@ def set_guid(self, tag):
except AttributeError:
self.guid = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level guid could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level guid could not be parsed"
)

# TODO convert to one timezone
def set_published_date(self, tag):
Expand All @@ -262,22 +338,28 @@ def set_published_date(self, tag):
raise AttributeError

published_date_timezone = ""
# Check for timezone abbreviation
if re.match("^[a-zA-Z]{3}$", deconstructed_date[-1]):
published_date_timezone = deconstructed_date[-1]
deconstructed_date.pop()
elif "+1000" in self.published_date:
published_date_timezone = "AEST"
deconstructed_date.pop()
else:
# Check for specific timezone offsets
for offset, tz in offset_map.items():
if offset in self.published_date:
published_date_timezone = tz
deconstructed_date.pop()
break
if not published_date_timezone:
published_date_timezone = "EST"

regex_array = [
"^[a-zA-Z]{3},$",
"^\d{1,2}$",
"^[a-zA-Z]{3}$",
"^\d{4}$",
"^\d\d:\d\d",
r"^[a-zA-Z]{3},$", # Raw string, so \ is treated literally
r"^\d{1,2}$",
r"^[a-zA-Z]{3}$",
r"^\d{4}$",
r"^\d\d:\d\d",
]

new_array = []
for array_index, array_value in enumerate(regex_array):
if re.match(deconstructed_date[array_index], array_value):
Expand Down Expand Up @@ -329,7 +411,7 @@ def set_published_date(self, tag):
)

if published_date_timezone not in ["ET", "EST", "EDT"]:
if published_date_timezone in pytz_timezon_list:
if published_date_timezone in pytz_timezone_list:
current_timezone = pytz.timezone(published_date_timezone)
else:
current_timezone = pytz.timezone(
Expand Down Expand Up @@ -360,7 +442,9 @@ def set_title(self, tag):
except AttributeError:
self.title = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level title could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level title could not be parsed"
)

def set_itunes_author_name(self, tag):
"""Parses author name from itunes tags and sets value"""
Expand All @@ -369,7 +453,9 @@ def set_itunes_author_name(self, tag):
except AttributeError:
self.itunes_author_name = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level itunes:author could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level itunes:author could not be parsed"
)

def set_itunes_episode(self, tag):
"""Parses the episode number and sets value"""
Expand All @@ -381,7 +467,9 @@ def set_itunes_episode(self, tag):
except AttributeError:
self.itunes_episode = "0"
except Exception:
raise InvalidPodcastFeed(f"Invalid Podcast Feed, episode level itunes:episode: {tag.string}, could not be parsed")
raise InvalidPodcastFeed(
f"Invalid Podcast Feed, episode level itunes:episode: {tag.string}, could not be parsed"
)

def set_podcast_transcript(self, tag):
"""Parses the episode transcript and sets value
Expand All @@ -399,7 +487,9 @@ def set_podcast_transcript(self, tag):
except AttributeError:
self.podcast_transcript = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode transcription could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode transcription could not be parsed"
)

def set_itunes_season(self, tag):
"""Parses the episode season and sets value"""
Expand All @@ -418,7 +508,9 @@ def set_itunes_episode_type(self, tag):
except AttributeError:
self.itunes_episode_type = None
except Exception:
raise InvalidPodcastFeed(f"Invalid Podcast Feed, episode level itunes:episodeType: {tag.string}, could not be parsed")
raise InvalidPodcastFeed(
f"Invalid Podcast Feed, episode level itunes:episodeType: {tag.string}, could not be parsed"
)

def set_itunes_block(self, tag):
"""Check and see if item is blocked from iTunes and sets value"""
Expand All @@ -427,7 +519,9 @@ def set_itunes_block(self, tag):
except AttributeError:
block = ""
except Exception:
raise InvalidPodcastFeed(f"Invalid Podcast Feed, episode level itunes:block: {tag.string}, could not be parsed")
raise InvalidPodcastFeed(
f"Invalid Podcast Feed, episode level itunes:block: {tag.string}, could not be parsed"
)
if block == "yes":
self.itunes_block = True
else:
Expand Down Expand Up @@ -464,7 +558,9 @@ def set_itunes_duration(self, tag):
except AttributeError:
self.itunes_duration = None
except Exception:
raise InvalidPodcastFeed(f"Invalid Podcast Feed, episode level itunes:duration: {tag.string}, could not be parsed")
raise InvalidPodcastFeed(
f"Invalid Podcast Feed, episode level itunes:duration: {tag.string}, could not be parsed"
)

def set_itunes_explicit(self, tag):
"""Parses explicit from itunes item tags and sets value"""
Expand All @@ -488,7 +584,9 @@ def set_itunes_explicit(self, tag):
except AttributeError:
self.itunes_explicit = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level itunes:explicit could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level itunes:explicit could not be parsed"
)

def set_itunes_image(self, tag):
"""Parses itunes item images and set url as value"""
Expand All @@ -497,7 +595,9 @@ def set_itunes_image(self, tag):
except AttributeError:
self.itunes_image = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level itunes:image could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level itunes:image could not be parsed"
)

def set_itunes_order(self, tag):
"""Parses episode order and set url as value"""
Expand All @@ -507,7 +607,9 @@ def set_itunes_order(self, tag):
except AttributeError:
self.itunes_order = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level itunes:order could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level itunes:order could not be parsed"
)

def set_itunes_subtitle(self, tag):
"""Parses subtitle from itunes tags and sets value"""
Expand All @@ -516,7 +618,9 @@ def set_itunes_subtitle(self, tag):
except AttributeError:
self.itunes_subtitle = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level itunes:subtitle could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level itunes:subtitle could not be parsed"
)

def set_itunes_summary(self, tag):
"""Parses summary from itunes tags and sets value"""
Expand All @@ -525,7 +629,9 @@ def set_itunes_summary(self, tag):
except AttributeError:
self.itunes_summary = None
except Exception:
raise InvalidPodcastFeed("Invalid Podcast Feed, episode level itunes:summary could not be parsed")
raise InvalidPodcastFeed(
"Invalid Podcast Feed, episode level itunes:summary could not be parsed"
)

def set_interactive(self, tag):
"""Parses author and set value."""
Expand All @@ -536,4 +642,6 @@ def set_interactive(self, tag):
self.interactive = False
self.is_interactive = self.interactive
except Exception:
raise InvalidPodcastFeed(f"Invalid Podcast Feed, episode level ihr:interactive: {tag.string}, could not be parsed")
raise InvalidPodcastFeed(
f"Invalid Podcast Feed, episode level ihr:interactive: {tag.string}, could not be parsed"
)
Loading

0 comments on commit f54a22d

Please sign in to comment.