blob: 3fd10ce79e087eb2bf1d70b5abc9537c6989262c (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
|
import re
import time
from resources.lib.vrtplayer import metadatacreator
from resources.lib.vrtplayer import statichelper
class MetadataCollector:
def __init__(self):
pass
def get_single_layout_episode_metadata(self, soup):
metadata_creator = metadatacreator.MetadataCreator()
metadata_creator.duration = self.__get_episode_duration(soup)
metadata_creator.plot = self.get_plot(soup)
metadata_creator.datetime = self.get_broadcast_datetime(soup)
return metadata_creator.get_video_dictionary()
def get_multiple_layout_episode_metadata(self, soup):
metadata_creator = metadatacreator.MetadataCreator()
metadata_creator.duration = self.__get_multiple_layout_episode_duration(soup)
return metadata_creator.get_video_dictionary()
@staticmethod
def __get_episode_duration(soup):
duration = None
duration_item = soup.find(class_="content__duration")
if duration_item is not None:
minutes = re.findall("\d+", duration_item.text)
if len(minutes) != 0:
duration = statichelper.minutes_string_to_seconds_int(minutes[0])
return duration
@staticmethod
def get_az_metadata(tile):
metadata_creator = metadatacreator.MetadataCreator()
description = ""
description_item = tile.find(class_="tile__description")
if description_item is not None:
p_item = description_item.find("p")
if p_item is not None:
description = p_item.text.strip()
metadata_creator.plot = description
return metadata_creator.get_video_dictionary()
@staticmethod
def get_plot(soup):
description = ""
description_item = soup.find(class_="content__shortdescription")
if description_item is not None:
description = description_item.text
return description
@staticmethod
def get_broadcast_datetime(soup):
broadcast_datetime = None
broadcast_date_element = soup.find(class_="content__broadcastdate")
if broadcast_date_element is None:
return broadcast_datetime
time_element = broadcast_date_element.find("time")
if time_element is None:
return broadcast_datetime
broadcast_datetime = time.strptime(time_element["datetime"][:18], "%Y-%m-%dT%H:%M:%S")
return broadcast_datetime
@staticmethod
def __get_multiple_layout_episode_duration(soup):
seconds = None
minutes_element = soup.find("abbr", {"title": "minuten"})
if minutes_element is not None and minutes_element.parent is not None:
minutes = minutes_element.parent.next_element
seconds = statichelper.minutes_string_to_seconds_int(minutes)
return seconds
|