Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
13 changes: 12 additions & 1 deletion src/ncoreparser/parser.py
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,7 @@ def __init__(self) -> None:
self.id_and_name_pattern = re.compile(
r'<a href=".*?" onclick="torrent\(([0-9]+)\); return false;" title="(.*?)">'
)
self.id_and_poster_pattern = re.compile(r'<img onmouseout="elrejt\(\'borito([0-9]+)\'\)" onmouseover="mutat\(\'(.*?)\', \'[0-9]+\',.*?>')
self.date_and_time_pattern = re.compile(r'<div class="box_feltoltve2">(.*?)<br>(.*?)</div>')
self.size_pattern = re.compile(r'<div class="box_meret2">(.*?)</div>')
self.not_found_pattern = re.compile(r'<div class="lista_mini_error">Nincs találat!</div>')
Expand All @@ -35,6 +36,7 @@ def get_key(data: str) -> Union[str, None]:
def get_items(self, data: str) -> Generator[dict, None, None]:
types = self.type_pattern.findall(data)
ids_and_names = self.id_and_name_pattern.findall(data)
ids_and_posters = self.id_and_poster_pattern.findall(data)
dates_and_times = self.date_and_time_pattern.findall(data)
sizes = self.size_pattern.findall(data)
seed = self.seeders_pattern.findall(data)
Expand All @@ -46,6 +48,7 @@ def get_items(self, data: str) -> Generator[dict, None, None]:
ids, names = zip(*ids_and_names)
dates, times = zip(*dates_and_times)
key = self.get_key(data)
posters = dict(ids_and_posters)
else:
if not self.not_found_pattern.search(data):
raise NcoreParserError(f"Error while parse download items in {self.__class__.__name__}.")
Expand All @@ -61,6 +64,7 @@ def get_items(self, data: str) -> Generator[dict, None, None]:
"type": SearchParamType(types[i]),
"seed": seed[i],
"leech": leech[i],
"poster": posters.get(id),
}

def get_num_of_pages(self, data: str) -> int:
Expand Down Expand Up @@ -95,6 +99,7 @@ def __init__(self) -> None:
r'class="dd"><a onclick=".*?">(?P<leech>[0-9]+)</a></div>',
re.DOTALL,
)
self.poster_pattern = re.compile(r'<img src="(?P<poster>.*?)" alt="Borító">')

def get_item(self, data: str) -> dict:
try:
Expand Down Expand Up @@ -125,9 +130,15 @@ def get_item(self, data: str) -> dict:
leech = peers_match.group("leech")
else:
raise NcoreParserError("Peers pattern not found in data")
poster_match = self.poster_pattern.search(data)
if poster_match:
poster = poster_match.group("poster")
else:
# Some torrents don't have a poster so no error if not found
poster = None
except AttributeError as e:
raise NcoreParserError(f"Error while parsing by detailed page. {e}") from e
return {"title": title, "key": key, "date": date, "size": size, "type": t_type, "seed": seed, "leech": leech}
return {"title": title, "key": key, "date": date, "size": size, "type": t_type, "seed": seed, "leech": leech, "poster": poster}


class RssParser:
Expand Down
3 changes: 2 additions & 1 deletion src/ncoreparser/torrent.py
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@ def get_torrent_page_url(torrent_id: str) -> str:

class Torrent:
def __init__(
self, id: str, title: str, key: str, size: Size, type: str, date: str, seed: str, leech: str, **params: Any
self, id: str, title: str, key: str, size: Size, type: str, date: str, seed: str, leech: str, poster: str, **params: Any
) -> None:
self._details = {
"id": id,
Expand All @@ -24,6 +24,7 @@ def __init__(
"leech": leech,
"download": URLs.DOWNLOAD_LINK.value.format(id=id, key=key),
"url": get_torrent_page_url(torrent_id=id),
"poster": poster,
}
self._details.update(params)

Expand Down