From 4787a36d0e95731fdf90388db8701adcfd1cc796 Mon Sep 17 00:00:00 2001 From: vincent Date: Thu, 13 May 2021 13:30:23 +0200 Subject: [PATCH] fix parsing issue --- backend/chainetv/emission.py | 21 +++++++++++++-------- 1 file changed, 13 insertions(+), 8 deletions(-) diff --git a/backend/chainetv/emission.py b/backend/chainetv/emission.py index 7eb7b8c..d79a56e 100644 --- a/backend/chainetv/emission.py +++ b/backend/chainetv/emission.py @@ -33,15 +33,21 @@ class Emmission(object): pass strsearch=strsearch.replace('É','E') strsearch=strsearch.strip() - linkchaine=self.html.find(title=re.compile(re.escape(strsearch))) - if linkchaine == None: + print(strsearch) + chaineElement=self.html.find(string=re.compile(re.escape(strsearch))) + if chaineElement == None: strsearch=strsearch.replace(" ","") - linkchaine=self.html.find(title=re.compile(re.escape(strsearch))) - if linkchaine == None: + chaineElement=self.html.find(string=re.compile(re.escape(strsearch))) + if chaineElement == None: return "can't find channel" - link = linkchaine.parent.parent.find_next_sibling().find("a") + emissionElement=chaineElement.parent.parent.parent.find_next_sibling() + print(emissionElement) + link = emissionElement.find("a") href = link['href'] - img=linkchaine.parent.parent.find_next_sibling().find_next('img')['src'] + try: + img=emissionElement.find_next('img')['data-src'] + except KeyError: + img=emissionElement.find_next('img')['src'] response = urllib.request.urlopen(href) parse=BeautifulSoup(response.read(),"html.parser") divcasting=parse.select_one(".peopleList") @@ -53,7 +59,7 @@ class Emmission(object): count+=1 else: casting= None - divsynopsis=parse.select_one(".synopsis-text") + divsynopsis=parse.select_one(".synopsis") if (divsynopsis): synopsis=divsynopsis.text else: @@ -71,4 +77,3 @@ def remove_first_space (string): else: break return string[space_number:] -