240 lines
8.3 KiB
Python
240 lines
8.3 KiB
Python
from tkinter import Label,Button,Frame,Tk,Entry,StringVar,LEFT,RIGHT
|
|
import json
|
|
import sys
|
|
import os
|
|
import unicodedata
|
|
from bs4 import BeautifulSoup
|
|
import webbrowser
|
|
import urllib.request
|
|
import re
|
|
|
|
class Labbelink (Label):
|
|
|
|
def __init__(self,parent,text,link):
|
|
Label.__init__(self,parent,text=text,fg="blue",cursor="hand2")
|
|
self.link=link
|
|
self.bind("<Button-1>",self._openlink)
|
|
|
|
def _openlink(self,evt):
|
|
webbrowser.open(self.link)
|
|
|
|
class Interface:
|
|
|
|
def __init__(self):
|
|
self.datafilepath=os.path.dirname(os.path.realpath(__file__))+"/chaine.json"
|
|
self.data = load_jsonfile(self.datafilepath)
|
|
self.fenetre = Tk()
|
|
self.fenetre.title("recherche de chaine")
|
|
self.value = StringVar()
|
|
self.label = Label(self.fenetre, text="entrer numero de chaine")
|
|
self.entree = Entry(self.fenetre, textvariable=self.value, width=30)
|
|
self.frame = Frame(self.fenetre)
|
|
self.resultframe = Frame(self.fenetre)
|
|
self.bouton_update_base = Button(
|
|
self.fenetre, text="update la base de chaine", command=self.click_update)
|
|
self.bouton = Button(self.frame, text="OK", command=self.click)
|
|
self.reset = Button(self.frame, text="reset", command=self.click_reset)
|
|
self.label.pack()
|
|
self.entree.pack()
|
|
self.entree.focus_set()
|
|
self.resultframe.pack(expand=1,fill='both')
|
|
self.frame.pack()
|
|
self.bouton.pack(side=LEFT)
|
|
self.reset.pack(side=RIGHT)
|
|
self.bouton_update_base.pack()
|
|
self.fenetre.bind("<Key-Return>", self.enter)
|
|
self.fenetre.bind("<Key-Escape>", self.eventreset)
|
|
|
|
|
|
def enter(self,evt):
|
|
self.click()
|
|
|
|
def eventreset(self,evt):
|
|
self.click_reset()
|
|
|
|
def mainloop(self):
|
|
self.fenetre.mainloop()
|
|
|
|
def click(self):
|
|
print(self.value.get())
|
|
|
|
try:
|
|
strlink=geturlprogrammetv(self.data[self.value.get()])
|
|
link= Labbelink(self.resultframe,self.data[self.value.get()],strlink)
|
|
link.pack()
|
|
print(self.data[self.value.get()])
|
|
emision=parse_emmission(strlink)
|
|
if emision:
|
|
if emision == "can't find show":
|
|
Label(self.resultframe,text="impssible de parser cette chaine").pack()
|
|
else:
|
|
Label(self.resultframe,text="emmision ce soir: "+emision["title"]).pack()
|
|
if len(emision['casting']) > 0:
|
|
Label(self.resultframe,text="réalisateur: "+emision['casting'][0]).pack()
|
|
Label(self.resultframe,text="acteur: "+str(emision['casting'][1:])).pack()
|
|
Label(self.resultframe,text="synopsys: " +emision['synopsis'],wraplength=250).pack()
|
|
Label(self.resultframe,text="lien: "+emision['href ']).pack()
|
|
self.resultframe.update()
|
|
|
|
else:
|
|
Label(self.resultframe,text="pas de connection internet impossible de determiner l'émission du soir").pack()
|
|
|
|
except KeyError:
|
|
print("numero de chaine inconnue")
|
|
unknow=Label(self.resultframe, text="numero de chaine inconnue")
|
|
unknow.pack()
|
|
|
|
|
|
|
|
#self.label2["text"] += geturlprogrammetv(self.data[self.value.get()])
|
|
|
|
self.value.set("")
|
|
|
|
def click_reset(self):
|
|
print("reset")
|
|
for child in self.resultframe.winfo_children():
|
|
child.destroy()
|
|
|
|
|
|
def click_update(self):
|
|
parsechaine(self.datafilepath)
|
|
self.data = load_jsonfile(self.datafilepath)
|
|
labelupdate = Label(self.resultframe, text="update chaine done"+"\r")
|
|
labelupdate.pack()
|
|
|
|
def _openlink(self,link):
|
|
webbrowser.open_new(link)
|
|
|
|
|
|
|
|
|
|
def load_jsonfile(file):
|
|
try:
|
|
with open(file, 'r', encoding='utf-8') as f:
|
|
return json.load(f)
|
|
except FileNotFoundError:
|
|
parsechaine(file)
|
|
with open(file, 'r', encoding='utf-8') as f:
|
|
return json.load(f)
|
|
|
|
def RepresentsInt(s):
|
|
try:
|
|
int(s)
|
|
return True
|
|
except ValueError:
|
|
return False
|
|
except TypeError:
|
|
return False
|
|
|
|
def parsechaine(file):
|
|
|
|
URL = 'https://fr.wikipedia.org/wiki/Liste_des_cha%C3%AEnes_de_Canal'
|
|
liste_chaine = {}
|
|
response = urllib.request.urlopen(URL)
|
|
html = response.read()
|
|
parse = BeautifulSoup(html,"html.parser")
|
|
for item in parse.find_all('table'):
|
|
if (item.get("class") == ['wikitable'] or item.get("class") == ['wikitable', 'sortable']):
|
|
for tr in item.find_all('tr'):
|
|
|
|
firstTD = tr.find()
|
|
num = firstTD.text
|
|
#print(num)
|
|
if RepresentsInt(num):
|
|
|
|
if RepresentsInt(firstTD.find_next().string):
|
|
#print(firstTD.find_next().find_next().text)
|
|
liste_chaine[int(num)] = firstTD.find_next().find_next().text
|
|
else:
|
|
#print(firstTD.find_next().string)
|
|
liste_chaine[int(num)] = firstTD.find_next().text
|
|
print(json.dumps(liste_chaine, indent=4))
|
|
with open(file, 'w', encoding='utf-8') as f:
|
|
json.dump(liste_chaine, f, indent=4)
|
|
|
|
def geturlprogrammetv(strsearch):
|
|
strsearch=unicodedata.normalize('NFD', strsearch).encode('ascii', 'ignore')
|
|
strsearch=strsearch.decode("utf-8")
|
|
strsearch=strsearch.replace(" ","+")
|
|
return "https://www.programme-tv.net/rechercher?q="+strsearch
|
|
|
|
|
|
def parse_emmission(URL):
|
|
try:
|
|
response = urllib.request.urlopen(URL)
|
|
except urllib.error.URLError:
|
|
return False
|
|
|
|
html = response.read()
|
|
parse=BeautifulSoup(html,"html.parser")
|
|
link=parse.select_one(".prog_name")
|
|
if link == None:
|
|
return "can't find show"
|
|
href="https://www.programme-tv.net"+link['href']
|
|
response = urllib.request.urlopen(href)
|
|
html = response.read()
|
|
parse=BeautifulSoup(html,"html.parser")
|
|
divcasting=parse.select_one(".descriptif")
|
|
casting=divcasting.find_all(href=re.compile("biographie"))
|
|
i=0
|
|
for actor in casting:
|
|
casting[i]=actor.text
|
|
i+=1
|
|
divsynopsis=parse.select_one(".episode-synopsis")
|
|
img=divsynopsis.find_next('img')['data-src']
|
|
synopsis=divsynopsis.select_one(".d-b").text
|
|
print(type(synopsis))
|
|
print(remove_first_space(str(synopsis)))
|
|
return {'title':link['title'],'href':href,'casting':casting,'synopsis':synopsis,'img':img}
|
|
|
|
|
|
def remove_first_space (string):
|
|
space_number=0
|
|
for char in string:
|
|
print(char)
|
|
if char == " ":
|
|
space_number+=1
|
|
else:
|
|
print(char)
|
|
break
|
|
print(space_number)
|
|
|
|
return string[space_number:]
|
|
|
|
print(remove_first_space(" Joséphine apparaît dans un parc zoologique. Elle se fait embaucher comme soigneuse après avoir eu quelques frayeurs face à un lion échappé de son enclos. L'ange gardien rencontre Clara Lorenz, la nouvelle directrice des lieux. Joséphine ne tarde pas à comprendre que la jeune femme ne semble guère se plaire ici : elle succède à son père décédé il y a deux mois et avec qui elle n'était pas en bons termes."))
|
|
|
|
def cli(num):
|
|
datafilepath=os.path.dirname(os.path.realpath(__file__))+"/chaine.json"
|
|
data = load_jsonfile(datafilepath)
|
|
print(num)
|
|
try:
|
|
print(data[num])
|
|
except KeyError:
|
|
print("numero de chaine inconnue")
|
|
return
|
|
emision=parse_emmission(geturlprogrammetv(data[num]))
|
|
if emision:
|
|
if emision == "can't find show":
|
|
print ("impssible de parser cette chaine")
|
|
else:
|
|
print("emmision ce soir: "+emision["title"])
|
|
if len(emision['casting']) > 0:
|
|
print("réalisateur: "+emision['casting'][0])
|
|
print("acteur: "+str(emision['casting'][1:]))
|
|
print("synopsys: " +emision['synopsis'])
|
|
print("lien: "+emision['href'])
|
|
|
|
else:
|
|
print("pas de connection internet impossible de determiner l'émission du soir")
|
|
print("")
|
|
if len(sys.argv) > 1:
|
|
for i in sys.argv[1:]:
|
|
if i =="update":
|
|
parsechaine(os.path.dirname(os.path.realpath(__file__))+"/chaine.json")
|
|
else:
|
|
cli(i)
|
|
else:
|
|
Interface().mainloop()
|
|
|
|
|