239 lines
9.4 KiB
Python
239 lines
9.4 KiB
Python
# -*- coding: utf-8 -*-
# ------------------------------------------------------------
# Channel for cineblog01
# ------------------------------------------------------------
|
|
import datetime
|
|
import re
|
|
|
|
from core import scrapertools, httptools, servertools, support
|
|
from platformcode import logger, config
|
|
|
|
|
|
# def findhost(url):
|
|
# host = httptools.downloadpage(url, follow_redirect=True).url
|
|
# if host == 'https://cb01.uno/':
|
|
# host = support.match(host, patron=r'<a href="([^"]+)').match
|
|
# return host
|
|
|
|
|
|
# Base URL of this channel, as returned by config.get_channel_url().
host = config.get_channel_url()

# Default request headers: the Referer is the channel's own base URL.
headers = [['Referer', host]]
|
|
|
|
|
|
@support.menu
def mainlist(item):
    """Declare the entries of the channel's main menu.

    The function only defines the ``film``, ``tvshow`` and ``docu`` lists and
    returns ``locals()``; the ``support.menu`` decorator receives that mapping.
    The local names are therefore part of the contract and must not be renamed.

    Entries appear to follow the shape ``(label, [path, action, args])`` --
    TODO confirm against ``support.menu``.
    """
    film = [
        ('HD', ['', 'menu', 'Film HD Streaming']),
        ('Generi', ['', 'menu', 'Film per Genere']),
        ('Anni', ['', 'menu', 'Film per Anno']),
        ('Paese', ['', 'menu', 'Film per Paese']),
        ('Ultimi Aggiornati', ['/lista-film-ultimi-100-film-aggiornati/', 'peliculas', 'newest']),
        ('Ultimi Aggiunti', ['/lista-film-ultimi-100-film-aggiunti/', 'peliculas', 'newest'])
    ]

    # The first element is a bare path string, followed by the sub-entries.
    tvshow = [
        '/serietv/',
        ('Per Lettera', ['/serietv/', 'menu', 'Serie-Tv per Lettera']),
        ('Per Genere', ['/serietv/', 'menu', 'Serie-Tv per Genere']),
        ('Per anno', ['/serietv/', 'menu', 'Serie-Tv per Anno']),
        ('Ultime Aggiornate', ['/serietv/', 'peliculas', 'newest'])
    ]

    docu = [
        ('Documentari {bullet bold}', ['/category/documentario/', 'peliculas']),
        ('HD {submenu} {documentari}', ['/category/hd-alta-definizione/documentario-hd/', 'peliculas'])
    ]

    return locals()
|
|
|
|
|
|
@support.scrape
def menu(item):
    """Describe how to scrape a sub-menu (genres, years, countries, ...).

    ``item.args`` is used as the literal prefix of the block pattern, so it is
    expected to be the heading text of the wanted list (``mainlist`` passes
    values such as 'Film per Genere'). Every link found inside the block is
    given the ``peliculas`` action.

    The patterns are returned through ``locals()`` to the ``support.scrape``
    decorator, so the local names must stay as they are.
    """
    # Heading text, then the first <ul> that follows its <span>.
    patronBlock = item.args + r'<span.*?><\/span>.*?<ul.*?>(?P<block>.*?)<\/ul>'

    # One anchor per menu entry; quotes around href are optional.
    patronMenu = r'href="?(?P<url>[^">]+)"?>(?P<title>.*?)<\/a>'

    action = 'peliculas'

    return locals()
|
|
|
|
|
|
def newest(categoria):
    """Return the "latest" listing for the requested category.

    ``categoria`` equal to ``"series"`` points the item at the TV-series page;
    any other value points it at the "last 100 added films" page. The item is
    then handed to ``peliculas``.

    Returns whatever ``peliculas`` returns, or an empty list when an error
    occurs: the exception info is logged and the caller can carry on.
    """
    support.info(categoria)

    item = support.Item()
    try:
        if categoria == "series":
            item.contentType = 'tvshow'
            item.url = host + '/serietv/'  # aggiornamento-quotidiano-serie-tv/'
        else:
            item.contentType = 'movie'
            item.url = host + '/lista-film-ultimi-100-film-aggiunti/'
            # NOTE(review): the original indentation was lost; this assignment
            # is assumed to belong to the movie branch only -- confirm.
            item.args = "newest"
        return peliculas(item)
    # Keep the global search going on error. Exception (rather than a bare
    # except) lets SystemExit / KeyboardInterrupt propagate.
    except Exception:
        import sys
        for line in sys.exc_info():
            logger.error("{0}".format(line))
        return []
|
|
|
|
|
|
def search(item, text):
    """Search the site for ``text`` and return the matching items.

    TV-show searches are rooted at ``host + '/serietv'``; everything else is
    rooted at ``host``. Spaces in ``text`` are replaced with ``+`` and the
    resulting ``/search/`` URL is handed to ``peliculas``.

    Returns whatever ``peliculas`` returns, or an empty list when an error
    occurs: the exception info is logged and the caller can carry on.
    """
    logger.info("search", text)

    if item.contentType == 'tvshow':
        item.url = host + '/serietv'
    else:
        item.url = host

    try:
        item.url = item.url + "/search/" + text.replace(' ', '+')
        return peliculas(item)
    # Keep the global search going on error. Exception (rather than a bare
    # except) lets SystemExit / KeyboardInterrupt propagate.
    except Exception:
        import sys
        for line in sys.exc_info():
            logger.error("%s" % line)
        return []
|
|
|
|
@support.scrape
def peliculas(item):
    """Describe how to scrape a listing page of films or TV series.

    Four page layouts are handled, selected from ``item.args`` and
    ``item.url``:

    * "newest" films    -> entries of the "Ultimi 100 film" table
    * "newest" series   -> entries of the "Ultime SerieTv aggiornate" block
    * regular film page -> film cards, action ``findvideos``
    * regular series    -> series cards, action ``episodios``

    The patterns and settings are returned through ``locals()`` to the
    ``support.scrape`` decorator, so the local names must stay as they are.
    """
    # Titles of "service" posts that must not be listed as content.
    curYear = datetime.date.today().year
    blacklist = ['BENVENUTI', 'Richieste Serie TV', 'CB01.UNO ▶ TROVA L’INDIRIZZO UFFICIALE ',
                 'Aggiornamento Quotidiano Serie TV',
                 'Openload: la situazione. Benvenuto Verystream', 'Openload: lo volete ancora?',
                 'OSCAR ' + str(curYear) + ' ▶ VOTA IL TUO FILM PREFERITO! 🎬',
                 'Auguri di Buon Natale e Felice Anno Nuovo! – ' + str(curYear) + '!']
    # debug = True

    if 'newest' in item.args and '/serietv/' not in item.url:
        # "Last 100 films" table: plain anchors "Title [lang] [quality] (year)".
        # debug = True
        pagination = ''  # presumably read by support.scrape -- TODO confirm
        patronBlock = r'Ultimi 100 film [^:]+:(?P<block>.*?)<\/td>'
        patron = r'<a href="?(?P<url>[^">]+)"?>(?P<title>[^<([]+)(?:\[(?P<lang>Sub-ITA|B/N|SUB-ITA)\])?\s*(?:\[(?P<quality>HD|SD|HD/3D)\])?\s*\((?P<year>[0-9]{4})\)<\/a>'
        action = 'findvideos'

    elif 'newest' in item.args:
        # "Latest updated series" block on the series page.
        patronBlock = r'Ultime SerieTv aggiornate(?P<block>.*?)Lista'
        patron = r'src=(?:")?(?P<thumb>[^ "]+)(?:")? alt=(?:")?(?P<title>.*?)(?: – \d+×\d+)?(?:>|"| – )(?:(?P<lang>Sub-ITA|ITA))?[^>]*>.*?<a href=(?:")?(?P<url>[^" ]+)(?:")?.*?rpwe-summary[^>]*>(?P<genre>[^\(]*)\((?P<year>\d{4})[^\)]*\) (?P<plot>[^<]+)<'
        action = 'episodios'

    elif '/serietv/' not in item.url:
        # Regular film listing: one "card-image" per film.
        patron = r'<div class="card-image">\s*<a[^>]+>\s*<img src="(?P<thumb>[^" ]+)" alt[^>]+>[^>]+>[^>]+>[^>]+>[^>]+>[^>]+><a href="?(?P<url>[^" >]+)(?:\/|"|\s+)>(?P<title>[^<[(]+)(?:\[(?P<quality>[A-Za-z0-9/-]+)])? (?:\((?P<year>[0-9]{4})\))?[^>]+>[^>]+>[^>]+>[^>]+>[^>]+>(?P<genre>[^<>&âÃÂÖ]+)(?:[^ ]+\s*DURATA\s*(?P<duration>[0-9]+)[^>]+>[^>]+>[^>]+>(?P<plot>[^<>]+))?'
        action = 'findvideos'

    else:
        # Regular series listing: one "card-image" per series.
        patron = r'card-image[^>]*>\s*<a href=(?:")?(?P<url>[^" >]+)(?:")?\s*>\s*<img src=(?:")?(?P<thumb>[^" ]+)(?:")? alt="(?P<title>.*?)(?: – \d+×\d+)?(?:"| – )(?:(?P<lang>Sub-ITA|ITA))?[^>]*>[^>]+>[^>]+>[^>]*>[^>]+>[^>]+>[^>]*>[^>]+>[^>]+>[^>]*>[^>]+>[^>]+>[^>]*>(?P<genre>[^\(]+)\((?P<year>\d{4})[^>]*>[^>]+>[^>]+>[^>]+>(?:<p>)?(?P<plot>[^<]+)'
        action = 'episodios'
        item.contentType = 'tvshow'

    # Link to the next page of results.
    patronNext = '<a class="?page-link"? href="?([^>"]+)"?><i class="fa fa-angle-right">'

    return locals()
|
|
|
|
|
|
@support.scrape
def episodios(item):
    """Describe how to scrape the episode list of a TV series page.

    The page is downloaded once. If it advertises a "TUTTA LA/LE ..." folder
    link, the nested ``folder`` scraper is run on it and its items are appended
    after the regular episodes. Episodes are grouped per season block
    (``patronBlock``) and extracted with ``patron``; ``itemlistHook`` then
    de-duplicates and sorts them.

    The patterns, hooks and data are returned through ``locals()`` to the
    ``support.scrape`` decorator, so the local names must stay as they are.
    """
    @support.scrape
    def folder(item, data):
        """
        Handle a link to a vcrypt folder that contains several seasons.
        """
        actLike = 'episodios'
        addVideolibrary = False
        downloadEnabled = False

        folderUrl = scrapertools.find_single_match(data, r'TUTTA L[EA] \w+\s+(?:–|-)\s+<a href="?([^" ]+)').replace(
            '.net/', '.pw/')  # vcrypt.pw is not behind CF
        data = httptools.downloadpage(folderUrl, disable_directIP=True).data
        patron = r'><a href="(?P<url>[^"]+)[^>]+>(?P<title>[^<]+)'
        sceneTitle = True

        def itemHook(item):
            # Flag the item so findvideos treats its url as the data to resolve.
            item.serieFolder = True
            return item
        return locals()

    # debug=True
    data = support.match(item.url, headers=headers).data
    folderItemlist = folder(item, data) if '<p>TUTTA L' in data else []

    # One block per season header ("STAGIONE n - LANG [- QUALITY]" or MINISERIE).
    patronBlock = r'(?P<block>sp-head[^>]+>\s*(?:STAGION[EI]\s*(?:DA\s*[0-9]+\s*A)?\s*[0-9]+|MINISERIE) - (?P<lang>[^-<]+)(?:- (?P<quality>[^-<]+))?.*?<\/div>.*?)spdiv[^>]*>'
    # One match per episode line; the whole line is kept in the "other" group.
    patron = r'(?:/>|<p>|<strong>)(?P<other>.*?(?P<episode>[0-9]+(?:×|ÃÂ)[0-9]+)\s*(?P<title2>.*?)?(?:\s*–|\s*-|\s*<).*?)(?:<\/p>|<br)'

    def itemlistHook(itemlist):
        # Episodes keyed by their number with the "x" removed.
        by_number = {}
        for entry in itemlist:
            entry.url = item.url
            entry.title = re.sub(r'\.(\D)', ' \\1', entry.title)
            number = support.match(entry.title, patron=r'(\d+.\d+)').match.replace('x', '')
            entry.order = number

            if number not in by_number:
                by_number[number] = entry
                continue

            known = by_number[number]
            # Same episode if the languages agree, or one side is 'ITA' and
            # the other side has no language set.
            same_episode = (
                entry.contentLanguage == known.contentLanguage
                or (entry.contentLanguage == 'ITA' and not known.contentLanguage)
                or (known.contentLanguage == 'ITA' and not entry.contentLanguage)
            )
            if same_episode:
                known.url = entry.url
            else:
                # Different language: keep both, under a derived key.
                by_number[number + '1'] = entry

        # Sort by language first, then by numeric episode order.
        ordered = sorted(by_number.values(), key=lambda it: (it.contentLanguage, int(it.order)))

        # Folder items (if any) go after the regular episodes.
        ordered.extend(folderItemlist)

        return ordered
    return locals()
|
|
|
|
|
|
def findvideos(item):
    """Collect the playable links of a film page.

    Items flagged with ``serieFolder`` are resolved directly from their url
    through ``support.server``; episode items are delegated to
    ``findvid_serie``. For films, the page is downloaded and the "Streaming",
    "Streaming HD" and "Streaming 3D" sections are scanned for links.

    Returns the item list produced by ``support.server``.
    """
    if item.serieFolder:
        return support.server(item, data=item.url)
    if item.contentType == "episode":
        return findvid_serie(item)

    logger.debug()

    itemlist = []

    # Load the page and drop newlines/tabs so the section regexes can span lines.
    data = httptools.downloadpage(item.url).data
    data = re.sub('\n|\t', '', data)

    def load_links(itemlist, re_txt, desc_txt, quality=""):
        """Append one "play" item per link found in the section matched by re_txt."""
        streaming = scrapertools.find_single_match(data, re_txt).replace('"', '')
        logger.debug('STREAMING=', streaming)
        matches = support.match(streaming, patron=r'<td><a.*?href=([^ ]+) [^>]+>([^<]+)<').matches
        for scrapedurl, scrapedtitle in matches:
            logger.debug("##### findvideos %s ## %s ## %s ##" % (desc_txt, scrapedurl, scrapedtitle))
            itemlist.append(item.clone(action="play", title=scrapedtitle, url=scrapedurl, server=scrapedtitle, quality=quality))

    # Extract the contents - Streaming
    load_links(itemlist, '<strong>Streamin?g:</strong>(.*?)cbtable', "Streaming", "SD")

    # Extract the contents - Streaming HD
    load_links(itemlist, '<strong>Streamin?g HD[^<]+</strong>(.*?)cbtable', "Streaming HD", "HD")

    # Extract the contents - Streaming 3D
    load_links(itemlist, '<strong>Streamin?g 3D[^<]+</strong>(.*?)cbtable', "Streaming 3D")

    itemlist = support.server(item, itemlist=itemlist)

    # Extract the quality format
    patronvideos = r'([\w.]+)</strong></div></td>'
    support.addQualityTag(item, itemlist, data, patronvideos)

    return itemlist
|
|
|
|
# Estrae i contenuti - Download
|
|
# load_links(itemlist, '<strong>Download:</strong>(.*?)<tableclass=cbtable height=30>', "aqua", "Download")
|
|
|
|
# Estrae i contenuti - Download HD
|
|
# load_links(itemlist, '<strong>Download HD[^<]+</strong>(.*?)<tableclass=cbtable width=100% height=20>', "azure", "Download HD")
|
|
|
|
|
|
def findvid_serie(item):
    """Resolve the servers of a single episode.

    The episode's HTML fragment is read from ``item.other``. The leading
    episode label (optional ``<p>``/``<strong>``, the "NxM" number and the text
    up to the next tag) is stripped, and the remainder is handed to
    ``support.server`` as the data to scan.
    """
    logger.debug()

    episode_label = r'((?:<p>|<strong>)?[^\d]*\d*(?:×|Ã)[0-9]+[^<]+)'
    links_html = re.sub(episode_label, '', item.other)

    return support.server(item, data=links_html)
|
|
|
|
|
|
def play(item):
    """Return the video items found by ``servertools`` when given ``item.url`` as data."""
    logger.debug()
    video_items = servertools.find_video_items(item, data=item.url)
    return video_items
|