def mainlist(item):
    """Build the root menu of the channel.

    Logs the call, then returns a list containing a single ``Item`` for
    the "Video di Viaggi" entry. That entry carries the channel taken
    from ``item``, has its action set to ``"peliculas"``, and points at
    the ``/video-vacanze-viaggi/`` page under ``host``.

    :param item: the calling item; only its ``channel`` attribute is read.
    :return: a one-element list with the menu entry.
    """
    logger.info("kod.ilgiramondo mainlist")

    travel_videos = Item(
        channel=item.channel,
        title="[COLOR azure]Video di Viaggi[/COLOR]",
        action="peliculas",
        url=host + "/video-vacanze-viaggi/",
        thumbnail="http://hotelsjaisalmer.com/wp-content/uploads/2016/10/Travel1.jpg",
    )
    return [travel_videos]
]+>
\s*]+><\/a>' matches = re.compile(patron, re.DOTALL).findall(data) scrapertools.printMatches(matches) for scrapedurl, scrapedthumbnail in matches: html = httptools.downloadpage(scrapedurl).data start = html.find("
") end = html.find("

", start) scrapedplot = html[start:end] scrapedplot = re.sub(r'<[^>]*>', '', scrapedplot) scrapedplot = scrapertools.decodeHtmlentities(scrapedplot) html = httptools.downloadpage(scrapedurl).data start = html.find("") end = html.find("", start) scrapedtitle = html[start:end] scrapedtitle = re.sub(r'<[^>]*>', '', scrapedtitle) scrapedtitle = scrapedtitle.replace(" | Video Di Viaggi E Vacanze", "") # scrapedplot = "" itemlist.append(Item(channel=item.channel, action="findvideos", fulltitle=scrapedtitle, show=scrapedtitle, title=scrapedtitle, url=scrapedurl, thumbnail=scrapedthumbnail, plot=scrapedplot, folder=True)) # Paginazione patronvideos = '