28 lines
886 B
Python
28 lines
886 B
Python
# -*- coding: utf-8 -*-
|
|
|
|
import re
|
|
import urllib
|
|
|
|
from core import httptools
|
|
from core import scrapertools
|
|
from platformcode import logger
|
|
|
|
|
|
def get_video_url(page_url, premium=False, user="", password="", video_password=""):
|
|
logger.info("(page_url='%s')" % page_url)
|
|
page_url = page_url.replace("amp;", "")
|
|
data = httptools.downloadpage(page_url).data
|
|
logger.info("data=" + data)
|
|
video_urls = []
|
|
patron = "video_src.*?(http.*?)%22%2C%22video_timestamp"
|
|
matches = re.compile(patron, re.DOTALL).findall(data)
|
|
scrapertools.printMatches(matches)
|
|
for match in matches:
|
|
videourl = match
|
|
videourl = videourl.replace('%5C', '')
|
|
videourl = urllib.unquote(videourl)
|
|
video_urls.append(["[facebook]", videourl])
|
|
for video_url in video_urls:
|
|
logger.info("%s - %s" % (video_url[0], video_url[1]))
|
|
return video_urls
|