[utils] Recognize more patterns in strip_jsonp()

Used in Youku Show pages
This commit is contained in:
Yen Chi Hsuan 2017-05-26 21:58:18 +08:00
parent 59ed87cbd9
commit 5552c9eb0f
No known key found for this signature in database
GPG key ID: 7F902A182457CA23
3 changed files with 15 additions and 1 deletions

View file

@ -2211,7 +2211,12 @@ def parse_age_limit(s):
def strip_jsonp(code):
return re.sub(
r'(?s)^[a-zA-Z0-9_.$]+\s*\(\s*(.*)\);?\s*?(?://[^\n]*)*$', r'\1', code)
r'''(?sx)^
(?:window\.)?(?P<func_name>[a-zA-Z0-9_.$]+)
(?:\s*&&\s*(?P=func_name))?
\s*\(\s*(?P<callback_data>.*)\);?
\s*?(?://[^\n]*)*$''',
r'\g<callback_data>', code)
def js_to_json(code):