wsgi: reuse mimetype table from crawler
This commit is contained in:
@@ -194,7 +194,7 @@ def cgi_get(environ, start_response):
|
|||||||
# get page
|
# get page
|
||||||
req = crawler.adv_get(url=url, timeout=TIMEOUT)
|
req = crawler.adv_get(url=url, timeout=TIMEOUT)
|
||||||
|
|
||||||
if req['contenttype'] in ['text/html', 'application/xhtml+xml', 'application/xml']:
|
if req['contenttype'] in crawler.MIMETYPE['html']:
|
||||||
if options['get'] == 'page':
|
if options['get'] == 'page':
|
||||||
html = readabilite.parse(req['data'], encoding=req['encoding'])
|
html = readabilite.parse(req['data'], encoding=req['encoding'])
|
||||||
html.make_links_absolute(req['url'])
|
html.make_links_absolute(req['url'])
|
||||||
|
Reference in New Issue
Block a user