mirror of
https://github.com/not-kennethreitz/markdownplease.com.git
synced 2026-06-05 23:20:19 +00:00
Merge branch 'master' of github.com:LuRsT/url2markdown
This commit is contained in:
+11
-6
@@ -7,24 +7,29 @@ from html2text import html2text
|
||||
|
||||
_READABILITY_URL = 'https://www.readability.com/api/content/v1/parser'
|
||||
|
||||
def readability(url):
|
||||
def _readability(url):
|
||||
token = os.environ.get('READABILITY_TOKEN')
|
||||
params = {'url': url, 'token': token}
|
||||
|
||||
r = requests.get(_READABILITY_URL, params=params)
|
||||
return r.json()['content'], r.json()['title']
|
||||
decoded_content = (
|
||||
r.json()['content'],
|
||||
r.json()['title'],
|
||||
)
|
||||
return decoded_content
|
||||
|
||||
def convert(html, title=None):
|
||||
def _convert(html, title=None):
|
||||
if title:
|
||||
title = '# {}'.format(title)
|
||||
html = '\n\n'.join([title, html])
|
||||
|
||||
return html2text(html)
|
||||
text_from_html = html2text(html)
|
||||
return text_from_html
|
||||
|
||||
def get_readable_content_from_url(url):
|
||||
try:
|
||||
content, title = readability(url)
|
||||
return convert(content, title=title)
|
||||
content, title = _readability(url)
|
||||
return _convert(content, title=title)
|
||||
except KeyError:
|
||||
return None
|
||||
|
||||
|
||||
@@ -18,14 +18,12 @@ def fuck_gpl3():
|
||||
type = request.args.get('type', 'markdown')
|
||||
|
||||
content = get_readable_content_from_url(url)
|
||||
print url
|
||||
|
||||
if url:
|
||||
if not content:
|
||||
return '404 Not Found', 404
|
||||
|
||||
if type == 'html':
|
||||
print url
|
||||
markdown_url_contents = _markdown_to_html(content)
|
||||
return render_template(
|
||||
'index.html',
|
||||
|
||||
Reference in New Issue
Block a user