Merge branch 'master' of github.com:kennethreitz/requests-html

# Please enter a commit message to explain why this merge is necessary,
# especially if it merges an updated upstream into a topic branch.
#
# Lines starting with '#' will be ignored, and an empty message aborts
# the commit.
This commit is contained in:
2018-03-04 15:23:54 -05:00
parent 7ac299f527
commit 72a7e0be69
2 changed files with 20 additions and 1 deletions
+4 -1
View File
@@ -418,10 +418,13 @@ class HTML(BaseParser):
while True:
yield next
try:
next = next.next(fetch=True).html
next = next(next)
except AttributeError:
break
def __next__(self):
    """Fetch the following page and hand back its ``html`` attribute.

    Calls ``self.next(fetch=True)`` and returns the ``.html`` attribute of
    whatever that call produces.
    """
    # NOTE(review): if ``self.next`` yields an object without ``.html``
    # (presumably ``None`` when there is no next page -- confirm), the
    # attribute access below raises AttributeError.
    following = self.next(fetch=True)
    return following.html
def render(self, retries: int = 8, script: str = None, wait: float = 0.2, scrolldown=False, sleep: int = 0, reload: bool = True, timeout: Union[float, int] = 8.0):
"""Reloads the response in Chromium, and replaces HTML content
with an updated version, with JavaScript executed.
+16
View File
@@ -0,0 +1,16 @@
from requests_html import HTMLSession
# Module-level session shared by the test(s) below for issuing requests.
session = HTMLSession()
def test_pagination():
    """Request each listed URL and check that ``next()`` on its HTML is truthy.

    Every URL is fetched through the module-level ``session``; the test
    fails on the first page whose ``r.html`` does not yield a truthy
    value from ``next()``.
    """
    urls = (
        'https://xkcd.com/1957/',
        'https://reddit.com/',
        'https://pornhub.com/',
        'https://theverge.com/archives',
    )

    for url in urls:
        response = session.get(url)
        following = next(response.html)
        assert following