diff options
author | Frederick Muriuki Muriithi | 2022-08-12 14:34:02 +0300 |
---|---|---|
committer | Frederick Muriuki Muriithi | 2022-08-12 14:34:02 +0300 |
commit | 3cfd0ec3d38f4b460817606ea5d6749a1a85a1ea (patch) | |
tree | f9c4a1fe1a7ac6f91268d5f5a8889514f70aeac5 /test/requests/link_checker.py | |
parent | 30ec1cec4c2ddf878131dbc48b36373a93cb8148 (diff) | |
download | genenetwork2-3cfd0ec3d38f4b460817606ea5d6749a1a85a1ea.tar.gz |
Update to newer lxml API
Diffstat (limited to 'test/requests/link_checker.py')
-rw-r--r-- | test/requests/link_checker.py | 5 |
1 files changed, 3 insertions, 2 deletions
diff --git a/test/requests/link_checker.py b/test/requests/link_checker.py
index feae6526..86222254 100644
--- a/test/requests/link_checker.py
+++ b/test/requests/link_checker.py
@@ -1,6 +1,6 @@
 import re
 import requests
-from lxml.html import parse
+from lxml.html import document_fromstring
 from requests.exceptions import ConnectionError
 
 DO_FAIL=False # fail on error
@@ -66,7 +66,8 @@ def verify_static_file(link):
 def check_page(host, start_url):
     print("")
     print("Checking links host "+host+" in page `"+start_url+"`")
-    doc = parse(start_url).getroot()
+    req = requests.get(start_url)
+    doc = document_fromstring(start_url)
     links = get_links(doc)
     in_page_links = list(filter(is_in_page_link, links))
     internal_links = list(filter(is_internal_link, links))