mirror of
https://github.com/zulip/zulip.git
synced 2025-11-16 03:41:58 +00:00
documentation_crawler: Consider status.zulip.com external.
Signed-off-by: Anders Kaseorg <anders@zulip.com>
This commit is contained in:
committed by
Tim Abbott
parent
6c857eb645
commit
89b3129d48
@@ -80,11 +80,14 @@ class BaseDocumentationSpider(scrapy.Spider):
|
|||||||
|
|
||||||
def _is_external_link(self, url: str) -> bool:
|
def _is_external_link(self, url: str) -> bool:
|
||||||
split_url = urlsplit(url)
|
split_url = urlsplit(url)
|
||||||
if split_url.hostname == "chat.zulip.org":
|
if split_url.hostname in ("chat.zulip.org", "status.zulip.com"):
|
||||||
# Since most chat.zulip.org URLs will be links to specific
|
# Since most chat.zulip.org URLs will be links to specific
|
||||||
# logged-in content that the spider cannot verify, or the
|
# logged-in content that the spider cannot verify, or the
|
||||||
# homepage, there's no need to check those (which can
|
# homepage, there's no need to check those (which can
|
||||||
# cause errors when chat.zulip.org is being updated).
|
# cause errors when chat.zulip.org is being updated).
|
||||||
|
#
|
||||||
|
# status.zulip.com is externally hosted and, in a peculiar twist of
|
||||||
|
# cosmic irony, often itself offline.
|
||||||
return True
|
return True
|
||||||
if split_url.hostname == "zulip.readthedocs.io" or f".{split_url.hostname}".endswith(
|
if split_url.hostname == "zulip.readthedocs.io" or f".{split_url.hostname}".endswith(
|
||||||
(".zulip.com", ".zulip.org")
|
(".zulip.com", ".zulip.org")
|
||||||
|
|||||||
Reference in New Issue
Block a user