mirror of
				https://github.com/zulip/zulip.git
				synced 2025-11-04 05:53:43 +00:00 
			
		
		
		
	documentation_crawler: Consider status.zulip.com external.
Signed-off-by: Anders Kaseorg <anders@zulip.com>
This commit is contained in:
		
				
					committed by
					
						
						Tim Abbott
					
				
			
			
				
	
			
			
			
						parent
						
							6c857eb645
						
					
				
				
					commit
					89b3129d48
				
			@@ -80,11 +80,14 @@ class BaseDocumentationSpider(scrapy.Spider):
 | 
				
			|||||||
 | 
					
 | 
				
			||||||
    def _is_external_link(self, url: str) -> bool:
 | 
					    def _is_external_link(self, url: str) -> bool:
 | 
				
			||||||
        split_url = urlsplit(url)
 | 
					        split_url = urlsplit(url)
 | 
				
			||||||
        if split_url.hostname == "chat.zulip.org":
 | 
					        if split_url.hostname in ("chat.zulip.org", "status.zulip.com"):
 | 
				
			||||||
            # Since most chat.zulip.org URLs will be links to specific
 | 
					            # Since most chat.zulip.org URLs will be links to specific
 | 
				
			||||||
            # logged-in content that the spider cannot verify, or the
 | 
					            # logged-in content that the spider cannot verify, or the
 | 
				
			||||||
            # homepage, there's no need to check those (which can
 | 
					            # homepage, there's no need to check those (which can
 | 
				
			||||||
            # cause errors when chat.zulip.org is being updated).
 | 
					            # cause errors when chat.zulip.org is being updated).
 | 
				
			||||||
 | 
					            #
 | 
				
			||||||
 | 
					            # status.zulip.com is externally hosted and, in a peculiar twist of
 | 
				
			||||||
 | 
					            # cosmic irony, often itself offline.
 | 
				
			||||||
            return True
 | 
					            return True
 | 
				
			||||||
        if split_url.hostname == "zulip.readthedocs.io" or f".{split_url.hostname}".endswith(
 | 
					        if split_url.hostname == "zulip.readthedocs.io" or f".{split_url.hostname}".endswith(
 | 
				
			||||||
            (".zulip.com", ".zulip.org")
 | 
					            (".zulip.com", ".zulip.org")
 | 
				
			||||||
 
 | 
				
			|||||||
		Reference in New Issue
	
	Block a user