mirror of
https://github.com/MarshalX/telegram-crawler.git
synced 2025-03-15 13:22:43 +01:00
add CIDR
This commit is contained in:
parent
ad9fdc5496
commit
f9cddfdb47
1 changed files with 4 additions and 0 deletions
|
@ -24,6 +24,8 @@ HIDDEN_URLS = {
|
|||
'desktop.telegram.org/changelog',
|
||||
|
||||
'instantview.telegram.org/rules',
|
||||
|
||||
'core.telegram.org/resources/cidr.txt',
|
||||
}
|
||||
BASE_URL_REGEX = r'telegram.org'
|
||||
|
||||
|
@ -208,6 +210,8 @@ async def crawl(url: str, session: aiohttp.ClientSession):
|
|||
LINKS_TO_TRACK.add(url)
|
||||
elif 'text/css' in content_type:
|
||||
LINKS_TO_TRACK.add(url)
|
||||
elif 'text/plain' in content_type:
|
||||
LINKS_TO_TRACK.add(url)
|
||||
elif 'application/json' in content_type:
|
||||
LINKS_TO_TRACK.add(url)
|
||||
else:
|
||||
|
|
Loading…
Add table
Reference in a new issue