return tracking of corefork

This commit is contained in:
Il'ya (Marshal) 2021-09-09 20:43:53 +02:00
parent 4a72253936
commit 58e3417baa

View file

@ -14,7 +14,7 @@ PROTOCOL = 'https://'
BASE_URL = 'telegram.org'
# it's necessary to help the crawler find more links
HIDDEN_URLS = {
# 'corefork.telegram.org',
'corefork.telegram.org',
'telegram.org/privacy/gmailbot',
'telegram.org/tos',
@ -77,6 +77,17 @@ CRAWL_RULES = {
'validatedRequestedInfo',
},
},
'corefork.telegram.org': {
'deny': {
'file/',
'bots/payments',
'tdlib/docs/classtd',
'validatedRequestedInfo',
},
},
'telegram.org': {
'deny': {
'file/',