mirror of
https://github.com/MarshalX/telegram-crawler.git
synced 2025-03-15 13:22:43 +01:00
return tracking of corefork
This commit is contained in:
parent
4a72253936
commit
58e3417baa
1 changed file with 12 additions and 1 deletion
|
@ -14,7 +14,7 @@ PROTOCOL = 'https://'
|
|||
BASE_URL = 'telegram.org'
|
||||
# it's necessary to help the crawler find more links
|
||||
HIDDEN_URLS = {
|
||||
# 'corefork.telegram.org',
|
||||
'corefork.telegram.org',
|
||||
|
||||
'telegram.org/privacy/gmailbot',
|
||||
'telegram.org/tos',
|
||||
|
@ -77,6 +77,17 @@ CRAWL_RULES = {
|
|||
'validatedRequestedInfo',
|
||||
},
|
||||
},
|
||||
'corefork.telegram.org': {
|
||||
'deny': {
|
||||
'file/',
|
||||
|
||||
'bots/payments',
|
||||
|
||||
'tdlib/docs/classtd',
|
||||
|
||||
'validatedRequestedInfo',
|
||||
},
|
||||
},
|
||||
'telegram.org': {
|
||||
'deny': {
|
||||
'file/',
|
||||
|
|
Loading…
Add table
Reference in a new issue