mirror of https://gitlab.com/bashrc2/epicyon
Saving known crawlers list
parent
12028370e5
commit
0d83ad8476
16
daemon.py
16
daemon.py
|
@ -398,10 +398,15 @@ class PubServer(BaseHTTPRequestHandler):
|
||||||
"""
|
"""
|
||||||
if self.server.knownCrawlers.get(uaStr):
|
if self.server.knownCrawlers.get(uaStr):
|
||||||
self.server.knownCrawlers[uaStr]['hits'] += 1
|
self.server.knownCrawlers[uaStr]['hits'] += 1
|
||||||
|
self.server.knownCrawlers[uaStr]['lastseen'] = \
|
||||||
|
int(time.time())
|
||||||
else:
|
else:
|
||||||
self.server.knownCrawlers[uaStr] = {
|
self.server.knownCrawlers[uaStr] = {
|
||||||
|
"lastseen": int(time.time()),
|
||||||
"hits": 1
|
"hits": 1
|
||||||
}
|
}
|
||||||
|
saveJson(self.server.knownCrawlers,
|
||||||
|
self.server.baseDir + '/accounts/knownCrawlers.json')
|
||||||
|
|
||||||
def _getInstanceUrl(self, callingDomain: str) -> str:
|
def _getInstanceUrl(self, callingDomain: str) -> str:
|
||||||
"""Returns the URL for this instance
|
"""Returns the URL for this instance
|
||||||
|
@ -17160,10 +17165,6 @@ def runDaemon(listsEnabled: str,
|
||||||
# list of blocked user agent types within the User-Agent header
|
# list of blocked user agent types within the User-Agent header
|
||||||
httpd.userAgentsBlocked = userAgentsBlocked
|
httpd.userAgentsBlocked = userAgentsBlocked
|
||||||
|
|
||||||
# dict of known web crawlers accessing nodeinfo or the masto API
|
|
||||||
# and how many times they have been seen
|
|
||||||
httpd.knownCrawlers = {}
|
|
||||||
|
|
||||||
httpd.unitTest = unitTest
|
httpd.unitTest = unitTest
|
||||||
httpd.allowLocalNetworkAccess = allowLocalNetworkAccess
|
httpd.allowLocalNetworkAccess = allowLocalNetworkAccess
|
||||||
if unitTest:
|
if unitTest:
|
||||||
|
@ -17364,6 +17365,13 @@ def runDaemon(listsEnabled: str,
|
||||||
createNewsInbox(baseDir, domain, port, httpPrefix)
|
createNewsInbox(baseDir, domain, port, httpPrefix)
|
||||||
setConfigParam(baseDir, "listsEnabled", "Murdoch press")
|
setConfigParam(baseDir, "listsEnabled", "Murdoch press")
|
||||||
|
|
||||||
|
# dict of known web crawlers accessing nodeinfo or the masto API
|
||||||
|
# and how many times they have been seen
|
||||||
|
httpd.knownCrawlers = {}
|
||||||
|
knownCrawlersFilename = baseDir + '/accounts/knownCrawlers.json'
|
||||||
|
if os.path.isfile(knownCrawlersFilename):
|
||||||
|
httpd.knownCrawlers = loadJson(baseDir + '/accounts/knownCrawlers.json')
|
||||||
|
|
||||||
if listsEnabled:
|
if listsEnabled:
|
||||||
httpd.listsEnabled = listsEnabled
|
httpd.listsEnabled = listsEnabled
|
||||||
else:
|
else:
|
||||||
|
|
Loading…
Reference in New Issue