Fix folder location bug: point URLS_FILES_DIRECTORY at /opt/cdxfiles/urls_tophosts
This commit is contained in:
parent
7b4651b07e
commit
27a2b56936
@@ -8,7 +8,7 @@ from urllib.parse import urlparse
|
|||||||
|
|
||||||
# Define constants
|
# Define constants
|
||||||
URLS_DIRECTORY = "/opt/cdxfiles/urls"
|
URLS_DIRECTORY = "/opt/cdxfiles/urls"
|
||||||
URLS_FILES_DIRECTORY = "/opt/cdxfiles/urls_files"
|
URLS_FILES_DIRECTORY = "/opt/cdxfiles/urls_tophosts"
|
||||||
ROOT_DIRECTORY = "/root/urls_files"
|
ROOT_DIRECTORY = "/root/urls_files"
|
||||||
CONCURRENCY = 10
|
CONCURRENCY = 10
|
||||||
BATCH_SIZE = 10
|
BATCH_SIZE = 10
|
||||||
@@ -209,7 +209,7 @@ def main():
|
|||||||
if filename.endswith(".cdx.json"):
|
if filename.endswith(".cdx.json"):
|
||||||
directory_output_file.write(f"{filename}\n")
|
directory_output_file.write(f"{filename}\n")
|
||||||
|
|
||||||
# Process older files in /opt/cdxfiles/urls, URLS_FILES_DIRECTORY, and the ROOT_DIRECTORY
|
# Process older files in /opt/cdxfiles/urls and urls_tophosts
|
||||||
older_than_48_hours = datetime.now() - timedelta(days=2)
|
older_than_48_hours = datetime.now() - timedelta(days=2)
|
||||||
directories_to_check = [URLS_DIRECTORY, URLS_FILES_DIRECTORY]
|
directories_to_check = [URLS_DIRECTORY, URLS_FILES_DIRECTORY]
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user