ADO2VMCrawler/selenium_crawler/config.json

51 lines
1.2 KiB
JSON

{
"crawler": {
"max_blogs": 2,
"default_search_query": "선돌막국수"
},
"image_filter": {
"min_width": 400,
"min_height": 400,
"min_file_size_kb": 10,
"max_file_size_mb": 10,
"require_both_dimensions": false,
"allowed_formats": [
".jpg",
".jpeg",
".png",
".webp"
]
},
"paths": {
"project_dir_linux": "/data/crawler"
},
"webdriver": {
"headless": false,
"window_size": "1920,1080",
"page_load_timeout": 20,
"implicit_wait": 5,
"user_agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36"
},
"loading_delays": {
"initial_page_load": 3,
"after_search": 5,
"iframe_wait": 2,
"search_result_wait": 3,
"place_detail_wait": 3,
"dynamic_wait": {
"enabled": true,
"check_interval": 0.5,
"max_wait": 15,
"elements_to_check": [
".GHAhO",
".place_name",
"span.LDgIH"
]
}
},
"logging": {
"console_level": "INFO",
"file_level": "DEBUG",
"log_format": "%(asctime)s - %(name)s - %(levelname)s - %(message)s"
}
}