This commit is contained in:
table 2025-08-04 23:02:05 +00:00
parent 6790061e22
commit f7a3ca8fd7
3 changed files with 6 additions and 8 deletions

View File

@@ -6,9 +6,7 @@ surreal_ns = "test"
surreal_db = "v1.21.1"
# Crawler config
# crawl_filter = "https://ftpgeoinfo.msl.mt.gov/Data/Spatial/MSDI/Imagery/2023_NAIP/UTM_County_Mosaics/"
crawl_filter = "https://oliveratkinson.net"
# start_url = "https://ftpgeoinfo.msl.mt.gov/Data/Spatial/MSDI/Imagery/2023_NAIP/UTM_County_Mosaics/"
start_url = "https://oliveratkinson.net"
budget = 1000
batch_size = 500
crawl_filter = "https://ftpgeoinfo.msl.mt.gov/Data/Spatial/MSDI"
start_url = "https://ftpgeoinfo.msl.mt.gov/Data/Spatial/MSDI"
budget = 10000
batch_size = 50

View File

@@ -7,7 +7,7 @@ scrape_configs:
static_configs:
# Change this to your machine's IP address; localhost won't work
# because localhost refers to the Docker container itself.
- targets: ['172.20.239.48:2500']
- targets: ['192.168.1.200:2500']
#- targets: ['192.168.8.209:2500']
- job_name: loki
static_configs:

View File

@@ -275,7 +275,7 @@ async fn get_uncrawled_links(
count = config.batch_size;
}
debug!("Getting uncrawled links");
debug!("Getting {} uncrawled links", count);
let mut response = db
.query("SELECT * FROM website WHERE crawled = false AND site ~ type::string($format) LIMIT $count;")