From b62c1424fabeadd4a2bea677efd0fc6aaada2e6a Mon Sep 17 00:00:00 2001 From: _ <_@_> Date: Mon, 21 Dec 2020 22:16:12 -0600 Subject: [PATCH] :pencil: docs: document wget spidering --- .gitignore | 2 +- issues/2020-12Dec/auth-route-YNQAQKJS.md | 22 ++++++++++++++++++++++ 2 files changed, 23 insertions(+), 1 deletion(-) diff --git a/.gitignore b/.gitignore index a688c68..b6935cc 100644 --- a/.gitignore +++ b/.gitignore @@ -3,5 +3,5 @@ /ptth_server.toml /ptth_relay.toml /ptth_build_L6KLMVS6/ +/scraper-secret.txt /target - diff --git a/issues/2020-12Dec/auth-route-YNQAQKJS.md b/issues/2020-12Dec/auth-route-YNQAQKJS.md index b490601..63bf70c 100644 --- a/issues/2020-12Dec/auth-route-YNQAQKJS.md +++ b/issues/2020-12Dec/auth-route-YNQAQKJS.md @@ -61,6 +61,28 @@ e.g. `0..3` means "0, 1, 2, 3". So 100-199 means 199 is the last byte retrieved. By polling with HEAD and byte range requests, a scraper client can approximate `tail -f` behavior of a server-side file. +`wget --continue --execute robots=off --no-parent --recursive --header "$(