@pi0
Last active October 2, 2017 22:15
Fully working crawler using wget
wget -nv -t3 -c -nH -r -l0 -k -p -np -e robots=off --reject-regex "\/\?(.*)" [url]
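The same command spelled out with long option names; this form also adds --retry-connrefused, so that flaky hosts are retried as well: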
wget \
--no-verbose \
--tries=3 \
--continue \
--retry-connrefused \
--no-host-directories \
--recursive \
--level 0 \
--convert-links \
--page-requisites \
--no-parent \
-e robots=off \
--reject-regex "\/\?(.*)" \
[url]
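For reference, a quick gloss of each flag, per the wget manual:

# --no-verbose           terse output (errors and basic info only)
# --tries=3              retry each URL up to 3 times
# --continue             resume partially-downloaded files
# --retry-connrefused    treat "connection refused" as transient and retry
# --no-host-directories  don't prefix saved paths with the host name
# --recursive            follow links and download recursively
# --level 0              unlimited recursion depth
# --convert-links        rewrite links in saved pages to point at local copies
# --page-requisites      also fetch the assets (CSS, images) each page needs
# --no-parent            never ascend above the starting directory
# -e robots=off          ignore robots.txt
# --reject-regex         skip URLs matching the regex; "\/\?(.*)" rejects
#                        query strings that directly follow a slash (e.g.
#                        Apache index sort links like /?C=N;O=D)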
# fix_names.sh: rename files like foo.eot?v=4.2.0 to foo.eot
# (handles spaces in names; assumes no newlines in file names)
find . -name "*\?*" | while IFS= read -r f; do
  mv -v "$f" "${f%%\?*}"
done
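Run it from the mirror root; with GNU mv the output looks roughly like this (the path here is illustrative):

$ sh fix_names.sh
'./fonts/fontawesome-webfont.eot?v=4.2.0' -> './fonts/fontawesome-webfont.eot'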

pi0 commented Oct 2, 2017

Some notes:

  • For an IE fix, stylesheets usually reference fonts with a fake query parameter, e.g. fontawesome-webfont.eot?v=4.2.0. We need wget to crawl such URLs too, while still skipping directory-listing sort parameters, so the reject-regex is deliberately permissive: "\/\?(.*)" only rejects URLs where the query string directly follows a slash. To strictly prevent crawling any URL with a query string, use "(.*)\?(.*)" instead (see the sketch after these notes). fix_names.sh then removes the leftover query strings from file names.

  • The --adjust-extension (-E) flag is optional. It can be useful for sites that serve friendly URLs without a .html extension, but use it with caution: it may also misbehave, e.g. appending .html to CSS files (second sketch below).
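A minimal sketch of the strict variant from the first note; [url] stays a placeholder and the remaining flags match the command above:

wget --no-verbose --tries=3 --continue --retry-connrefused \
  --no-host-directories --recursive --level 0 --convert-links \
  --page-requisites --no-parent -e robots=off \
  --reject-regex "(.*)\?(.*)" \
  [url]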

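And the same command with --adjust-extension added, everything else unchanged; after the crawl, verify that no CSS or font files were renamed to .html:

wget --no-verbose --tries=3 --continue --retry-connrefused \
  --no-host-directories --recursive --level 0 --convert-links \
  --page-requisites --no-parent --adjust-extension -e robots=off \
  --reject-regex "\/\?(.*)" \
  [url]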