Browse Source

Added descriptive/verbose output; save URLs to local file

master
Adrian Short 8 years ago
parent
commit
33d4bb587a
1 changed file with 12 additions and 3 deletions
  1. +12
    -3
      get.sh

+ 12
- 3
get.sh View File

@@ -8,19 +8,28 @@
# Adrian Short 26 Feb 2016 # Adrian Short 26 Feb 2016


COOKIEJAR=cookiejar.txt COOKIEJAR=cookiejar.txt
BASEURL=https://fastweb.sutton.gov.uk/fastweb
URLS=urls.txt
BASEURL=https://fastweb.sutton.gov.uk/FASTWEB


mkdir -p $1 mkdir -p $1
cd $1 cd $1


echo "Getting session cookies"
curl -s -c $COOKIEJAR "$BASEURL/welcome.asp" > /dev/null # Get the session cookies curl -s -c $COOKIEJAR "$BASEURL/welcome.asp" > /dev/null # Get the session cookies
echo "OK"
echo


echo "Getting list of PDF files. This could take several minutes if there are a large number of documents for this application."
curl -s -c $COOKIEJAR \ curl -s -c $COOKIEJAR \
--data "cbxCopyrightStatement=on" \ --data "cbxCopyrightStatement=on" \
--data "ApplicationNumber=$1" \ --data "ApplicationNumber=$1" \
"$BASEURL/images.asp" \ "$BASEURL/images.asp" \
| grep -E -o 'http.+?\.(pdf|PDF)' \
| wget --no-check-certificate --no-clobber -i -
| grep -E -o 'http.+?\.(pdf|PDF)' > $URLS
echo "OK"

echo "Downloading PDFs"
wget --no-check-certificate --no-clobber -i $URLS
echo "Downloading complete"


rm $COOKIEJAR rm $COOKIEJAR
ls -lht ls -lht


Loading…
Cancel
Save