summaryrefslogtreecommitdiffstats
path: root/lcrawl
blob: 2c087c59890b3106d8468e6c75af4aa1ec6beda7 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
#!/bin/sh

BASIS="$1"
FILEREGEX="$2"
EXTREGEX="$3"
NEXTREGEX="$4"

function crawl() {
    CURRENT="$1"
    NUM="$2"
    LOCAL="$(mktemp)"
    
    wget -O"$LOCAL" "$CURRENT"
    
    FILE=$(perl -e 'while (<>) { $_ =~ '"$FILEREGEX"' && print && exit 0}' "$LOCAL")
    EXT=$(perl -e 'while (<>) { $_ =~ '"$EXTREGEX"' && print && exit 0}' "$LOCAL")
    
    NEXT=$(perl -e 'while (<>) { $_ =~ '"$NEXTREGEX"' && print && exit 0}; exit 1' "$LOCAL")
    HAS_NEXT=$?
    
    wget -O"$(printf "%03i" $NUM).$EXT" "$FILE"
    
    rm "$LOCAL"
    
    if [ $HAS_NEXT -eq 0 ]; then
	crawl "$NEXT" $(expr $NUM + 1)
    fi
}

crawl "$BASIS" 0