]>
Commit | Line | Data |
---|---|---|
d8f41ccd A |
1 | #! /bin/csh -f |
2 | # | |
3 | # Runs urlPageGrab on a set of Safari plt-style sites. The HTML source for these sites | |
4 | # can be obtained from speedo_html.tar in this directory. You typically place | |
5 | # the untarred version of that in a user's ~/Sites directory; they'll appear in | |
6 | # ~/Sites/base. If you do this on host foo.local, in ~someUser/Sites, then you'd | |
7 | # typically run this script like this (the time prefix results in your shell | |
8 | # telling you how much time elapsed to execute the whole script): | |
9 | # | |
10 | # % time pltGrab foo.local "/~someUser/base" s q | |
11 | # | |
12 | # This assumes of course that you have an https-capable web server running on | |
13 | # host foo.local. See SecurityTech/apacheConfig/ for a script and instructions | |
14 | # that make that pretty easy. | |
15 | # | |
16 | #################################################################################### | |
17 | # Both the host name and the base path are required; print usage and fail without them. | |
18 | if ( $#argv < 2 ) then | |
19 | echo Usage: pltGrab pltHostName pltBasePath \[s \(ssl\)\] \[q \(quiet\)\] | |
20 | exit(1) | |
21 | endif | |
22 | ||
23 | set PLT_SITES = ( bugzilla.mozilla.org \ | |
24 | espn.go.com \ | |
25 | home.netscape.com \ | |
26 | hotwired.lycos.com \ | |
27 | lxr.mozilla.org \ | |
28 | my.netscape.com \ | |
29 | news.cnet.com \ | |
30 | slashdot.org \ | |
31 | web.icq.com \ | |
32 | www.altavista.com \ | |
33 | www.amazon.com \ | |
34 | www.aol.com \ | |
35 | www.apple.com \ | |
36 | www.cnn.com \ | |
37 | www.compuserve.com \ | |
38 | www.digitalcity.com \ | |
39 | www.ebay.com \ | |
40 | www.excite.com \ | |
41 | www.expedia.com \ | |
42 | www.google.com \ | |
43 | www.iplanet.com \ | |
44 | www.mapquest.com \ | |
45 | www.microsoft.com \ | |
46 | www.moviefone.com \ | |
47 | www.msn.com \ | |
48 | www.msnbc.com \ | |
49 | www.nytimes.com \ | |
50 | www.nytimes.com_Table \ | |
51 | www.quicken.com \ | |
52 | www.spinner.com \ | |
53 | www.sun.com \ | |
54 | www.time.com \ | |
55 | www.tomshardware.com \ | |
56 | www.travelocity.com \ | |
57 | www.voodooextreme.com \ | |
58 | www.w3.org_DOML2Core \ | |
59 | www.wired.com \ | |
60 | www.yahoo.com \ | |
61 | www.zdnet.com \ | |
62 | www.zdnet.com_Gamespot.com ) | |
63 | ||
64 | set PLT_HOST=$argv[1] | |
65 | set BASE_PATH=$argv[2] | |
66 | shift | |
67 | shift | |
68 | set QUIET= | |
69 | set DO_SSL= | |
70 | ||
71 | while ( $#argv > 0 ) | |
72 | switch ( "$argv[1]" ) | |
73 | case s: | |
74 | set DO_SSL = s | |
75 | shift | |
76 | breaksw | |
77 | case q: | |
78 | set QUIET = q | |
79 | shift | |
80 | breaksw | |
81 | default: | |
82 | echo Usage: pltGrab pltHostName pltBasePath \[s \(ssl\)\] \[q \(quiet\)\] | |
83 | exit(1) | |
84 | endsw | |
85 | end | |
86 | ||
87 | foreach site ($PLT_SITES) | |
88 | set HTTP_PATH="$BASE_PATH/$site/" | |
89 | urlPageGrab $PLT_HOST "$HTTP_PATH" $DO_SSL $QUIET || exit(1) | |
90 | end | |
91 |