/[safari]/get_book.sh

This is a repository of my old source code, which isn't updated any more. Go to git.rot13.org for current projects!

Diff of /get_book.sh

Parent Directory | Revision Log | View Patch

-revision 1.7 by dpavlin,
Sun Feb 15 11:40:43 2004 UTC
+revision 1.8 by dpavlin,
Tue Feb 17 19:06:10 2004 UTC
 Line 38 
 function mirror() {
          file=`echo $url | sed -e s,http://[^?]*?,index.html?, -e s,#.*$,, -e s,/,%2F,g`
          if [ -e "$file" ] ; then
  #               echo "skip $url"
+                 echo -n "."
                  return
          fi
-Line 68 
 function geturl() {
+Line 69 
 function geturl() {
          sed -e 's/^.*<a.*href="//i' \
                  -e 's/".*//' -e 's/amp;//g' \
                  -e 's,^[^\?]*\?,http://safari.oreilly.com/,' \
-                 -e 's/#$//' \
+                 -e 's/#.*$//' \
                  -e 's/\&srchText=//' \
                  -e 's/open=false/open=true/' | \
                  grep '&s=1&b=1&f=1&t=1&c=1&u=1&r=&o=1' | \
-Line 81 
 function uniqurl() {
+Line 82 
 function uniqurl() {
          mv in in.tmp
          grep -v 'view=[A-Z]' in.tmp | sort -u > in
          grep 'view=[A-Z].*/index' in.tmp | sort -u >> in
+         links=`wc -l in | cut -d" " -f1`
+         echo "found $links unique links"
  }
  function mirror_in() {
-Line 108 
 function mirror_in() {
+Line 111 
 function mirror_in() {
                          exit 1
                  fi
          done
+         echo
  }
  echo -n > in
  mirror "http://safari.oreilly.com/?XmlId=$isbn"
+ echo
  echo "extract URLs from first page..."
  geturl "index.html?XmlId=$isbn" $isbn

 Legend:



Removed from v.1.7
 


changed lines


 
Added in v.1.8
 Legend:



Removed from v.1.7
 


changed lines


 
Added in v.1.8
-Removed from v.1.7
+Added in v.1.8

	ViewVC Help
Powered by ViewVC 1.1.26