2012-01-31 04:33:17 -05:00
|
|
|
|
|
|
|
;;; load.scm - a scheme web spidering script
|
|
|
|
;;;
|
2012-01-31 08:12:10 -05:00
|
|
|
;;; Copyright (c) 2012 Johan Ceuppens
|
2012-01-31 04:33:17 -05:00
|
|
|
;;;
|
|
|
|
;;; All rights reserved.
|
|
|
|
;;;
|
|
|
|
;;; Redistribution and use in source and binary forms, with or without
|
|
|
|
;;; modification, are permitted provided that the following conditions
|
|
|
|
;;; are met:
|
|
|
|
;;; 1. Redistributions of source code must retain the above copyright
|
|
|
|
;;; notice, this list of conditions and the following disclaimer.
|
|
|
|
;;; 2. Redistributions in binary form must reproduce the above copyright
|
|
|
|
;;; notice, this list of conditions and the following disclaimer in the
|
|
|
|
;;; documentation and/or other materials provided with the distribution.
|
|
|
|
;;; 3. The name of the authors may not be used to endorse or promote products
|
|
|
|
;;; derived from this software without specific prior written permission.
|
|
|
|
;;;
|
|
|
|
;;; THIS SOFTWARE IS PROVIDED BY THE AUTHORS ``AS IS'' AND ANY EXPRESS OR
|
|
|
|
;;; IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
|
|
|
|
;;; OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
|
|
|
|
;;; IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY DIRECT, INDIRECT,
|
|
|
|
;;; INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
|
|
|
|
;;; NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
|
|
;;; DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
|
|
;;; THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
|
|
;;; (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
|
|
|
|
;;; THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
|
|
|
|
(load "client.scm")
|
|
|
|
|
|
|
|
(display "give hostname name : ")
|
|
|
|
(define hostname (symbol->string (read)))
|
|
|
|
(newline)
|
|
|
|
(display "server name = ")(display hostname)
|
|
|
|
(newline)
|
|
|
|
(display "give port : ")
|
|
|
|
(define port (number->string (read)))
|
|
|
|
(newline)
|
2012-01-31 23:05:49 -05:00
|
|
|
(define dir-filename (ask-server (string-append "GET / HTTP/1.0" (string #\return #\newline #\return #\newline)) "index.html" hostname port))
|
2012-01-31 04:33:17 -05:00
|
|
|
|
2012-01-31 22:46:31 -05:00
|
|
|
(display "give string to search for (no spaces): ")
|
2012-01-31 23:05:49 -05:00
|
|
|
(define keyword (symbol->string (read)))
|
2012-01-31 22:46:31 -05:00
|
|
|
(newline)
|
|
|
|
|
|
|
|
(let ((file-contents (file->string (string-append dir-filename "/" "index.html"))));;FIXME dir
|
2012-01-31 22:26:50 -05:00
|
|
|
;; (do ((url-list (file-contents->url file-contents 0)
|
|
|
|
;; (file-contents->url file-contents 0)))
|
2012-01-31 22:46:31 -05:00
|
|
|
(let ((hostname-list '())
|
|
|
|
(keywordl '())
|
|
|
|
(url-list (file-contents->url file-contents 0)))
|
|
|
|
(set! hostname-list (url->hostname url-list hostname-list));;FIXME url-list
|
|
|
|
(display hostname-list)
|
|
|
|
(file-contents->keyword file-contents keyword)
|
|
|
|
(display keywordl)
|
2012-01-31 22:26:50 -05:00
|
|
|
))
|