;;; sunterlib/s48/cavespider/string-util-alt.scm
;;; Copyright (c) 2012 Johan Ceuppens
;;;
;;; All rights reserved.
;;;
;;; Redistribution and use in source and binary forms, with or without
;;; modification, are permitted provided that the following conditions
;;; are met:
;;; 1. Redistributions of source code must retain the above copyright
;;; notice, this list of conditions and the following disclaimer.
;;; 2. Redistributions in binary form must reproduce the above copyright
;;; notice, this list of conditions and the following disclaimer in the
;;; documentation and/or other materials provided with the distribution.
;;; 3. The name of the authors may not be used to endorse or promote products
;;; derived from this software without specific prior written permission.
;;;
;;; THIS SOFTWARE IS PROVIDED BY THE AUTHORS ``AS IS'' AND ANY EXPRESS OR
;;; IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
;;; OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
;;; IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY DIRECT, INDIRECT,
;;; INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
;;; NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
;;; DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
;;; THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
;;; (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
;;; THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
(load "file-util.scm")
(load "hash-util.scm")
(load "html-util.scm")
;; Unfinished earlier draft of url->hostname, left commented out:
;;(define (url->hostname url-list hostname-list)
;; (let ((file-contents (file-contents->url )))
;; ))
;; FIXME: duplicate of the definition in string-util.scm.
;;; url->hostname URL-LIST HOSTNAME-LIST  =>  string
;;;
;;; Returns the host part of the first URL in URL-LIST.  The host is the
;;; text that follows a recognised scheme ("http://" or "ftp://", each
;;; optionally preceded by one space) and any further slashes, up to the
;;; first slash, backslash, space, newline or the end of the URL.
;;;
;;; The result is "" when URL-LIST is empty, when its first element is #f,
;;; when the URL is shorter than seven characters, or when it does not
;;; start with a recognised scheme.
;;;
;;; Side effect: the host of every URL examined is written to the current
;;; output port, in list order.  The walk ends at the end of the list or at
;;; the first element that is #f or shorter than seven characters.
;;;
;;; HOSTNAME-LIST is accepted for compatibility with existing callers; it
;;; is only handed on to the recursive call and never affects the result.
(define (url->hostname url-list hostname-list)

  ;; True when STR begins with PREFIX.
  (define (starts-with? str prefix)
    (let ((n (string-length prefix)))
      (and (>= (string-length str) n)
           (string=? (substring str 0 n) prefix))))

  ;; Length of the scheme prefix URL starts with, or #f when it has none.
  (define (scheme-length url)
    (let loop ((schemes '("http://" "ftp://" " http://" " ftp://")))
      (cond ((null? schemes) #f)
            ((starts-with? url (car schemes))
             (string-length (car schemes)))
            (else (loop (cdr schemes))))))

  ;; True for the characters that end a host name.
  (define (host-delimiter? c)
    (or (char=? c #\space)
        (char=? c #\newline)
        (char=? c #\/)
        (char=? c #\\)))

  ;; Index of the first character at or after START for which STOP? holds,
  ;; or the length of URL when there is none.
  (define (scan url start stop?)
    (let ((len (string-length url)))
      (let loop ((i start))
        (if (or (>= i len) (stop? (string-ref url i)))
            i
            (loop (+ i 1))))))

  ;; Host part of a single URL; "" when no scheme is recognised.
  (define (host-of url)
    (let ((skip (scheme-length url)))
      (if skip
          ;; Step over surplus slashes ("http:///host") before reading the
          ;; host.  The loop exits are explicit: the value of SET! and of a
          ;; COND with no matching clause is unspecified and must not be
          ;; used as a termination test.
          (let* ((start (scan url skip (lambda (c) (not (char=? c #\/)))))
                 (end (scan url start host-delimiter?)))
            (substring url start end))
          "")))

  (let ((url (if (null? url-list) #f (car url-list))))
    (if (and url (>= (string-length url) 7))
        (let ((host (host-of url)))
          (display host)
          ;; Recurse only for the output side effect on the remaining
          ;; URLs; the value returned is always the first URL's host.
          (url->hostname (cdr url-list) hostname-list)
          host)
        "")))
;;
;;; tags FILENAME
;;;
;;; Passes FILENAME straight to `html-tags' and returns whatever that
;;; procedure returns.  `html-tags' is not defined in this file
;;; (presumably it comes from html-util.scm -- confirm).
(define tags
  (lambda (filename)
    (html-tags filename)))
;;
;;; file-contents->url TAGS-OF-FILE-CONTENTS-STR [IGNORED ...]  =>  list
;;;
;;; Scans the string TAGS-OF-FILE-CONTENTS-STR for occurrences of
;;; "http://" and returns, in order of appearance, a list of the strings
;;; found between each "http://" and the next `/'.
;;;
;;; An occurrence contributes nothing when a double quote or the end of
;;; the input is reached before a `/' (so href="http://example.com" is
;;; skipped, while href="http://example.com/" yields "example.com").
;;; NOTE(review): the original code marked the double-quote case FIXME;
;;; confirm whether such hosts should be collected as well.
;;;
;;; Any extra arguments are accepted and ignored.  Returns '() when no
;;; occurrence qualifies.
(define (file-contents->url tags-of-file-contents-str . dummy)
  (let* ((text tags-of-file-contents-str)
         (len (string-length text))
         (http-prefix "http://")
         (prefix-len (string-length http-prefix)))

    ;; True when HTTP-PREFIX occurs in TEXT starting at index POS.  The
    ;; bounds are checked first so the scan can never read past the end.
    (define (prefix-at? pos)
      (and (<= (+ pos prefix-len) len)
           (char=? (string-ref text pos) #\h)
           (string=? (substring text pos (+ pos prefix-len)) http-prefix)))

    ;; Index of the first `/' or `"' at or after POS, or LEN when neither
    ;; occurs before the end of TEXT.
    (define (token-end pos)
      (let loop ((k pos))
        (cond ((>= k len) len)
              ((or (char=? (string-ref text k) #\/)
                   (char=? (string-ref text k) #\"))
               k)
              (else (loop (+ k 1))))))

    ;; FOUND is accumulated in reverse and flipped once at the end, which
    ;; avoids re-copying the whole list on every match.
    (let scan ((i 0) (found '()))
      (cond ((>= i len) (reverse found))
            ((prefix-at? i)
             (let* ((start (+ i prefix-len))
                    (end (token-end start)))
               (if (and (< end len) (char=? (string-ref text end) #\/))
                   (scan (+ end 1) (cons (substring text start end) found))
                   ;; Stopped at a double quote or at the end of the
                   ;; input: record nothing for this occurrence.
                   (scan (+ end 1) found))))
            (else (scan (+ i 1) found))))))
;; Manual test (disabled):
;;(display
;; (file-contents->url (html-dump "index.html"))
;; )