;;; gap-buffer.scm --- String buffer that supports point
;;; Copyright (C) 2002, 2003, 2006 Free Software Foundation, Inc.
;;;
;;;; This library is free software; you can redistribute it and/or
;;;; modify it under the terms of the GNU Lesser General Public
;;;; License as published by the Free Software Foundation; either
;;;; version 3 of the License, or (at your option) any later version.
;;;;
;;;; This library is distributed in the hope that it will be useful,
;;;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
;;;; Lesser General Public License for more details.
;;;;
;;;; You should have received a copy of the GNU Lesser General Public
;;;; License along with this library; if not, write to the Free Software
;;;; Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
;;;
;;; Author: Thien-Thi Nguyen <ttn@gnu.org>
;;; Commentary:
;; A gap buffer is a structure that models a string but allows relatively
;; efficient insertion of text somewhere in the middle. The insertion
;; location is called `point' with minimum value 1, and a maximum value of the
;; length of the string (which is not fixed).
;;
;; Specifically, we allocate a continuous buffer of characters that is
;; composed of the BEFORE, the GAP and the AFTER (reading L->R), like so:
;;
;; +--- POINT
;; v
;; +--------------------+--------------------+--------------------+
;; | BEFORE | GAP | AFTER |
;; +--------------------+--------------------+--------------------+
;;
;; <----- bef-sz ----->|<----- gap-sz ----->|<----- aft-sz ----->
;;
;; <-------------------| usr-sz |------------------->
;;
;; <-------------------------- all-sz -------------------------->
;;
;; This diagram also shows how the different sizes are computed, and the
;; location of POINT. Note that the user-visible buffer size `usr-sz' does
;; NOT include the GAP, while the allocation `all-sz' DOES.
;;
;; The consequence of this arrangement is that "moving point" is simply a
;; matter of kicking characters across the GAP, while insertion can be viewed
;; as filling up the gap, increasing `bef-sz' and decreasing `gap-sz'. When
;; `gap-sz' falls below some threshold, we reallocate with a larger `all-sz'.
;;
;; In the implementation, we actually keep track of the AFTER start offset
;; `aft-ofs' since it is used more often than `gap-sz'. In fact, most of the
;; variables in the diagram are for conceptualization only.
;;
;; A gap buffer port is a soft port (see Guile manual) that wraps a gap
;; buffer. Character and string writes, as well as character reads, are
;; supported. Flushing and closing are not supported.
;;
;; These procedures are exported:
;; (gb? OBJ)
;; (make-gap-buffer . INIT)
;; (gb-point GB)
;; (gb-point-min GB)
;; (gb-point-max GB)
;; (gb-insert-string! GB STRING)
;; (gb-insert-char! GB CHAR)
;; (gb-delete-char! GB COUNT)
;; (gb-goto-char GB LOCATION)
;; (gb->string GB)
;; (gb-filter! GB STRING-PROC)
;; (gb->lines GB)
;; (gb-filter-lines! GB LINES-PROC)
;; (make-gap-buffer-port GB)
;;
;; INIT is an optional port or a string. COUNT and LOCATION are integers.
;; STRING-PROC is a procedure that takes and returns a string. LINES-PROC is
;; a procedure that takes and returns a list of strings, each representing a
;; line of text (newlines are stripped and added back automatically).
;;
;; (The term and concept of "gap buffer" are borrowed from Emacs. We will
;; gladly return them when libemacs.so is available. ;-)
;;
;; Notes:
;; - overrun errors are suppressed silently
;;; Code:
(define-module (ice-9 gap-buffer)
:autoload (srfi srfi-13) (string-join)
:export (gb?
make-gap-buffer
gb-point
gb-point-min
gb-point-max
gb-insert-string!
gb-insert-char!
gb-delete-char!
gb-erase!
gb-goto-char
gb->string
gb-filter!
gb->lines
gb-filter-lines!
make-gap-buffer-port))
(define gap-buffer
(make-record-type 'gap-buffer
'(s ; the buffer, a string
all-sz ; total allocation
gap-ofs ; GAP starts, aka (1- point)
aft-ofs ; AFTER starts
)))
(define gb? (record-predicate gap-buffer))
(define s: (record-accessor gap-buffer 's))
(define all-sz: (record-accessor gap-buffer 'all-sz))
(define gap-ofs: (record-accessor gap-buffer 'gap-ofs))
(define aft-ofs: (record-accessor gap-buffer 'aft-ofs))
(define s! (record-modifier gap-buffer 's))
(define all-sz! (record-modifier gap-buffer 'all-sz))
(define gap-ofs! (record-modifier gap-buffer 'gap-ofs))
(define aft-ofs! (record-modifier gap-buffer 'aft-ofs))
;; todo: expose
(define default-initial-allocation 128)
(define default-chunk-size 128)
(define default-realloc-threshold 32)
(define (round-up n)
(* default-chunk-size (+ 1 (quotient n default-chunk-size))))
(define new (record-constructor gap-buffer '()))
(define (realloc gb inc)
(let* ((old-s (s: gb))
(all-sz (all-sz: gb))
(new-sz (+ all-sz inc))
(gap-ofs (gap-ofs: gb))
(aft-ofs (aft-ofs: gb))
(new-s (make-string new-sz))
(new-aft-ofs (+ aft-ofs inc)))
(substring-move! old-s 0 gap-ofs new-s 0)
(substring-move! old-s aft-ofs all-sz new-s new-aft-ofs)
(s! gb new-s)
(all-sz! gb new-sz)
(aft-ofs! gb new-aft-ofs)))
(define (make-gap-buffer . init) ; port/string
(let ((gb (new)))
(cond ((null? init)
(s! gb (make-string default-initial-allocation))
(all-sz! gb default-initial-allocation)
(gap-ofs! gb 0)
(aft-ofs! gb default-initial-allocation))
(else (let ((jam! (lambda (string len)
(let ((alloc (round-up len)))
(s! gb (make-string alloc))
(all-sz! gb alloc)
(substring-move! string 0 len (s: gb) 0)
(gap-ofs! gb len)
(aft-ofs! gb alloc))))
(v (car init)))
(cond ((port? v)
(let ((next (lambda () (read-char v))))
(let loop ((c (next)) (acc '()) (len 0))
(if (eof-object? c)
(jam! (list->string (reverse acc)) len)
(loop (next) (cons c acc) (1+ len))))))
((string? v)
(jam! v (string-length v)))
(else (error "bad init type"))))))
gb))
(define (gb-point gb)
(1+ (gap-ofs: gb)))
(define (gb-point-min gb) 1) ; no narrowing (for now)
(define (gb-point-max gb)
(1+ (- (all-sz: gb) (- (aft-ofs: gb) (gap-ofs: gb)))))
(define (insert-prep gb len)
(let* ((gap-ofs (gap-ofs: gb))
(aft-ofs (aft-ofs: gb))
(slack (- (- aft-ofs gap-ofs) len)))
(and (< slack default-realloc-threshold)
(realloc gb (round-up (- slack))))
gap-ofs))
(define (gb-insert-string! gb string)
(let* ((len (string-length string))
(gap-ofs (insert-prep gb len)))
(substring-move! string 0 len (s: gb) gap-ofs)
(gap-ofs! gb (+ gap-ofs len))))
(define (gb-insert-char! gb char)
(let ((gap-ofs (insert-prep gb 1)))
(string-set! (s: gb) gap-ofs char)
(gap-ofs! gb (+ gap-ofs 1))))
(define (gb-delete-char! gb count)
(cond ((< count 0) ; backwards
(gap-ofs! gb (max 0 (+ (gap-ofs: gb) count))))
((> count 0) ; forwards
(aft-ofs! gb (min (all-sz: gb) (+ (aft-ofs: gb) count))))
((= count 0) ; do nothing
#t)))
(define (gb-erase! gb)
(gap-ofs! gb 0)
(aft-ofs! gb (all-sz: gb)))
(define (point++n! gb n s gap-ofs aft-ofs) ; n>0; warning: reckless
(substring-move! s aft-ofs (+ aft-ofs n) s gap-ofs)
(gap-ofs! gb (+ gap-ofs n))
(aft-ofs! gb (+ aft-ofs n)))
(define (point+-n! gb n s gap-ofs aft-ofs) ; n<0; warning: reckless
(substring-move! s (+ gap-ofs n) gap-ofs s (+ aft-ofs n))
(gap-ofs! gb (+ gap-ofs n))
(aft-ofs! gb (+ aft-ofs n)))
(define (gb-goto-char gb new-point)
(let ((pmax (gb-point-max gb)))
(or (and (< new-point 1) (gb-goto-char gb 1))
(and (> new-point pmax) (gb-goto-char gb pmax))
(let ((delta (- new-point (gb-point gb))))
(or (= delta 0)
((if (< delta 0)
point+-n!
point++n!)
gb delta (s: gb) (gap-ofs: gb) (aft-ofs: gb))))))
new-point)
(define (gb->string gb)
(let ((s (s: gb)))
(string-append (substring s 0 (gap-ofs: gb))
(substring s (aft-ofs: gb)))))
(define (gb-filter! gb string-proc)
(let ((new (string-proc (gb->string gb))))
(gb-erase! gb)
(gb-insert-string! gb new)))
(define (gb->lines gb)
(let ((str (gb->string gb)))
(let loop ((start 0) (acc '()))
(cond ((string-index str #\newline start)
=> (lambda (w)
(loop (1+ w) (cons (substring str start w) acc))))
(else (reverse (cons (substring str start) acc)))))))
(define (gb-filter-lines! gb lines-proc)
(let ((new-lines (lines-proc (gb->lines gb))))
(gb-erase! gb)
(gb-insert-string! gb (string-join new-lines #\newline))))
(define (make-gap-buffer-port gb)
(or (gb? gb)
(error "not a gap-buffer:" gb))
(make-soft-port
(vector
(lambda (c) (gb-insert-char! gb c))
(lambda (s) (gb-insert-string! gb s))
#f
(lambda () (let ((gap-ofs (gap-ofs: gb))
(aft-ofs (aft-ofs: gb)))
(if (= aft-ofs (all-sz: gb))
#f
(let* ((s (s: gb))
(c (string-ref s aft-ofs)))
(string-set! s gap-ofs c)
(gap-ofs! gb (1+ gap-ofs))
(aft-ofs! gb (1+ aft-ofs))
c))))
#f)
"rw"))
;;; gap-buffer.scm ends here