123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596 |
- ;;; Encoding and decoding byte representations of strings
- ;; Copyright (C) 2013 Free Software Foundation, Inc.
- ;;;; This library is free software; you can redistribute it and/or
- ;;;; modify it under the terms of the GNU Lesser General Public
- ;;;; License as published by the Free Software Foundation; either
- ;;;; version 3 of the License, or (at your option) any later version.
- ;;;;
- ;;;; This library is distributed in the hope that it will be useful,
- ;;;; but WITHOUT ANY WARRANTY; without even the implied warranty of
- ;;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- ;;;; Lesser General Public License for more details.
- ;;;;
- ;;;; You should have received a copy of the GNU Lesser General Public
- ;;;; License along with this library; if not, write to the Free Software
- ;;;; Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
- ;;; Code:
- (define-module (ice-9 iconv)
- #:use-module (rnrs bytevectors)
- #:use-module (ice-9 binary-ports)
- #:use-module ((ice-9 rdelim) #:select (read-string))
- #:export (string->bytevector
- bytevector->string
- call-with-encoded-output-string))
;; Variant of call-with-output-string that explicitly closes the string
;; port once its contents have been extracted.
;;
;; PROC is called with a fresh output string port as its single
;; argument; its return value is ignored.  The result is the string of
;; everything PROC wrote to that port.
(define (call-with-output-string* proc)
  (let* ((out (open-output-string))
         ;; Run PROC first, then snapshot what it wrote.
         (text (begin
                 (proc out)
                 (get-output-string out))))
    ;; The text is captured before the port is closed.
    (close-port out)
    text))
;; Call PROC with a fresh bytevector output port, then return a
;; bytevector of the bytes PROC wrote.  PROC's return value is ignored.
;; The port is closed after the bytes have been extracted.
(define (call-with-output-bytevector* proc)
  ;; open-bytevector-output-port yields two values: the port and a
  ;; procedure that extracts the accumulated bytes.
  (call-with-values open-bytevector-output-port
    (lambda (out extract-bytes)
      (proc out)
      (let ((bytes (extract-bytes)))
        (close-port out)
        bytes))))
(define* (call-with-encoded-output-string encoding proc
                                          #:optional
                                          (conversion-strategy 'error))
  "Call PROC with a fresh output port as its only argument, then return
a bytevector holding whatever PROC wrote, encoded according to ENCODING
(a string naming a character encoding).  CONVERSION-STRATEGY defaults to
'error; a true value is installed on the port with
`set-port-conversion-strategy!', while #f leaves the port's conversion
strategy untouched."
  ;; True when the request is plain UTF-8 with the 'error strategy.
  (define utf8-fast-path?
    (and (string-ci=? encoding "utf-8")
         (eq? conversion-strategy 'error)))

  ;; Set up PORT for ENCODING / CONVERSION-STRATEGY, then hand it to PROC.
  (define (configure-and-run port)
    (set-port-encoding! port encoding)
    (when conversion-strategy
      (set-port-conversion-strategy! port conversion-strategy))
    (proc port))

  (cond
   (utf8-fast-path?
    ;; Collecting into a string and converting it with string->utf8 was
    ;; observed by the original author to be faster than writing through
    ;; an encoding port, for reasons unknown: serving
    ;; examples/debug-sxml.scm managed 1464 reqs/s versus 850 reqs/s.
    (string->utf8 (call-with-output-string* proc)))
   (else
    (call-with-output-bytevector* configure-and-run))))
;; TODO: Provide C implementations that call scm_from_stringn and
;; friends?

(define* (string->bytevector str encoding
                             #:optional (conversion-strategy 'error))
  "Return a bytevector holding the characters of STR encoded according
to ENCODING, which should be a string naming a character encoding, like
\"utf-8\".  CONVERSION-STRATEGY defaults to 'error and is passed on to
`call-with-encoded-output-string' when that procedure is used."
  ;; Writer handed to call-with-encoded-output-string on the general path.
  (define (write-str port)
    (display str port))

  (cond
   ;; UTF-8 with the 'error strategy is converted directly, without
   ;; going through a port.
   ((and (string-ci=? encoding "utf-8")
         (eq? conversion-strategy 'error))
    (string->utf8 str))
   (else
    (call-with-encoded-output-string encoding
                                     write-str
                                     conversion-strategy))))
(define* (bytevector->string bv encoding
                             #:optional (conversion-strategy 'error))
  "Return the string obtained by decoding the bytes of BV according to
ENCODING, which should be a string naming a character encoding, like
\"utf-8\".  CONVERSION-STRATEGY defaults to 'error; a true value is
installed on the decoding port with `set-port-conversion-strategy!',
while #f leaves the port's conversion strategy untouched."
  ;; General path: read all of BV back through an input port configured
  ;; for ENCODING.
  (define (decode-through-port)
    (let ((in (open-bytevector-input-port bv)))
      (set-port-encoding! in encoding)
      (when conversion-strategy
        (set-port-conversion-strategy! in conversion-strategy))
      (let ((text (read-string in)))
        (close-port in)
        ;; An end-of-file result is normalised to the empty string.
        (if (eof-object? text)
            ""
            text))))

  (cond
   ;; UTF-8 with the 'error strategy is converted directly, without
   ;; going through a port.
   ((and (string-ci=? encoding "utf-8")
         (eq? conversion-strategy 'error))
    (utf8->string bv))
   (else
    (decode-through-port))))
|