123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151 |
- package mahonia
- import (
- "io"
- "unicode/utf8"
- )
// defaultBufSize is the initial length, in bytes, of the buffer a Reader
// allocates for undecoded input.
const defaultBufSize = 4096
- type Reader struct {
- buf []byte
- rd io.Reader
- decode Decoder
- r, w int
- err error
- }
- func (d Decoder) NewReader(rd io.Reader) *Reader {
- b := new(Reader)
- b.buf = make([]byte, defaultBufSize)
- b.rd = rd
- b.decode = d
- return b
- }
- func (b *Reader) fill() {
-
- if b.r > 0 {
- copy(b.buf, b.buf[b.r:b.w])
- b.w -= b.r
- b.r = 0
- }
-
- n, e := b.rd.Read(b.buf[b.w:])
- b.w += n
- if e != nil {
- b.err = e
- }
- }
- func (b *Reader) Read(p []byte) (n int, err error) {
- n = len(p)
- filled := false
- if n == 0 {
- return 0, b.err
- }
- if b.w == b.r {
- if b.err != nil {
- return 0, b.err
- }
- if n > len(b.buf) {
-
-
- b.buf = make([]byte, n)
- }
- b.fill()
- filled = true
- if b.w == b.r {
- return 0, b.err
- }
- }
- i := 0
- for i < n {
- rune, size, status := b.decode(b.buf[b.r:b.w])
- if status == STATE_ONLY {
- b.r += size
- continue
- }
- if status == NO_ROOM {
- if b.err != nil {
- rune = 0xfffd
- size = b.w - b.r
- if size == 0 {
- break
- }
- status = INVALID_CHAR
- } else if filled {
- break
- } else {
- b.fill()
- filled = true
- continue
- }
- }
- if i+utf8.RuneLen(rune) > n {
- break
- }
- b.r += size
- if rune < 128 {
- p[i] = byte(rune)
- i++
- } else {
- i += utf8.EncodeRune(p[i:], rune)
- }
- }
- return i, nil
- }
- func (b *Reader) ReadRune() (c rune, size int, err error) {
- read:
- c, size, status := b.decode(b.buf[b.r:b.w])
- if status == NO_ROOM && b.err == nil {
- b.fill()
- goto read
- }
- if status == STATE_ONLY {
- b.r += size
- goto read
- }
- if b.r == b.w {
- return 0, 0, b.err
- }
- if status == NO_ROOM {
- c = 0xfffd
- size = b.w - b.r
- status = INVALID_CHAR
- }
- b.r += size
- return c, size, nil
- }
|