buffer.go 12.4 KB
Newer Older
1 2 3 4 5 6 7 8 9
// Copyright 2009 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.

package bytes

// Simple byte buffer for marshaling data.

import (
10
	"errors"
11
	"io"
12
	"unicode/utf8"
13 14 15 16 17 18 19 20 21
)

// A Buffer is a variable-sized buffer of bytes with Read and Write methods.
// The zero value for Buffer is an empty buffer ready to use.
type Buffer struct {
	buf       []byte            // contents are the bytes buf[off : len(buf)]
	off       int               // read at &buf[off], write at &buf[len(buf)]
	runeBytes [utf8.UTFMax]byte // avoid allocation of slice on each WriteByte or Rune
	bootstrap [64]byte          // memory to hold first slice; helps small buffers (Printf) avoid allocation.
22
	lastRead  readOp            // last read operation, so that Unread* can work correctly.
23 24
}

25 26 27 28 29 30 31 32 33 34 35
// readOp identifies the most recent action performed on a Buffer.
// UnreadRune and UnreadByte consult it to detect invalid usage.
type readOp int

const (
	// opInvalid marks a non-read operation.
	opInvalid readOp = iota
	// opReadRune marks a rune read.
	opReadRune
	// opRead marks any other read operation.
	opRead
)

36 37 38
// ErrTooLarge is the value passed to panic when memory cannot be allocated
// to store data in a buffer.
var ErrTooLarge = errors.New("bytes.Buffer: too large")

39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59
// Bytes returns the unread portion of the buffer as a slice, so that
// len(b.Bytes()) == b.Len(). The slice shares storage with the buffer:
// changing its contents changes the contents of the buffer, provided
// there are no intervening method calls on the Buffer.
func (b *Buffer) Bytes() []byte {
	unread := b.buf[b.off:]
	return unread
}

// String returns a copy of the unread portion of the buffer as a string.
// Calling it on a nil *Buffer yields "<nil>", which is convenient when
// debugging.
func (b *Buffer) String() string {
	if b != nil {
		return string(b.buf[b.off:])
	}
	return "<nil>"
}

// Len reports how many unread bytes the buffer holds;
// b.Len() == len(b.Bytes()).
func (b *Buffer) Len() int {
	total := len(b.buf)
	return total - b.off
}

// Truncate discards all but the first n unread bytes from the buffer.
60
// It panics if n is negative or greater than the length of the buffer.
61
func (b *Buffer) Truncate(n int) {
62
	b.lastRead = opInvalid
63 64 65 66
	switch {
	case n < 0 || n > b.Len():
		panic("bytes.Buffer: truncation out of range")
	case n == 0:
67 68 69 70 71 72 73 74 75 76
		// Reuse buffer space.
		b.off = 0
	}
	b.buf = b.buf[0 : b.off+n]
}

// Reset empties the buffer.
// b.Reset() is the same as b.Truncate(0).
func (b *Buffer) Reset() {
	b.Truncate(0)
}

77 78 79
// grow grows the buffer to guarantee space for n more bytes.
// It returns the index where bytes should be written.
// If the buffer can't grow it will panic with ErrTooLarge.
80 81 82 83 84 85 86 87 88 89 90 91
func (b *Buffer) grow(n int) int {
	m := b.Len()
	// If buffer is empty, reset to recover space.
	if m == 0 && b.off != 0 {
		b.Truncate(0)
	}
	if len(b.buf)+n > cap(b.buf) {
		var buf []byte
		if b.buf == nil && n <= len(b.bootstrap) {
			buf = b.bootstrap[0:]
		} else {
			// not enough space anywhere
92
			buf = makeSlice(2*cap(b.buf) + n)
93 94 95 96 97 98 99 100 101
			copy(buf, b.buf[b.off:])
		}
		b.buf = buf
		b.off = 0
	}
	b.buf = b.buf[0 : b.off+m+n]
	return b.off + m
}

102 103 104 105 106 107 108 109 110 111 112 113 114
// Grow enlarges the buffer's capacity, if necessary, so that another n bytes
// fit. After Grow(n), at least n bytes can be written to the buffer without
// another allocation. The buffer's contents and length are unchanged.
// If n is negative, Grow will panic.
// If the buffer can't grow it will panic with ErrTooLarge.
func (b *Buffer) Grow(n int) {
	if n < 0 {
		panic("bytes.Buffer.Grow: negative count")
	}
	// grow extends the length by n; cut it back so only capacity changes.
	// The call is kept as its own statement because it replaces b.buf.
	end := b.grow(n)
	b.buf = b.buf[:end]
}

115 116
// Write appends the contents of p to the buffer.  The return
// value n is the length of p; err is always nil.
117 118
// If the buffer becomes too large, Write will panic with
// ErrTooLarge.
119
func (b *Buffer) Write(p []byte) (n int, err error) {
120
	b.lastRead = opInvalid
121
	m := b.grow(len(p))
122
	return copy(b.buf[m:], p), nil
123 124 125 126
}

// WriteString appends the contents of s to the buffer.  The return
// value n is the length of s; err is always nil.
127 128
// If the buffer becomes too large, WriteString will panic with
// ErrTooLarge.
129
func (b *Buffer) WriteString(s string) (n int, err error) {
130
	b.lastRead = opInvalid
131 132 133 134 135 136 137 138 139 140 141 142
	m := b.grow(len(s))
	return copy(b.buf[m:], s), nil
}

// MinRead is the minimum slice size passed to a Read call by
// Buffer.ReadFrom. As long as the Buffer has at least MinRead bytes beyond
// what is required to hold the contents of r, ReadFrom will not grow the
// underlying buffer.
const MinRead = 512

// ReadFrom reads data from r until EOF and appends it to the buffer.
// The return value n is the number of bytes read.
143
// Any error except io.EOF encountered during the read
144
// is also returned.
145 146
// If the buffer becomes too large, ReadFrom will panic with
// ErrTooLarge.
147
func (b *Buffer) ReadFrom(r io.Reader) (n int64, err error) {
148
	b.lastRead = opInvalid
149 150 151 152 153
	// If buffer is empty, reset to recover space.
	if b.off >= len(b.buf) {
		b.Truncate(0)
	}
	for {
154 155 156 157 158 159 160
		if free := cap(b.buf) - len(b.buf); free < MinRead {
			// not enough space at end
			newBuf := b.buf
			if b.off+free < MinRead {
				// not enough space using beginning of buffer;
				// double buffer capacity
				newBuf = makeSlice(2*cap(b.buf) + MinRead)
161 162
			}
			copy(newBuf, b.buf[b.off:])
163
			b.buf = newBuf[:len(b.buf)-b.off]
164 165 166 167 168
			b.off = 0
		}
		m, e := r.Read(b.buf[len(b.buf):cap(b.buf)])
		b.buf = b.buf[0 : len(b.buf)+m]
		n += int64(m)
169
		if e == io.EOF {
170 171 172 173 174 175 176 177 178
			break
		}
		if e != nil {
			return n, e
		}
	}
	return n, nil // err is EOF, so return nil explicitly
}

179 180 181 182 183 184 185 186 187 188 189 190
// makeSlice returns a newly allocated byte slice of length n. Any panic
// raised by the allocation is replaced with a panic carrying ErrTooLarge,
// so callers see one well-known error value.
func makeSlice(n int) []byte {
	defer func() {
		if cause := recover(); cause != nil {
			panic(ErrTooLarge)
		}
	}()
	return make([]byte, n)
}

191
// WriteTo writes data to w until the buffer is drained or an error
192 193
// occurs. The return value n is the number of bytes written; it always
// fits into an int, but it is int64 to match the io.WriterTo interface.
194
// Any error encountered during the write is also returned.
195
func (b *Buffer) WriteTo(w io.Writer) (n int64, err error) {
196
	b.lastRead = opInvalid
197
	if b.off < len(b.buf) {
198
		nBytes := b.Len()
199
		m, e := w.Write(b.buf[b.off:])
200 201 202
		if m > nBytes {
			panic("bytes.Buffer.WriteTo: invalid Write count")
		}
203
		b.off += m
204
		n = int64(m)
205 206 207
		if e != nil {
			return n, e
		}
208
		// all bytes should have been written, by definition of
209
		// Write method in io.Writer
210 211 212
		if m != nBytes {
			return n, io.ErrShortWrite
		}
213 214 215 216 217 218 219 220 221
	}
	// Buffer is now empty; reset.
	b.Truncate(0)
	return
}

// WriteByte appends the byte c to the buffer.
// The returned error is always nil, but is included
// to match bufio.Writer's WriteByte.
222 223
// If the buffer becomes too large, WriteByte will panic with
// ErrTooLarge.
224
func (b *Buffer) WriteByte(c byte) error {
225
	b.lastRead = opInvalid
226 227 228 229 230 231 232 233 234
	m := b.grow(1)
	b.buf[m] = c
	return nil
}

// WriteRune appends the UTF-8 encoding of Unicode
// code point r to the buffer, returning its length and
// an error, which is always nil but is included
// to match bufio.Writer's WriteRune.
235 236
// If the buffer becomes too large, WriteRune will panic with
// ErrTooLarge.
237
func (b *Buffer) WriteRune(r rune) (n int, err error) {
238 239 240 241
	if r < utf8.RuneSelf {
		b.WriteByte(byte(r))
		return 1, nil
	}
242
	n = utf8.EncodeRune(b.runeBytes[0:], r)
243 244 245 246 247 248
	b.Write(b.runeBytes[0:n])
	return n, nil
}

// Read reads the next len(p) bytes from the buffer or until the buffer
// is drained.  The return value n is the number of bytes read.  If the
249
// buffer has no data to return, err is io.EOF (unless len(p) is zero);
250
// otherwise it is nil.
251
func (b *Buffer) Read(p []byte) (n int, err error) {
252
	b.lastRead = opInvalid
253 254 255
	if b.off >= len(b.buf) {
		// Buffer is empty, reset to recover space.
		b.Truncate(0)
256 257 258
		if len(p) == 0 {
			return
		}
259
		return 0, io.EOF
260 261 262
	}
	n = copy(p, b.buf[b.off:])
	b.off += n
263 264 265
	if n > 0 {
		b.lastRead = opRead
	}
266 267 268 269 270 271 272 273
	return
}

// Next returns a slice containing the next n bytes from the buffer,
// advancing the buffer as if the bytes had been returned by Read.
// If there are fewer than n bytes in the buffer, Next returns the entire buffer.
// The slice is only valid until the next call to a read or write method.
func (b *Buffer) Next(n int) []byte {
274
	b.lastRead = opInvalid
275 276 277 278 279 280
	m := b.Len()
	if n > m {
		n = m
	}
	data := b.buf[b.off : b.off+n]
	b.off += n
281 282 283
	if n > 0 {
		b.lastRead = opRead
	}
284 285 286 287
	return data
}

// ReadByte reads and returns the next byte from the buffer.
288
// If no byte is available, it returns error io.EOF.
289
func (b *Buffer) ReadByte() (c byte, err error) {
290
	b.lastRead = opInvalid
291 292 293
	if b.off >= len(b.buf) {
		// Buffer is empty, reset to recover space.
		b.Truncate(0)
294
		return 0, io.EOF
295 296 297
	}
	c = b.buf[b.off]
	b.off++
298
	b.lastRead = opRead
299 300 301 302 303
	return c, nil
}

// ReadRune reads and returns the next UTF-8-encoded
// Unicode code point from the buffer.
304
// If no bytes are available, the error returned is io.EOF.
305 306
// If the bytes are an erroneous UTF-8 encoding, it
// consumes one byte and returns U+FFFD, 1.
307
func (b *Buffer) ReadRune() (r rune, size int, err error) {
308
	b.lastRead = opInvalid
309 310 311
	if b.off >= len(b.buf) {
		// Buffer is empty, reset to recover space.
		b.Truncate(0)
312
		return 0, 0, io.EOF
313
	}
314
	b.lastRead = opReadRune
315 316 317
	c := b.buf[b.off]
	if c < utf8.RuneSelf {
		b.off++
318
		return rune(c), 1, nil
319 320 321 322 323 324
	}
	r, n := utf8.DecodeRune(b.buf[b.off:])
	b.off += n
	return r, n, nil
}

325 326 327 328 329
// UnreadRune unreads the last rune returned by ReadRune.
// If the most recent read or write operation on the buffer was
// not a ReadRune, UnreadRune returns an error.  (In this regard
// it is stricter than UnreadByte, which will unread the last byte
// from any read operation.)
330
func (b *Buffer) UnreadRune() error {
331
	if b.lastRead != opReadRune {
332
		return errors.New("bytes.Buffer: UnreadRune: previous operation was not ReadRune")
333 334 335 336 337 338 339 340 341 342 343 344
	}
	b.lastRead = opInvalid
	if b.off > 0 {
		_, n := utf8.DecodeLastRune(b.buf[0:b.off])
		b.off -= n
	}
	return nil
}

// UnreadByte unreads the last byte returned by the most recent
// read operation.  If write has happened since the last read, UnreadByte
// returns an error.
345
func (b *Buffer) UnreadByte() error {
346
	if b.lastRead != opReadRune && b.lastRead != opRead {
347
		return errors.New("bytes.Buffer: UnreadByte: previous operation was not a read")
348 349 350 351 352 353 354 355
	}
	b.lastRead = opInvalid
	if b.off > 0 {
		b.off--
	}
	return nil
}

356 357 358
// ReadBytes reads until the first occurrence of delim in the input,
// returning a slice containing the data up to and including the delimiter.
// If ReadBytes encounters an error before finding a delimiter,
359
// it returns the data read before the error and the error itself (often io.EOF).
360 361
// ReadBytes returns err != nil if and only if the returned data does not end in
// delim.
362
func (b *Buffer) ReadBytes(delim byte) (line []byte, err error) {
363 364 365 366 367 368 369 370 371
	slice, err := b.readSlice(delim)
	// return a copy of slice. The buffer's backing array may
	// be overwritten by later calls.
	line = append(line, slice...)
	return
}

// readSlice is like readBytes but returns a reference to internal buffer data.
func (b *Buffer) readSlice(delim byte) (line []byte, err error) {
372
	i := IndexByte(b.buf[b.off:], delim)
373
	end := b.off + i + 1
374
	if i < 0 {
375
		end = len(b.buf)
376
		err = io.EOF
377
	}
378 379 380
	line = b.buf[b.off:end]
	b.off = end
	return line, err
381 382 383 384 385
}

// ReadString reads until the first occurrence of delim in the input,
// returning a string containing the data up to and including the delimiter.
// If ReadString encounters an error before finding a delimiter,
386
// it returns the data read before the error and the error itself (often io.EOF).
387 388
// ReadString returns err != nil if and only if the returned data does not end
// in delim.
389
func (b *Buffer) ReadString(delim byte) (line string, err error) {
390 391
	slice, err := b.readSlice(delim)
	return string(slice), err
392 393
}

394 395
// NewBuffer creates and initializes a new Buffer using buf as its initial
// contents.  It is intended to prepare a Buffer to read existing data.  It
396
// can also be used to size the internal buffer for writing. To do that,
397
// buf should have the desired capacity but a length of zero.
398 399
//
// In most cases, new(Buffer) (or just declaring a Buffer variable) is
400
// sufficient to initialize a Buffer.
401 402 403
func NewBuffer(buf []byte) *Buffer { return &Buffer{buf: buf} }

// NewBufferString creates and initializes a new Buffer using string s as its
404 405 406 407 408
// initial contents. It is intended to prepare a buffer to read an existing
// string.
//
// In most cases, new(Buffer) (or just declaring a Buffer variable) is
// sufficient to initialize a Buffer.
409 410 411
func NewBufferString(s string) *Buffer {
	return &Buffer{buf: []byte(s)}
}