vendor/github.com/golang/protobuf/proto/decode.go
changeset 242 2a9ec03fe5a1
child 251 1c52a0eeb952
equal deleted inserted replaced
241:e77dad242f4c 242:2a9ec03fe5a1
       
     1 // Go support for Protocol Buffers - Google's data interchange format
       
     2 //
       
     3 // Copyright 2010 The Go Authors.  All rights reserved.
       
     4 // https://github.com/golang/protobuf
       
     5 //
       
     6 // Redistribution and use in source and binary forms, with or without
       
     7 // modification, are permitted provided that the following conditions are
       
     8 // met:
       
     9 //
       
    10 //     * Redistributions of source code must retain the above copyright
       
    11 // notice, this list of conditions and the following disclaimer.
       
    12 //     * Redistributions in binary form must reproduce the above
       
    13 // copyright notice, this list of conditions and the following disclaimer
       
    14 // in the documentation and/or other materials provided with the
       
    15 // distribution.
       
    16 //     * Neither the name of Google Inc. nor the names of its
       
    17 // contributors may be used to endorse or promote products derived from
       
    18 // this software without specific prior written permission.
       
    19 //
       
    20 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
       
    21 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
       
    22 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
       
    23 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
       
    24 // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
       
    25 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
       
    26 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
       
    27 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
       
    28 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
       
    29 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
       
    30 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
       
    31 
       
    32 package proto
       
    33 
       
    34 /*
       
    35  * Routines for decoding protocol buffer data to construct in-memory representations.
       
    36  */
       
    37 
       
    38 import (
       
    39 	"errors"
       
    40 	"fmt"
       
    41 	"io"
       
    42 )
       
    43 
       
    44 // errOverflow is returned when an integer is too large to be represented.
       
    45 var errOverflow = errors.New("proto: integer overflow")
       
    46 
       
    47 // ErrInternalBadWireType is returned by generated code when an incorrect
       
    48 // wire type is encountered. It does not get returned to user code.
       
    49 var ErrInternalBadWireType = errors.New("proto: internal error: bad wiretype for oneof")
       
    50 
       
    51 // DecodeVarint reads a varint-encoded integer from the slice.
       
    52 // It returns the integer and the number of bytes consumed, or
       
    53 // zero if there is not enough.
       
    54 // This is the format for the
       
    55 // int32, int64, uint32, uint64, bool, and enum
       
    56 // protocol buffer types.
       
    57 func DecodeVarint(buf []byte) (x uint64, n int) {
       
    58 	for shift := uint(0); shift < 64; shift += 7 {
       
    59 		if n >= len(buf) {
       
    60 			return 0, 0
       
    61 		}
       
    62 		b := uint64(buf[n])
       
    63 		n++
       
    64 		x |= (b & 0x7F) << shift
       
    65 		if (b & 0x80) == 0 {
       
    66 			return x, n
       
    67 		}
       
    68 	}
       
    69 
       
    70 	// The number is too large to represent in a 64-bit value.
       
    71 	return 0, 0
       
    72 }
       
    73 
       
    74 func (p *Buffer) decodeVarintSlow() (x uint64, err error) {
       
    75 	i := p.index
       
    76 	l := len(p.buf)
       
    77 
       
    78 	for shift := uint(0); shift < 64; shift += 7 {
       
    79 		if i >= l {
       
    80 			err = io.ErrUnexpectedEOF
       
    81 			return
       
    82 		}
       
    83 		b := p.buf[i]
       
    84 		i++
       
    85 		x |= (uint64(b) & 0x7F) << shift
       
    86 		if b < 0x80 {
       
    87 			p.index = i
       
    88 			return
       
    89 		}
       
    90 	}
       
    91 
       
    92 	// The number is too large to represent in a 64-bit value.
       
    93 	err = errOverflow
       
    94 	return
       
    95 }
       
    96 
       
    97 // DecodeVarint reads a varint-encoded integer from the Buffer.
       
    98 // This is the format for the
       
    99 // int32, int64, uint32, uint64, bool, and enum
       
   100 // protocol buffer types.
       
   101 func (p *Buffer) DecodeVarint() (x uint64, err error) {
       
   102 	i := p.index
       
   103 	buf := p.buf
       
   104 
       
   105 	if i >= len(buf) {
       
   106 		return 0, io.ErrUnexpectedEOF
       
   107 	} else if buf[i] < 0x80 {
       
   108 		p.index++
       
   109 		return uint64(buf[i]), nil
       
   110 	} else if len(buf)-i < 10 {
       
   111 		return p.decodeVarintSlow()
       
   112 	}
       
   113 
       
   114 	var b uint64
       
   115 	// we already checked the first byte
       
   116 	x = uint64(buf[i]) - 0x80
       
   117 	i++
       
   118 
       
   119 	b = uint64(buf[i])
       
   120 	i++
       
   121 	x += b << 7
       
   122 	if b&0x80 == 0 {
       
   123 		goto done
       
   124 	}
       
   125 	x -= 0x80 << 7
       
   126 
       
   127 	b = uint64(buf[i])
       
   128 	i++
       
   129 	x += b << 14
       
   130 	if b&0x80 == 0 {
       
   131 		goto done
       
   132 	}
       
   133 	x -= 0x80 << 14
       
   134 
       
   135 	b = uint64(buf[i])
       
   136 	i++
       
   137 	x += b << 21
       
   138 	if b&0x80 == 0 {
       
   139 		goto done
       
   140 	}
       
   141 	x -= 0x80 << 21
       
   142 
       
   143 	b = uint64(buf[i])
       
   144 	i++
       
   145 	x += b << 28
       
   146 	if b&0x80 == 0 {
       
   147 		goto done
       
   148 	}
       
   149 	x -= 0x80 << 28
       
   150 
       
   151 	b = uint64(buf[i])
       
   152 	i++
       
   153 	x += b << 35
       
   154 	if b&0x80 == 0 {
       
   155 		goto done
       
   156 	}
       
   157 	x -= 0x80 << 35
       
   158 
       
   159 	b = uint64(buf[i])
       
   160 	i++
       
   161 	x += b << 42
       
   162 	if b&0x80 == 0 {
       
   163 		goto done
       
   164 	}
       
   165 	x -= 0x80 << 42
       
   166 
       
   167 	b = uint64(buf[i])
       
   168 	i++
       
   169 	x += b << 49
       
   170 	if b&0x80 == 0 {
       
   171 		goto done
       
   172 	}
       
   173 	x -= 0x80 << 49
       
   174 
       
   175 	b = uint64(buf[i])
       
   176 	i++
       
   177 	x += b << 56
       
   178 	if b&0x80 == 0 {
       
   179 		goto done
       
   180 	}
       
   181 	x -= 0x80 << 56
       
   182 
       
   183 	b = uint64(buf[i])
       
   184 	i++
       
   185 	x += b << 63
       
   186 	if b&0x80 == 0 {
       
   187 		goto done
       
   188 	}
       
   189 	// x -= 0x80 << 63 // Always zero.
       
   190 
       
   191 	return 0, errOverflow
       
   192 
       
   193 done:
       
   194 	p.index = i
       
   195 	return x, nil
       
   196 }
       
   197 
       
   198 // DecodeFixed64 reads a 64-bit integer from the Buffer.
       
   199 // This is the format for the
       
   200 // fixed64, sfixed64, and double protocol buffer types.
       
   201 func (p *Buffer) DecodeFixed64() (x uint64, err error) {
       
   202 	// x, err already 0
       
   203 	i := p.index + 8
       
   204 	if i < 0 || i > len(p.buf) {
       
   205 		err = io.ErrUnexpectedEOF
       
   206 		return
       
   207 	}
       
   208 	p.index = i
       
   209 
       
   210 	x = uint64(p.buf[i-8])
       
   211 	x |= uint64(p.buf[i-7]) << 8
       
   212 	x |= uint64(p.buf[i-6]) << 16
       
   213 	x |= uint64(p.buf[i-5]) << 24
       
   214 	x |= uint64(p.buf[i-4]) << 32
       
   215 	x |= uint64(p.buf[i-3]) << 40
       
   216 	x |= uint64(p.buf[i-2]) << 48
       
   217 	x |= uint64(p.buf[i-1]) << 56
       
   218 	return
       
   219 }
       
   220 
       
   221 // DecodeFixed32 reads a 32-bit integer from the Buffer.
       
   222 // This is the format for the
       
   223 // fixed32, sfixed32, and float protocol buffer types.
       
   224 func (p *Buffer) DecodeFixed32() (x uint64, err error) {
       
   225 	// x, err already 0
       
   226 	i := p.index + 4
       
   227 	if i < 0 || i > len(p.buf) {
       
   228 		err = io.ErrUnexpectedEOF
       
   229 		return
       
   230 	}
       
   231 	p.index = i
       
   232 
       
   233 	x = uint64(p.buf[i-4])
       
   234 	x |= uint64(p.buf[i-3]) << 8
       
   235 	x |= uint64(p.buf[i-2]) << 16
       
   236 	x |= uint64(p.buf[i-1]) << 24
       
   237 	return
       
   238 }
       
   239 
       
   240 // DecodeZigzag64 reads a zigzag-encoded 64-bit integer
       
   241 // from the Buffer.
       
   242 // This is the format used for the sint64 protocol buffer type.
       
   243 func (p *Buffer) DecodeZigzag64() (x uint64, err error) {
       
   244 	x, err = p.DecodeVarint()
       
   245 	if err != nil {
       
   246 		return
       
   247 	}
       
   248 	x = (x >> 1) ^ uint64((int64(x&1)<<63)>>63)
       
   249 	return
       
   250 }
       
   251 
       
   252 // DecodeZigzag32 reads a zigzag-encoded 32-bit integer
       
   253 // from  the Buffer.
       
   254 // This is the format used for the sint32 protocol buffer type.
       
   255 func (p *Buffer) DecodeZigzag32() (x uint64, err error) {
       
   256 	x, err = p.DecodeVarint()
       
   257 	if err != nil {
       
   258 		return
       
   259 	}
       
   260 	x = uint64((uint32(x) >> 1) ^ uint32((int32(x&1)<<31)>>31))
       
   261 	return
       
   262 }
       
   263 
       
   264 // DecodeRawBytes reads a count-delimited byte buffer from the Buffer.
       
   265 // This is the format used for the bytes protocol buffer
       
   266 // type and for embedded messages.
       
   267 func (p *Buffer) DecodeRawBytes(alloc bool) (buf []byte, err error) {
       
   268 	n, err := p.DecodeVarint()
       
   269 	if err != nil {
       
   270 		return nil, err
       
   271 	}
       
   272 
       
   273 	nb := int(n)
       
   274 	if nb < 0 {
       
   275 		return nil, fmt.Errorf("proto: bad byte length %d", nb)
       
   276 	}
       
   277 	end := p.index + nb
       
   278 	if end < p.index || end > len(p.buf) {
       
   279 		return nil, io.ErrUnexpectedEOF
       
   280 	}
       
   281 
       
   282 	if !alloc {
       
   283 		// todo: check if can get more uses of alloc=false
       
   284 		buf = p.buf[p.index:end]
       
   285 		p.index += nb
       
   286 		return
       
   287 	}
       
   288 
       
   289 	buf = make([]byte, nb)
       
   290 	copy(buf, p.buf[p.index:])
       
   291 	p.index += nb
       
   292 	return
       
   293 }
       
   294 
       
   295 // DecodeStringBytes reads an encoded string from the Buffer.
       
   296 // This is the format used for the proto2 string type.
       
   297 func (p *Buffer) DecodeStringBytes() (s string, err error) {
       
   298 	buf, err := p.DecodeRawBytes(false)
       
   299 	if err != nil {
       
   300 		return
       
   301 	}
       
   302 	return string(buf), nil
       
   303 }
       
   304 
       
   305 // Unmarshaler is the interface representing objects that can
       
   306 // unmarshal themselves.  The argument points to data that may be
       
   307 // overwritten, so implementations should not keep references to the
       
   308 // buffer.
       
   309 // Unmarshal implementations should not clear the receiver.
       
   310 // Any unmarshaled data should be merged into the receiver.
       
   311 // Callers of Unmarshal that do not want to retain existing data
       
   312 // should Reset the receiver before calling Unmarshal.
       
   313 type Unmarshaler interface {
       
   314 	Unmarshal([]byte) error
       
   315 }
       
   316 
       
   317 // newUnmarshaler is the interface representing objects that can
       
   318 // unmarshal themselves. The semantics are identical to Unmarshaler.
       
   319 //
       
   320 // This exists to support protoc-gen-go generated messages.
       
   321 // The proto package will stop type-asserting to this interface in the future.
       
   322 //
       
   323 // DO NOT DEPEND ON THIS.
       
   324 type newUnmarshaler interface {
       
   325 	XXX_Unmarshal([]byte) error
       
   326 }
       
   327 
       
   328 // Unmarshal parses the protocol buffer representation in buf and places the
       
   329 // decoded result in pb.  If the struct underlying pb does not match
       
   330 // the data in buf, the results can be unpredictable.
       
   331 //
       
   332 // Unmarshal resets pb before starting to unmarshal, so any
       
   333 // existing data in pb is always removed. Use UnmarshalMerge
       
   334 // to preserve and append to existing data.
       
   335 func Unmarshal(buf []byte, pb Message) error {
       
   336 	pb.Reset()
       
   337 	if u, ok := pb.(newUnmarshaler); ok {
       
   338 		return u.XXX_Unmarshal(buf)
       
   339 	}
       
   340 	if u, ok := pb.(Unmarshaler); ok {
       
   341 		return u.Unmarshal(buf)
       
   342 	}
       
   343 	return NewBuffer(buf).Unmarshal(pb)
       
   344 }
       
   345 
       
   346 // UnmarshalMerge parses the protocol buffer representation in buf and
       
   347 // writes the decoded result to pb.  If the struct underlying pb does not match
       
   348 // the data in buf, the results can be unpredictable.
       
   349 //
       
   350 // UnmarshalMerge merges into existing data in pb.
       
   351 // Most code should use Unmarshal instead.
       
   352 func UnmarshalMerge(buf []byte, pb Message) error {
       
   353 	if u, ok := pb.(newUnmarshaler); ok {
       
   354 		return u.XXX_Unmarshal(buf)
       
   355 	}
       
   356 	if u, ok := pb.(Unmarshaler); ok {
       
   357 		// NOTE: The history of proto have unfortunately been inconsistent
       
   358 		// whether Unmarshaler should or should not implicitly clear itself.
       
   359 		// Some implementations do, most do not.
       
   360 		// Thus, calling this here may or may not do what people want.
       
   361 		//
       
   362 		// See https://github.com/golang/protobuf/issues/424
       
   363 		return u.Unmarshal(buf)
       
   364 	}
       
   365 	return NewBuffer(buf).Unmarshal(pb)
       
   366 }
       
   367 
       
   368 // DecodeMessage reads a count-delimited message from the Buffer.
       
   369 func (p *Buffer) DecodeMessage(pb Message) error {
       
   370 	enc, err := p.DecodeRawBytes(false)
       
   371 	if err != nil {
       
   372 		return err
       
   373 	}
       
   374 	return NewBuffer(enc).Unmarshal(pb)
       
   375 }
       
   376 
       
   377 // DecodeGroup reads a tag-delimited group from the Buffer.
       
   378 // StartGroup tag is already consumed. This function consumes
       
   379 // EndGroup tag.
       
   380 func (p *Buffer) DecodeGroup(pb Message) error {
       
   381 	b := p.buf[p.index:]
       
   382 	x, y := findEndGroup(b)
       
   383 	if x < 0 {
       
   384 		return io.ErrUnexpectedEOF
       
   385 	}
       
   386 	err := Unmarshal(b[:x], pb)
       
   387 	p.index += y
       
   388 	return err
       
   389 }
       
   390 
       
   391 // Unmarshal parses the protocol buffer representation in the
       
   392 // Buffer and places the decoded result in pb.  If the struct
       
   393 // underlying pb does not match the data in the buffer, the results can be
       
   394 // unpredictable.
       
   395 //
       
   396 // Unlike proto.Unmarshal, this does not reset pb before starting to unmarshal.
       
   397 func (p *Buffer) Unmarshal(pb Message) error {
       
   398 	// If the object can unmarshal itself, let it.
       
   399 	if u, ok := pb.(newUnmarshaler); ok {
       
   400 		err := u.XXX_Unmarshal(p.buf[p.index:])
       
   401 		p.index = len(p.buf)
       
   402 		return err
       
   403 	}
       
   404 	if u, ok := pb.(Unmarshaler); ok {
       
   405 		// NOTE: The history of proto have unfortunately been inconsistent
       
   406 		// whether Unmarshaler should or should not implicitly clear itself.
       
   407 		// Some implementations do, most do not.
       
   408 		// Thus, calling this here may or may not do what people want.
       
   409 		//
       
   410 		// See https://github.com/golang/protobuf/issues/424
       
   411 		err := u.Unmarshal(p.buf[p.index:])
       
   412 		p.index = len(p.buf)
       
   413 		return err
       
   414 	}
       
   415 
       
   416 	// Slow workaround for messages that aren't Unmarshalers.
       
   417 	// This includes some hand-coded .pb.go files and
       
   418 	// bootstrap protos.
       
   419 	// TODO: fix all of those and then add Unmarshal to
       
   420 	// the Message interface. Then:
       
   421 	// The cast above and code below can be deleted.
       
   422 	// The old unmarshaler can be deleted.
       
   423 	// Clients can call Unmarshal directly (can already do that, actually).
       
   424 	var info InternalMessageInfo
       
   425 	err := info.Unmarshal(pb, p.buf[p.index:])
       
   426 	p.index = len(p.buf)
       
   427 	return err
       
   428 }