Source file src/encoding/binary/varint.go
1 // Copyright 2011 The Go Authors. All rights reserved. 2 // Use of this source code is governed by a BSD-style 3 // license that can be found in the LICENSE file. 4 5 package binary 6 7 // This file implements "varint" encoding of 64-bit integers. 8 // The encoding is: 9 // - unsigned integers are serialized 7 bits at a time, starting with the 10 // least significant bits 11 // - the most significant bit (msb) in each output byte indicates if there 12 // is a continuation byte (msb = 1) 13 // - signed integers are mapped to unsigned integers using "zig-zag" 14 // encoding: Positive values x are written as 2*x + 0, negative values 15 // are written as 2*(^x) + 1; that is, negative numbers are complemented 16 // and whether to complement is encoded in bit 0. 17 // 18 // Design note: 19 // At most 10 bytes are needed for 64-bit values. The encoding could 20 // be more dense: a full 64-bit value needs an extra byte just to hold bit 63. 21 // Instead, the msb of the previous byte could be used to hold bit 63 since we 22 // know there can't be more than 64 bits. This is a trivial improvement and 23 // would reduce the maximum encoding length to 9 bytes. However, it breaks the 24 // invariant that the msb is always the "continuation bit" and thus makes the 25 // format incompatible with a varint encoding for larger numbers (say 128-bit). 26 27 import ( 28 "errors" 29 "io" 30 ) 31 32 // MaxVarintLenN is the maximum length of a varint-encoded N-bit integer. 33 const ( 34 MaxVarintLen16 = 3 35 MaxVarintLen32 = 5 36 MaxVarintLen64 = 10 37 ) 38 39 // AppendUvarint appends the varint-encoded form of x, 40 // as generated by [PutUvarint], to buf and returns the extended buffer. 41 func AppendUvarint(buf []byte, x uint64) []byte { 42 for x >= 0x80 { 43 buf = append(buf, byte(x)|0x80) 44 x >>= 7 45 } 46 return append(buf, byte(x)) 47 } 48 49 // PutUvarint encodes a uint64 into buf and returns the number of bytes written. 50 // If the buffer is too small, PutUvarint will panic. 51 func PutUvarint(buf []byte, x uint64) int { 52 i := 0 53 for x >= 0x80 { 54 buf[i] = byte(x) | 0x80 55 x >>= 7 56 i++ 57 } 58 buf[i] = byte(x) 59 return i + 1 60 } 61 62 // Uvarint decodes a uint64 from buf and returns that value and the 63 // number of bytes read (> 0). If an error occurred, the value is 0 64 // and the number of bytes n is <= 0 meaning: 65 // - n == 0: buf too small; 66 // - n < 0: value larger than 64 bits (overflow) and -n is the number of 67 // bytes read. 68 func Uvarint(buf []byte) (uint64, int) { 69 var x uint64 70 var s uint 71 for i, b := range buf { 72 if i == MaxVarintLen64 { 73 // Catch byte reads past MaxVarintLen64. 74 // See issue https://golang.org/issues/41185 75 return 0, -(i + 1) // overflow 76 } 77 if b < 0x80 { 78 if i == MaxVarintLen64-1 && b > 1 { 79 return 0, -(i + 1) // overflow 80 } 81 return x | uint64(b)<<s, i + 1 82 } 83 x |= uint64(b&0x7f) << s 84 s += 7 85 } 86 return 0, 0 87 } 88 89 // AppendVarint appends the varint-encoded form of x, 90 // as generated by [PutVarint], to buf and returns the extended buffer. 91 func AppendVarint(buf []byte, x int64) []byte { 92 ux := uint64(x) << 1 93 if x < 0 { 94 ux = ^ux 95 } 96 return AppendUvarint(buf, ux) 97 } 98 99 // PutVarint encodes an int64 into buf and returns the number of bytes written. 100 // If the buffer is too small, PutVarint will panic. 101 func PutVarint(buf []byte, x int64) int { 102 ux := uint64(x) << 1 103 if x < 0 { 104 ux = ^ux 105 } 106 return PutUvarint(buf, ux) 107 } 108 109 // Varint decodes an int64 from buf and returns that value and the 110 // number of bytes read (> 0). If an error occurred, the value is 0 111 // and the number of bytes n is <= 0 with the following meaning: 112 // - n == 0: buf too small; 113 // - n < 0: value larger than 64 bits (overflow) 114 // and -n is the number of bytes read. 115 func Varint(buf []byte) (int64, int) { 116 ux, n := Uvarint(buf) // ok to continue in presence of error 117 x := int64(ux >> 1) 118 if ux&1 != 0 { 119 x = ^x 120 } 121 return x, n 122 } 123 124 var errOverflow = errors.New("binary: varint overflows a 64-bit integer") 125 126 // ReadUvarint reads an encoded unsigned integer from r and returns it as a uint64. 127 // The error is [io.EOF] only if no bytes were read. 128 // If an [io.EOF] happens after reading some but not all the bytes, 129 // ReadUvarint returns [io.ErrUnexpectedEOF]. 130 func ReadUvarint(r io.ByteReader) (uint64, error) { 131 var x uint64 132 var s uint 133 for i := 0; i < MaxVarintLen64; i++ { 134 b, err := r.ReadByte() 135 if err != nil { 136 if i > 0 && err == io.EOF { 137 err = io.ErrUnexpectedEOF 138 } 139 return x, err 140 } 141 if b < 0x80 { 142 if i == MaxVarintLen64-1 && b > 1 { 143 return x, errOverflow 144 } 145 return x | uint64(b)<<s, nil 146 } 147 x |= uint64(b&0x7f) << s 148 s += 7 149 } 150 return x, errOverflow 151 } 152 153 // ReadVarint reads an encoded signed integer from r and returns it as an int64. 154 // The error is [io.EOF] only if no bytes were read. 155 // If an [io.EOF] happens after reading some but not all the bytes, 156 // ReadVarint returns [io.ErrUnexpectedEOF]. 157 func ReadVarint(r io.ByteReader) (int64, error) { 158 ux, err := ReadUvarint(r) // ok to continue in presence of error 159 x := int64(ux >> 1) 160 if ux&1 != 0 { 161 x = ^x 162 } 163 return x, err 164 } 165