blob: 837e5c4947a5afb1e5cc6328e1cd0e47c8627a96 [file] [log] [blame]
Damien Neil302cb322019-06-19 15:22:13 -07001// Copyright 2019 The Go Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style.
3// license that can be found in the LICENSE file.
4
5// Package messageset encodes and decodes the obsolete MessageSet wire format.
6package messageset
7
8import (
9 "google.golang.org/protobuf/internal/encoding/wire"
10 "google.golang.org/protobuf/internal/errors"
11 pref "google.golang.org/protobuf/reflect/protoreflect"
Joe Tsai5ae10aa2019-07-11 18:23:08 -070012 preg "google.golang.org/protobuf/reflect/protoregistry"
Damien Neil302cb322019-06-19 15:22:13 -070013)
14
15// The MessageSet wire format is equivalent to a message defiend as follows,
16// where each Item defines an extension field with a field number of 'type_id'
17// and content of 'message'. MessageSet extensions must be non-repeated message
18// fields.
19//
20// message MessageSet {
21// repeated group Item = 1 {
22// required int32 type_id = 2;
23// required string message = 3;
24// }
25// }
26const (
27 FieldItem = wire.Number(1)
28 FieldTypeID = wire.Number(2)
29 FieldMessage = wire.Number(3)
30)
31
Joe Tsai5ae10aa2019-07-11 18:23:08 -070032// ExtensionName is the field name for extensions of MessageSet.
33//
34// A valid MessageSet extension must be of the form:
35// message MyMessage {
36// extend proto2.bridge.MessageSet {
37// optional MyMessage message_set_extension = 1234;
38// }
39// ...
40// }
41const ExtensionName = "message_set_extension"
42
Damien Neil302cb322019-06-19 15:22:13 -070043// IsMessageSet returns whether the message uses the MessageSet wire format.
44func IsMessageSet(md pref.MessageDescriptor) bool {
45 xmd, ok := md.(interface{ IsMessageSet() bool })
46 return ok && xmd.IsMessageSet()
47}
48
Joe Tsai5ae10aa2019-07-11 18:23:08 -070049// IsMessageSetExtension reports this field extends a MessageSet.
50func IsMessageSetExtension(fd pref.FieldDescriptor) bool {
51 if fd.Name() != ExtensionName {
52 return false
53 }
54 if fd.FullName().Parent() != fd.Message().FullName() {
55 return false
56 }
57 return IsMessageSet(fd.ContainingMessage())
58}
59
60// FindMessageSetExtension locates a MessageSet extension field by name.
61// In text and JSON formats, the extension name used is the message itself.
62// The extension field name is derived by appending ExtensionName.
63func FindMessageSetExtension(r preg.ExtensionTypeResolver, s pref.FullName) (pref.ExtensionType, error) {
64 xt, err := r.FindExtensionByName(s.Append(ExtensionName))
65 if err != nil {
66 return nil, err
67 }
Damien Neil79bfdbe2019-08-28 11:08:22 -070068 if !IsMessageSetExtension(xt.TypeDescriptor()) {
Joe Tsai5ae10aa2019-07-11 18:23:08 -070069 return nil, preg.NotFound
70 }
71 return xt, nil
72}
73
Damien Neil302cb322019-06-19 15:22:13 -070074// SizeField returns the size of a MessageSet item field containing an extension
75// with the given field number, not counting the contents of the message subfield.
76func SizeField(num wire.Number) int {
77 return 2*wire.SizeTag(FieldItem) + wire.SizeTag(FieldTypeID) + wire.SizeVarint(uint64(num))
78}
79
Damien Neilce3384c2019-11-06 13:18:28 -080080// Unmarshal parses a MessageSet.
81//
82// It calls fn with the type ID and value of each item in the MessageSet.
83// Unknown fields are discarded.
84//
85// If wantLen is true, the item values include the varint length prefix.
86// This is ugly, but simplifies the fast-path decoder in internal/impl.
87func Unmarshal(b []byte, wantLen bool, fn func(typeID wire.Number, value []byte) error) error {
88 for len(b) > 0 {
89 num, wtyp, n := wire.ConsumeTag(b)
90 if n < 0 {
91 return wire.ParseError(n)
92 }
93 b = b[n:]
94 if num != FieldItem || wtyp != wire.StartGroupType {
95 n := wire.ConsumeFieldValue(num, wtyp, b)
96 if n < 0 {
97 return wire.ParseError(n)
98 }
99 b = b[n:]
100 continue
101 }
Damien Neil9afe9bb2020-02-07 10:06:53 -0800102 typeID, value, n, err := ConsumeFieldValue(b, wantLen)
Damien Neilce3384c2019-11-06 13:18:28 -0800103 if err != nil {
104 return err
105 }
106 b = b[n:]
107 if typeID == 0 {
108 continue
109 }
110 if err := fn(typeID, value); err != nil {
111 return err
112 }
Damien Neil302cb322019-06-19 15:22:13 -0700113 }
Damien Neilce3384c2019-11-06 13:18:28 -0800114 return nil
Damien Neil302cb322019-06-19 15:22:13 -0700115}
116
Damien Neil9afe9bb2020-02-07 10:06:53 -0800117// ConsumeFieldValue parses b as a MessageSet item field value until and including
Damien Neil302cb322019-06-19 15:22:13 -0700118// the trailing end group marker. It assumes the start group tag has already been parsed.
119// It returns the contents of the type_id and message subfields and the total
120// item length.
121//
122// If wantLen is true, the returned message value includes the length prefix.
Damien Neil9afe9bb2020-02-07 10:06:53 -0800123func ConsumeFieldValue(b []byte, wantLen bool) (typeid wire.Number, message []byte, n int, err error) {
Damien Neil302cb322019-06-19 15:22:13 -0700124 ilen := len(b)
125 for {
126 num, wtyp, n := wire.ConsumeTag(b)
127 if n < 0 {
128 return 0, nil, 0, wire.ParseError(n)
129 }
130 b = b[n:]
131 switch {
132 case num == FieldItem && wtyp == wire.EndGroupType:
133 if wantLen && len(message) == 0 {
134 // The message field was missing, which should never happen.
135 // Be prepared for this case anyway.
136 message = wire.AppendVarint(message, 0)
137 }
138 return typeid, message, ilen - len(b), nil
139 case num == FieldTypeID && wtyp == wire.VarintType:
140 v, n := wire.ConsumeVarint(b)
141 if n < 0 {
142 return 0, nil, 0, wire.ParseError(n)
143 }
144 b = b[n:]
145 typeid = wire.Number(v)
146 case num == FieldMessage && wtyp == wire.BytesType:
147 m, n := wire.ConsumeBytes(b)
148 if n < 0 {
149 return 0, nil, 0, wire.ParseError(n)
150 }
151 if message == nil {
152 if wantLen {
153 message = b[:n]
154 } else {
155 message = m
156 }
157 } else {
158 // This case should never happen in practice, but handle it for
159 // correctness: The MessageSet item contains multiple message
160 // fields, which need to be merged.
161 //
162 // In the case where we're returning the length, this becomes
163 // quite inefficient since we need to strip the length off
164 // the existing data and reconstruct it with the combined length.
165 if wantLen {
166 _, nn := wire.ConsumeVarint(message)
167 m0 := message[nn:]
168 message = message[:0]
169 message = wire.AppendVarint(message, uint64(len(m0)+len(m)))
170 message = append(message, m0...)
171 message = append(message, m...)
172 } else {
173 message = append(message, m...)
174 }
175 }
176 b = b[n:]
177 }
178 }
179}
180
181// AppendFieldStart appends the start of a MessageSet item field containing
182// an extension with the given number. The caller must add the message
183// subfield (including the tag).
184func AppendFieldStart(b []byte, num wire.Number) []byte {
185 b = wire.AppendTag(b, FieldItem, wire.StartGroupType)
186 b = wire.AppendTag(b, FieldTypeID, wire.VarintType)
187 b = wire.AppendVarint(b, uint64(num))
188 return b
189}
190
191// AppendFieldEnd appends the trailing end group marker for a MessageSet item field.
192func AppendFieldEnd(b []byte) []byte {
193 return wire.AppendTag(b, FieldItem, wire.EndGroupType)
194}
Damien Neilce3384c2019-11-06 13:18:28 -0800195
196// SizeUnknown returns the size of an unknown fields section in MessageSet format.
197//
198// See AppendUnknown.
199func SizeUnknown(unknown []byte) (size int) {
200 for len(unknown) > 0 {
201 num, typ, n := wire.ConsumeTag(unknown)
202 if n < 0 || typ != wire.BytesType {
203 return 0
204 }
205 unknown = unknown[n:]
206 _, n = wire.ConsumeBytes(unknown)
207 if n < 0 {
208 return 0
209 }
210 unknown = unknown[n:]
211 size += SizeField(num) + wire.SizeTag(FieldMessage) + n
212 }
213 return size
214}
215
216// AppendUnknown appends unknown fields to b in MessageSet format.
217//
218// For historic reasons, unresolved items in a MessageSet are stored in a
219// message's unknown fields section in non-MessageSet format. That is, an
220// unknown item with typeID T and value V appears in the unknown fields as
221// a field with number T and value V.
222//
223// This function converts the unknown fields back into MessageSet form.
224func AppendUnknown(b, unknown []byte) ([]byte, error) {
225 for len(unknown) > 0 {
226 num, typ, n := wire.ConsumeTag(unknown)
227 if n < 0 || typ != wire.BytesType {
228 return nil, errors.New("invalid data in message set unknown fields")
229 }
230 unknown = unknown[n:]
231 _, n = wire.ConsumeBytes(unknown)
232 if n < 0 {
233 return nil, errors.New("invalid data in message set unknown fields")
234 }
235 b = AppendFieldStart(b, num)
236 b = wire.AppendTag(b, FieldMessage, wire.BytesType)
237 b = append(b, unknown[:n]...)
238 b = AppendFieldEnd(b)
239 unknown = unknown[n:]
240 }
241 return b, nil
242}