mirror of
https://github.com/protocolbuffers/protobuf-go.git
synced 2025-01-26 18:35:25 +00:00
3c4ab8c6f1
This is more consistent with the indent documentation: If indent is a non-empty string, it causes every entry in a List or Message to be preceded by the indent and trailed by a newline. Since an empty message has no entries, there should be no newlines. Change-Id: I5d57165aaf94ca6b184bb35bf05d5d68f5ee9dd5 Reviewed-on: https://go-review.googlesource.com/c/protobuf/+/194877 Reviewed-by: Herbie Ong <herbie@google.com>
189 lines
4.9 KiB
Go
189 lines
4.9 KiB
Go
// Copyright 2018 The Go Authors. All rights reserved.
|
|
// Use of this source code is governed by a BSD-style
|
|
// license that can be found in the LICENSE file.
|
|
|
|
package text
|
|
|
|
import (
|
|
"regexp"
|
|
"strings"
|
|
|
|
"google.golang.org/protobuf/internal/detrand"
|
|
"google.golang.org/protobuf/internal/errors"
|
|
)
|
|
|
|
// Marshal serializes v as the proto text format, where v must be a Message.
|
|
// In the proto text format, the top-level value is always a message where the
|
|
// delimiters are elided.
|
|
//
|
|
// If indent is a non-empty string, it causes every entry in a List or Message
|
|
// to be preceded by the indent and trailed by a newline.
|
|
//
|
|
// If delims is not the zero value, it controls the delimiter characters used
|
|
// for messages (e.g., "{}" vs "<>").
|
|
//
|
|
// If outputASCII is true, strings will be serialized in such a way that
|
|
// multi-byte UTF-8 sequences are escaped. This property ensures that the
|
|
// overall output is ASCII (as opposed to UTF-8).
|
|
func Marshal(v Value, indent string, delims [2]byte, outputASCII bool) ([]byte, error) {
|
|
p := encoder{}
|
|
if len(indent) > 0 {
|
|
if strings.Trim(indent, " \t") != "" {
|
|
return nil, errors.New("indent may only be composed of space and tab characters")
|
|
}
|
|
p.indent = indent
|
|
p.newline = "\n"
|
|
}
|
|
switch delims {
|
|
case [2]byte{0, 0}:
|
|
p.delims = [2]byte{'{', '}'}
|
|
case [2]byte{'{', '}'}, [2]byte{'<', '>'}:
|
|
p.delims = delims
|
|
default:
|
|
return nil, errors.New("delimiters may only be \"{}\" or \"<>\"")
|
|
}
|
|
p.outputASCII = outputASCII
|
|
|
|
err := p.marshalMessage(v, false)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return p.out, nil
|
|
}
|
|
|
|
type encoder struct {
|
|
out []byte
|
|
|
|
indent string
|
|
indents []byte
|
|
newline string // set to "\n" if len(indent) > 0
|
|
delims [2]byte
|
|
outputASCII bool
|
|
}
|
|
|
|
func (p *encoder) marshalList(v Value) error {
|
|
if v.Type() != List {
|
|
return errors.New("invalid type %v, expected list", v.Type())
|
|
}
|
|
elems := v.List()
|
|
p.out = append(p.out, '[')
|
|
p.indents = append(p.indents, p.indent...)
|
|
if len(elems) > 0 {
|
|
p.out = append(p.out, p.newline...)
|
|
}
|
|
for i, elem := range elems {
|
|
p.out = append(p.out, p.indents...)
|
|
if err := p.marshalValue(elem); err != nil {
|
|
return err
|
|
}
|
|
if i < len(elems)-1 {
|
|
p.out = append(p.out, ',')
|
|
}
|
|
p.out = append(p.out, p.newline...)
|
|
}
|
|
p.indents = p.indents[:len(p.indents)-len(p.indent)]
|
|
if len(elems) > 0 {
|
|
p.out = append(p.out, p.indents...)
|
|
}
|
|
p.out = append(p.out, ']')
|
|
return nil
|
|
}
|
|
|
|
func (p *encoder) marshalMessage(v Value, emitDelims bool) error {
|
|
if v.Type() != Message {
|
|
return errors.New("invalid type %v, expected message", v.Type())
|
|
}
|
|
items := v.Message()
|
|
if emitDelims {
|
|
p.out = append(p.out, p.delims[0])
|
|
p.indents = append(p.indents, p.indent...)
|
|
if len(items) > 0 {
|
|
p.out = append(p.out, p.newline...)
|
|
}
|
|
}
|
|
for i, item := range items {
|
|
p.out = append(p.out, p.indents...)
|
|
if err := p.marshalKey(item[0]); err != nil {
|
|
return err
|
|
}
|
|
p.out = append(p.out, ':')
|
|
if len(p.indent) > 0 {
|
|
p.out = append(p.out, ' ')
|
|
// For multi-line output, add a random extra space after key:
|
|
// to make output unstable.
|
|
if detrand.Bool() {
|
|
p.out = append(p.out, ' ')
|
|
}
|
|
}
|
|
|
|
if err := p.marshalValue(item[1]); err != nil {
|
|
return err
|
|
}
|
|
if i < len(items)-1 && len(p.indent) == 0 {
|
|
p.out = append(p.out, ' ')
|
|
// For single-line output, add a random extra space after a field
|
|
// to make output unstable.
|
|
if detrand.Bool() {
|
|
p.out = append(p.out, ' ')
|
|
}
|
|
}
|
|
p.out = append(p.out, p.newline...)
|
|
}
|
|
if emitDelims {
|
|
p.indents = p.indents[:len(p.indents)-len(p.indent)]
|
|
if len(items) > 0 {
|
|
p.out = append(p.out, p.indents...)
|
|
}
|
|
p.out = append(p.out, p.delims[1])
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// This expression is more liberal than ConsumeAnyTypeUrl in C++.
|
|
// However, the C++ parser does not handle many legal URL strings.
|
|
// The Go implementation is more liberal to be backwards compatible with
|
|
// the historical Go implementation which was overly liberal (and buggy).
|
|
var urlRegexp = regexp.MustCompile(`^[-_a-zA-Z0-9]+([./][-_a-zA-Z0-9]+)*`)
|
|
|
|
func (p *encoder) marshalKey(v Value) error {
|
|
switch v.Type() {
|
|
case String:
|
|
var err error
|
|
p.out = append(p.out, '[')
|
|
if len(urlRegexp.FindString(v.str)) == len(v.str) {
|
|
p.out = append(p.out, v.str...)
|
|
} else {
|
|
err = p.marshalString(v)
|
|
}
|
|
p.out = append(p.out, ']')
|
|
return err
|
|
case Uint:
|
|
return p.marshalNumber(v)
|
|
case Name:
|
|
s, _ := v.Name()
|
|
p.out = append(p.out, s...)
|
|
return nil
|
|
default:
|
|
return errors.New("invalid type %v to encode key", v.Type())
|
|
}
|
|
}
|
|
|
|
func (p *encoder) marshalValue(v Value) error {
|
|
switch v.Type() {
|
|
case Bool, Int, Uint, Float32, Float64:
|
|
return p.marshalNumber(v)
|
|
case String:
|
|
return p.marshalString(v)
|
|
case List:
|
|
return p.marshalList(v)
|
|
case Message:
|
|
return p.marshalMessage(v, true)
|
|
case Name:
|
|
s, _ := v.Name()
|
|
p.out = append(p.out, s...)
|
|
return nil
|
|
default:
|
|
return errors.New("invalid type %v to encode value", v.Type())
|
|
}
|
|
}
|