goext/gojson/indent.go

// Copyright 2010 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.

package json

import "bytes"

// HTMLEscape appends to dst the JSON-encoded src with <, >, &, U+2028 and U+2029
// characters inside string literals changed to \u003c, \u003e, \u0026, \u2028, \u2029
// so that the JSON will be safe to embed inside HTML <script> tags.
// For historical reasons, web browsers don't honor standard HTML
// escaping within <script> tags, so an alternative JSON encoding must be used.
func HTMLEscape(dst *bytes.Buffer, src []byte) {
	dst.Grow(len(src))
	dst.Write(appendHTMLEscape(dst.AvailableBuffer(), src))
}

func appendHTMLEscape(dst, src []byte) []byte {
	// The characters can only appear in string literals,
	// so just scan the string one byte at a time.
	start := 0
	for i, c := range src {
		if c == '<' || c == '>' || c == '&' {
			dst = append(dst, src[start:i]...)
			dst = append(dst, '\\', 'u', '0', '0', hex[c>>4], hex[c&0xF])
			start = i + 1
		}
		// Convert U+2028 and U+2029 (E2 80 A8 and E2 80 A9).
		if c == 0xE2 && i+2 < len(src) && src[i+1] == 0x80 && src[i+2]&^1 == 0xA8 {
			dst = append(dst, src[start:i]...)
			dst = append(dst, '\\', 'u', '2', '0', '2', hex[src[i+2]&0xF])
			start = i + len("\u2029")
		}
	}
	return append(dst, src[start:]...)
}

// Compact appends to dst the JSON-encoded src with
// insignificant space characters elided.
func Compact(dst *bytes.Buffer, src []byte) error {
	dst.Grow(len(src))
	b := dst.AvailableBuffer()
	b, err := appendCompact(b, src, false)
	dst.Write(b)
	return err
}

func appendCompact(dst, src []byte, escape bool) ([]byte, error) {
	origLen := len(dst)
	scan := newScanner()
	defer freeScanner(scan)
	start := 0
	for i, c := range src {
		if escape && (c == '<' || c == '>' || c == '&') {
			if start < i {
				dst = append(dst, src[start:i]...)
			}
			dst = append(dst, '\\', 'u', '0', '0', hex[c>>4], hex[c&0xF])
			start = i + 1
		}
		// Convert U+2028 and U+2029 (E2 80 A8 and E2 80 A9).
		if escape && c == 0xE2 && i+2 < len(src) && src[i+1] == 0x80 && src[i+2]&^1 == 0xA8 {
			if start < i {
				dst = append(dst, src[start:i]...)
			}
			dst = append(dst, '\\', 'u', '2', '0', '2', hex[src[i+2]&0xF])
			start = i + 3
		}
		v := scan.step(scan, c)
		if v >= scanSkipSpace {
			if v == scanError {
				break
			}
			if start < i {
				dst = append(dst, src[start:i]...)
			}
			start = i + 1
		}
	}
	if scan.eof() == scanError {
		return dst[:origLen], scan.err
	}
	if start < len(src) {
		dst = append(dst, src[start:]...)
	}
	return dst, nil
}

func appendNewline(dst []byte, prefix, indent string, depth int) []byte {
	dst = append(dst, '\n')
	dst = append(dst, prefix...)
	for i := 0; i < depth; i++ {
		dst = append(dst, indent...)
	}
	return dst
}

// indentGrowthFactor specifies the growth factor of indenting JSON input.
// Empirically, the growth factor was measured to be between 1.4x to 1.8x
// for some set of compacted JSON with the indent being a single tab.
// Specify a growth factor slightly larger than what is observed
// to reduce probability of allocation in appendIndent.
// A factor no higher than 2 ensures that wasted space never exceeds 50%.
const indentGrowthFactor = 2

// Indent appends to dst an indented form of the JSON-encoded src.
// Each element in a JSON object or array begins on a new,
// indented line beginning with prefix followed by one or more
// copies of indent according to the indentation nesting.
// The data appended to dst does not begin with the prefix nor
// any indentation, to make it easier to embed inside other formatted JSON data.
// Although leading space characters (space, tab, carriage return, newline)
// at the beginning of src are dropped, trailing space characters
// at the end of src are preserved and copied to dst.
// For example, if src has no trailing spaces, neither will dst;
// if src ends in a trailing newline, so will dst.
func Indent(dst *bytes.Buffer, src []byte, prefix, indent string) error {
	dst.Grow(indentGrowthFactor * len(src))
	b := dst.AvailableBuffer()
	b, err := appendIndent(b, src, prefix, indent)
	dst.Write(b)
	return err
}

func appendIndent(dst, src []byte, prefix, indent string) ([]byte, error) {
	origLen := len(dst)
	scan := newScanner()
	defer freeScanner(scan)
	needIndent := false
	depth := 0
	for _, c := range src {
		scan.bytes++
		v := scan.step(scan, c)
		if v == scanSkipSpace {
			continue
		}
		if v == scanError {
			break
		}
		if needIndent && v != scanEndObject && v != scanEndArray {
			needIndent = false
			depth++
			dst = appendNewline(dst, prefix, indent, depth)
		}

		// Emit semantically uninteresting bytes
		// (in particular, punctuation in strings) unmodified.
		if v == scanContinue {
			dst = append(dst, c)
			continue
		}

		// Add spacing around real punctuation.
		switch c {
		case '{', '[':
			// delay indent so that empty object and array are formatted as {} and [].
			needIndent = true
			dst = append(dst, c)
		case ',':
			dst = append(dst, c)
			dst = appendNewline(dst, prefix, indent, depth)
		case ':':
			dst = append(dst, c, ' ')
		case '}', ']':
			if needIndent {
				// suppress indent in empty object/array
				needIndent = false
			} else {
				depth--
				dst = appendNewline(dst, prefix, indent, depth)
			}
			dst = append(dst, c)
		default:
			dst = append(dst, c)
		}
	}
	if scan.eof() == scanError {
		return dst[:origLen], scan.err
	}
	return dst, nil
}
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`// Copyright 2010 The Go Authors. All rights reserved.`
			`// Use of this source code is governed by a BSD-style`
			`// license that can be found in the LICENSE file.`

			`package json`

Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`import "bytes"`

			`// HTMLEscape appends to dst the JSON-encoded src with <, >, &, U+2028 and U+2029`
			`// characters inside string literals changed to \u003c, \u003e, \u0026, \u2028, \u2029`
			`// so that the JSON will be safe to embed inside HTML <script> tags.`
			`// For historical reasons, web browsers don't honor standard HTML`
			`// escaping within <script> tags, so an alternative JSON encoding must be used.`
			`func HTMLEscape(dst *bytes.Buffer, src []byte) {`
			`dst.Grow(len(src))`
			`dst.Write(appendHTMLEscape(dst.AvailableBuffer(), src))`
			`}`

			`func appendHTMLEscape(dst, src []byte) []byte {`
			`// The characters can only appear in string literals,`
			`// so just scan the string one byte at a time.`
			`start := 0`
			`for i, c := range src {`
			`if c == '<' \|\| c == '>' \|\| c == '&' {`
			`dst = append(dst, src[start:i]...)`
			`dst = append(dst, '\\', 'u', '0', '0', hex[c>>4], hex[c&0xF])`
			`start = i + 1`
			`}`
			`// Convert U+2028 and U+2029 (E2 80 A8 and E2 80 A9).`
			`if c == 0xE2 && i+2 < len(src) && src[i+1] == 0x80 && src[i+2]&^1 == 0xA8 {`
			`dst = append(dst, src[start:i]...)`
			`dst = append(dst, '\\', 'u', '2', '0', '2', hex[src[i+2]&0xF])`
			`start = i + len("\u2029")`
			`}`
			`}`
			`return append(dst, src[start:]...)`
			`}`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00
			`// Compact appends to dst the JSON-encoded src with`
			`// insignificant space characters elided.`
			`func Compact(dst *bytes.Buffer, src []byte) error {`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst.Grow(len(src))`
			`b := dst.AvailableBuffer()`
			`b, err := appendCompact(b, src, false)`
			`dst.Write(b)`
			`return err`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`}`

Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`func appendCompact(dst, src []byte, escape bool) ([]byte, error) {`
			`origLen := len(dst)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`scan := newScanner()`
			`defer freeScanner(scan)`
			`start := 0`
			`for i, c := range src {`
			`if escape && (c == '<' \|\| c == '>' \|\| c == '&') {`
			`if start < i {`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = append(dst, src[start:i]...)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`}`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = append(dst, '\\', 'u', '0', '0', hex[c>>4], hex[c&0xF])`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`start = i + 1`
			`}`
			`// Convert U+2028 and U+2029 (E2 80 A8 and E2 80 A9).`
			`if escape && c == 0xE2 && i+2 < len(src) && src[i+1] == 0x80 && src[i+2]&^1 == 0xA8 {`
			`if start < i {`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = append(dst, src[start:i]...)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`}`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = append(dst, '\\', 'u', '2', '0', '2', hex[src[i+2]&0xF])`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`start = i + 3`
			`}`
			`v := scan.step(scan, c)`
			`if v >= scanSkipSpace {`
			`if v == scanError {`
			`break`
			`}`
			`if start < i {`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = append(dst, src[start:i]...)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`}`
			`start = i + 1`
			`}`
			`}`
			`if scan.eof() == scanError {`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`return dst[:origLen], scan.err`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`}`
			`if start < len(src) {`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = append(dst, src[start:]...)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`}`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`return dst, nil`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`}`

Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`func appendNewline(dst []byte, prefix, indent string, depth int) []byte {`
			`dst = append(dst, '\n')`
			`dst = append(dst, prefix...)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`for i := 0; i < depth; i++ {`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = append(dst, indent...)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`}`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`return dst`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`}`

Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`// indentGrowthFactor specifies the growth factor of indenting JSON input.`
			`// Empirically, the growth factor was measured to be between 1.4x to 1.8x`
			`// for some set of compacted JSON with the indent being a single tab.`
			`// Specify a growth factor slightly larger than what is observed`
			`// to reduce probability of allocation in appendIndent.`
			`// A factor no higher than 2 ensures that wasted space never exceeds 50%.`
			`const indentGrowthFactor = 2`

added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`// Indent appends to dst an indented form of the JSON-encoded src.`
			`// Each element in a JSON object or array begins on a new,`
			`// indented line beginning with prefix followed by one or more`
			`// copies of indent according to the indentation nesting.`
			`// The data appended to dst does not begin with the prefix nor`
			`// any indentation, to make it easier to embed inside other formatted JSON data.`
			`// Although leading space characters (space, tab, carriage return, newline)`
			`// at the beginning of src are dropped, trailing space characters`
			`// at the end of src are preserved and copied to dst.`
			`// For example, if src has no trailing spaces, neither will dst;`
			`// if src ends in a trailing newline, so will dst.`
			`func Indent(dst *bytes.Buffer, src []byte, prefix, indent string) error {`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst.Grow(indentGrowthFactor * len(src))`
			`b := dst.AvailableBuffer()`
			`b, err := appendIndent(b, src, prefix, indent)`
			`dst.Write(b)`
			`return err`
			`}`

			`func appendIndent(dst, src []byte, prefix, indent string) ([]byte, error) {`
			`origLen := len(dst)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`scan := newScanner()`
			`defer freeScanner(scan)`
			`needIndent := false`
			`depth := 0`
			`for _, c := range src {`
			`scan.bytes++`
			`v := scan.step(scan, c)`
			`if v == scanSkipSpace {`
			`continue`
			`}`
			`if v == scanError {`
			`break`
			`}`
			`if needIndent && v != scanEndObject && v != scanEndArray {`
			`needIndent = false`
			`depth++`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = appendNewline(dst, prefix, indent, depth)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`}`

			`// Emit semantically uninteresting bytes`
			`// (in particular, punctuation in strings) unmodified.`
			`if v == scanContinue {`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = append(dst, c)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`continue`
			`}`

			`// Add spacing around real punctuation.`
			`switch c {`
			`case '{', '[':`
			`// delay indent so that empty object and array are formatted as {} and [].`
			`needIndent = true`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = append(dst, c)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`case ',':`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = append(dst, c)`
			`dst = appendNewline(dst, prefix, indent, depth)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`case ':':`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = append(dst, c, ' ')`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`case '}', ']':`
			`if needIndent {`
			`// suppress indent in empty object/array`
			`needIndent = false`
			`} else {`
			`depth--`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = appendNewline(dst, prefix, indent, depth)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`}`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = append(dst, c)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`default:`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`dst = append(dst, c)`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`}`
			`}`
			`if scan.eof() == scanError {`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`return dst[:origLen], scan.err`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`}`
Reset gojson to golang/go\|1.23.4 [removes all custom changes] 2025-01-10 11:49:29 +01:00			`return dst, nil`
added gojson as a go/json fork (tag go1.20.2) 2023-04-20 14:30:24 +02:00			`}`