summaryrefslogtreecommitdiff
path: root/encode_string.go
blob: 12f934e0a97950ef7a8fe738c06bb4765cdd9663 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
// Copyright (C) 2022-2023  Luke Shumaker <lukeshu@lukeshu.com>
//
// SPDX-License-Identifier: GPL-2.0-or-later

package lowmemjson

import (
	"io"
	"unicode/utf8"

	"git.lukeshu.com/go/lowmemjson/internal"
)

// writeStringUnicodeEscape writes c to w as a six-byte `\uXXXX`
// escape, taking the four hex digits from the low 16 bits of c via
// the internal.Hex lookup table.  Bits above the low 16 are ignored.
//
// The return values are those of the single w.Write call.
func writeStringUnicodeEscape(w io.Writer, c rune) (int, error) {
	var esc [6]byte
	esc[0], esc[1] = '\\', 'u'
	// Emit one hex digit per nibble, most-significant nibble first.
	for i := 0; i < 4; i++ {
		shift := uint(3-i) * 4
		esc[2+i] = internal.Hex[(c>>shift)&0xf]
	}
	return w.Write(esc[:])
}

// writeStringShortEscape writes c to w as a two-byte backslash escape
// (`\"`, `\\`, `\/`, `\b`, `\f`, `\n`, `\r`, or `\t`).
//
// It panics if c is not one of those eight characters; callers are
// expected to check before calling.
//
// The return values are those of the single w.Write call.
func writeStringShortEscape(w io.Writer, c rune) (int, error) {
	// Only the second byte of the escape depends on c.
	esc := [...]byte{'\\', 0}
	switch {
	case c == '"' || c == '\\' || c == '/':
		// These three escape to themselves.
		esc[1] = byte(c)
	case c == '\b':
		esc[1] = 'b'
	case c == '\f':
		esc[1] = 'f'
	case c == '\n':
		esc[1] = 'n'
	case c == '\r':
		esc[1] = 'r'
	case c == '\t':
		esc[1] = 't'
	default:
		panic("should not happen")
	}
	return w.Write(esc[:])
}

// writeStringChar writes the single rune c, as part of the body of a
// JSON string, to w.
//
// The escaper is called with c and wasEscaped to choose how c should
// be written; a nil escaper means EscapeDefault.  The escaper's
// choice is obeyed where possible and overridden where obeying it
// would be impossible or would produce invalid JSON:
//
//   - BackslashEscapeNone: control characters (below U+0020), `"`,
//     and `\` are escaped anyway, using a short escape if one exists
//     and a `\uXXXX` escape otherwise.
//   - BackslashEscapeShort: characters with no short escape are
//     written as a `\uXXXX` escape if they are control characters
//     (which may not appear raw in a JSON string), and written
//     unescaped otherwise.
//   - BackslashEscapeUnicode: characters above U+FFFF do not fit in
//     a single `\uXXXX` escape and are written unescaped.
//
// The return values are those of the one underlying write that was
// performed.  It panics if the escaper returns any other mode.
func writeStringChar(w internal.AllWriter, c rune, wasEscaped BackslashEscapeMode, escaper BackslashEscaper) (int, error) {
	if escaper == nil {
		escaper = EscapeDefault
	}
	switch escaper(c, wasEscaped) {
	case BackslashEscapeNone:
		switch {
		case c < 0x0020: // override, gotta escape these
			switch c {
			case '\b', '\f', '\n', '\r', '\t': // short-escape if possible
				return writeStringShortEscape(w, c)
			default:
				return writeStringUnicodeEscape(w, c)
			}
		case c == '"' || c == '\\': // override, gotta escape these
			return writeStringShortEscape(w, c)
		default: // obey
			return w.WriteRune(c)
		}
	case BackslashEscapeShort:
		switch c {
		case '"', '\\', '/', '\b', '\f', '\n', '\r', '\t': // obey
			return writeStringShortEscape(w, c)
		default: // override, can't short-escape these
			if c < 0x0020 {
				// A raw control character is not valid inside
				// a JSON string, so it still has to be escaped
				// somehow; `\uXXXX` is the only form left.
				return writeStringUnicodeEscape(w, c)
			}
			return w.WriteRune(c)
		}
	case BackslashEscapeUnicode:
		switch {
		case c > 0xFFFF: // override, can't escape these (TODO: unless we use UTF-16 surrogates?)
			return w.WriteRune(c)
		default: // obey
			return writeStringUnicodeEscape(w, c)
		}
	default:
		panic("escaper returned an invalid escape mode")
	}
}

// encodeStringFromString writes str to w as a quoted JSON string: an
// opening `"`, then each rune of str in turn via writeStringChar
// (passing BackslashEscapeNone as the wasEscaped argument, along with
// the given escaper), then a closing `"`.
//
// It stops at, and returns, the first write error encountered.
func encodeStringFromString(w internal.AllWriter, escaper BackslashEscaper, str string) error {
	err := w.WriteByte('"')
	if err != nil {
		return err
	}
	for _, r := range str {
		_, err = writeStringChar(w, r, BackslashEscapeNone, escaper)
		if err != nil {
			return err
		}
	}
	// The closing quote is the last write, so its result is the
	// function's result.
	return w.WriteByte('"')
}

// encodeStringFromBytes writes str to w as a quoted JSON string: an
// opening `"`, then each rune decoded from str via writeStringChar
// (passing BackslashEscapeNone as the wasEscaped argument, along with
// the given escaper), then a closing `"`.
//
// Runes are decoded with utf8.DecodeRune, so a byte that is not part
// of a valid UTF-8 sequence is consumed on its own and passed along
// as utf8.RuneError.
//
// It stops at, and returns, the first write error encountered.
func encodeStringFromBytes(w internal.AllWriter, escaper BackslashEscaper, str []byte) error {
	err := w.WriteByte('"')
	if err != nil {
		return err
	}
	// Peel one rune at a time off the front of the remaining input.
	remaining := str
	for len(remaining) > 0 {
		r, width := utf8.DecodeRune(remaining)
		_, err = writeStringChar(w, r, BackslashEscapeNone, escaper)
		if err != nil {
			return err
		}
		remaining = remaining[width:]
	}
	// The closing quote is the last write, so its result is the
	// function's result.
	return w.WriteByte('"')
}

// init installs this package's string encoders as the
// internal.EncodeStringFromString and internal.EncodeStringFromBytes
// hooks.  Both hooks wrap the given io.Writer with
// internal.NewAllWriter and encode with a nil escaper.
func init() {
	// The hook signatures have no error return, so an encoding
	// failure is surfaced as a panic carrying the error value.
	mustSucceed := func(err error) {
		if err != nil {
			panic(err)
		}
	}
	internal.EncodeStringFromString = func(dst io.Writer, str string) {
		mustSucceed(encodeStringFromString(internal.NewAllWriter(dst), nil, str))
	}
	internal.EncodeStringFromBytes = func(dst io.Writer, raw []byte) {
		mustSucceed(encodeStringFromBytes(internal.NewAllWriter(dst), nil, raw))
	}
}