2023-02-25 13:12:40 +01:00
|
|
|
/*
|
|
|
|
* Copyright 2021 ByteDance Inc.
|
|
|
|
*
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*/
|
|
|
|
|
|
|
|
package unquote
|
|
|
|
|
|
|
|
import (
|
|
|
|
`unsafe`
|
2023-06-01 23:20:16 +02:00
|
|
|
`runtime`
|
2023-02-25 13:12:40 +01:00
|
|
|
|
|
|
|
`github.com/bytedance/sonic/internal/native`
|
|
|
|
`github.com/bytedance/sonic/internal/native/types`
|
|
|
|
`github.com/bytedance/sonic/internal/rt`
|
|
|
|
)
|
|
|
|
|
2024-05-06 10:50:47 +02:00
|
|
|
// String unescapes a escaped string (not including `"` at begining and end)
|
|
|
|
// It validates invalid UTF8 and replace with `\ufffd`
|
2023-02-25 13:12:40 +01:00
|
|
|
func String(s string) (ret string, err types.ParsingError) {
|
|
|
|
mm := make([]byte, 0, len(s))
|
2024-05-06 10:50:47 +02:00
|
|
|
err = intoBytesUnsafe(s, &mm, true)
|
2023-02-25 13:12:40 +01:00
|
|
|
ret = rt.Mem2Str(mm)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2024-05-06 10:50:47 +02:00
|
|
|
// IntoBytes is same with String besides it output result into a buffer m
|
2023-02-25 13:12:40 +01:00
|
|
|
func IntoBytes(s string, m *[]byte) types.ParsingError {
|
|
|
|
if cap(*m) < len(s) {
|
|
|
|
return types.ERR_EOF
|
|
|
|
} else {
|
2024-05-06 10:50:47 +02:00
|
|
|
return intoBytesUnsafe(s, m, true)
|
2023-02-25 13:12:40 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-05-06 10:50:47 +02:00
|
|
|
// String unescapes a escaped string (not including `"` at begining and end)
|
|
|
|
// - replace enables replacing invalid utf8 escaped char with `\uffd`
|
|
|
|
func _String(s string, replace bool) (ret string, err error) {
|
|
|
|
mm := make([]byte, 0, len(s))
|
|
|
|
err = intoBytesUnsafe(s, &mm, replace)
|
|
|
|
ret = rt.Mem2Str(mm)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
func intoBytesUnsafe(s string, m *[]byte, replace bool) types.ParsingError {
|
2023-02-25 13:12:40 +01:00
|
|
|
pos := -1
|
|
|
|
slv := (*rt.GoSlice)(unsafe.Pointer(m))
|
|
|
|
str := (*rt.GoString)(unsafe.Pointer(&s))
|
2024-05-06 10:50:47 +02:00
|
|
|
|
|
|
|
flags := uint64(0)
|
|
|
|
if replace {
|
|
|
|
/* unquote as the default configuration, replace invalid unicode with \ufffd */
|
|
|
|
flags |= types.F_UNICODE_REPLACE
|
|
|
|
}
|
|
|
|
|
|
|
|
ret := native.Unquote(str.Ptr, str.Len, slv.Ptr, &pos, flags)
|
2023-02-25 13:12:40 +01:00
|
|
|
|
|
|
|
/* check for errors */
|
|
|
|
if ret < 0 {
|
|
|
|
return types.ParsingError(-ret)
|
|
|
|
}
|
|
|
|
|
|
|
|
/* update the length */
|
|
|
|
slv.Len = ret
|
2023-06-01 23:20:16 +02:00
|
|
|
runtime.KeepAlive(s)
|
2023-02-25 13:12:40 +01:00
|
|
|
return 0
|
|
|
|
}
|
2024-05-06 10:50:47 +02:00
|
|
|
|
|
|
|
|
|
|
|
|