30d706c35e
* p2p/discover, p2p/discv5: add marshaling methods to Node * p2p/netutil: make Netlist decodable from TOML * common/math: encode nil HexOrDecimal256 as 0x0 * cmd/geth: add --config file flag * cmd/geth: add missing license header * eth: prettify Config again, fix tests * eth: use gasprice.Config instead of duplicating its fields * eth/gasprice: hide nil default from dumpconfig output * cmd/geth: hide genesis block in dumpconfig output * node: make tests compile * console: fix tests * cmd/geth: make TOML keys look exactly like Go struct fields * p2p: use discovery by default This makes the zero Config slightly more useful. It also fixes package node tests because Node detects reuse of the datadir through the NodeDatabase. * cmd/geth: make ethstats URL settable through config file * cmd/faucet: fix configuration * cmd/geth: dedup attach tests * eth: add comment for DefaultConfig * eth: pass downloader.SyncMode in Config This removes the FastSync, LightSync flags in favour of a more general SyncMode flag. * cmd/utils: remove jitvm flags * cmd/utils: make mutually exclusive flag error prettier It now reads: Fatal: flags --dev, --testnet can't be used at the same time * p2p: fix typo * node: add DefaultConfig, use it for geth * mobile: add missing NoDiscovery option * cmd/utils: drop MakeNode This exposed a couple of places that needed to be updated to use node.DefaultConfig. * node: fix typo * eth: make fast sync the default mode * cmd/utils: remove IPCApiFlag (unused) * node: remove default IPC path Set it in the frontends instead. * cmd/geth: add --syncmode * cmd/utils: make --ipcdisable and --ipcpath mutually exclusive * cmd/utils: don't enable WS, HTTP when setting addr * cmd/utils: fix --identity
321 lines
8.0 KiB
Go
321 lines
8.0 KiB
Go
package stringutil
|
|
|
|
import (
|
|
"sync"
|
|
"unicode"
|
|
"unicode/utf8"
|
|
)
|
|
|
|
var (
|
|
mu sync.Mutex
|
|
|
|
// Based on https://github.com/golang/lint/blob/32a87160691b3c96046c0c678fe57c5bef761456/lint.go#L702
|
|
commonInitialismMap = map[string]struct{}{
|
|
"API": struct{}{},
|
|
"ASCII": struct{}{},
|
|
"CPU": struct{}{},
|
|
"CSRF": struct{}{},
|
|
"CSS": struct{}{},
|
|
"DNS": struct{}{},
|
|
"EOF": struct{}{},
|
|
"GUID": struct{}{},
|
|
"HTML": struct{}{},
|
|
"HTTP": struct{}{},
|
|
"HTTPS": struct{}{},
|
|
"ID": struct{}{},
|
|
"IP": struct{}{},
|
|
"JSON": struct{}{},
|
|
"LHS": struct{}{},
|
|
"QPS": struct{}{},
|
|
"RAM": struct{}{},
|
|
"RHS": struct{}{},
|
|
"RPC": struct{}{},
|
|
"SLA": struct{}{},
|
|
"SMTP": struct{}{},
|
|
"SQL": struct{}{},
|
|
"SSH": struct{}{},
|
|
"TCP": struct{}{},
|
|
"TLS": struct{}{},
|
|
"TTL": struct{}{},
|
|
"UDP": struct{}{},
|
|
"UI": struct{}{},
|
|
"UID": struct{}{},
|
|
"UUID": struct{}{},
|
|
"URI": struct{}{},
|
|
"URL": struct{}{},
|
|
"UTF8": struct{}{},
|
|
"VM": struct{}{},
|
|
"XML": struct{}{},
|
|
"XSRF": struct{}{},
|
|
"XSS": struct{}{},
|
|
}
|
|
commonInitialisms = keys(commonInitialismMap)
|
|
commonInitialism = mustDoubleArray(newDoubleArray(commonInitialisms))
|
|
longestLen = longestLength(commonInitialisms)
|
|
shortestLen = shortestLength(commonInitialisms, longestLen)
|
|
)
|
|
|
|
// ToUpperCamelCase returns a copy of the string s with all Unicode letters mapped to their camel case.
|
|
// It will convert to upper case previous letter of '_' and first letter, and remove letter of '_'.
|
|
func ToUpperCamelCase(s string) string {
|
|
if s == "" {
|
|
return ""
|
|
}
|
|
upper := true
|
|
start := 0
|
|
result := make([]byte, 0, len(s))
|
|
var runeBuf [utf8.UTFMax]byte
|
|
var initialism []byte
|
|
for _, c := range s {
|
|
if c == '_' {
|
|
upper = true
|
|
candidate := string(result[start:])
|
|
initialism = initialism[:0]
|
|
for _, r := range candidate {
|
|
if r < utf8.RuneSelf {
|
|
initialism = append(initialism, toUpperASCII(byte(r)))
|
|
} else {
|
|
n := utf8.EncodeRune(runeBuf[:], unicode.ToUpper(r))
|
|
initialism = append(initialism, runeBuf[:n]...)
|
|
}
|
|
}
|
|
if length := commonInitialism.LookupByBytes(initialism); length > 0 {
|
|
result = append(result[:start], initialism...)
|
|
}
|
|
start = len(result)
|
|
continue
|
|
}
|
|
if upper {
|
|
if c < utf8.RuneSelf {
|
|
result = append(result, toUpperASCII(byte(c)))
|
|
} else {
|
|
n := utf8.EncodeRune(runeBuf[:], unicode.ToUpper(c))
|
|
result = append(result, runeBuf[:n]...)
|
|
}
|
|
upper = false
|
|
continue
|
|
}
|
|
if c < utf8.RuneSelf {
|
|
result = append(result, byte(c))
|
|
} else {
|
|
n := utf8.EncodeRune(runeBuf[:], c)
|
|
result = append(result, runeBuf[:n]...)
|
|
}
|
|
}
|
|
candidate := string(result[start:])
|
|
initialism = initialism[:0]
|
|
for _, r := range candidate {
|
|
if r < utf8.RuneSelf {
|
|
initialism = append(initialism, toUpperASCII(byte(r)))
|
|
} else {
|
|
n := utf8.EncodeRune(runeBuf[:], unicode.ToUpper(r))
|
|
initialism = append(initialism, runeBuf[:n]...)
|
|
}
|
|
}
|
|
if length := commonInitialism.LookupByBytes(initialism); length > 0 {
|
|
result = append(result[:start], initialism...)
|
|
}
|
|
return string(result)
|
|
}
|
|
|
|
// ToUpperCamelCaseASCII is similar to ToUpperCamelCase, but optimized for
|
|
// only the ASCII characters.
|
|
// ToUpperCamelCaseASCII is faster than ToUpperCamelCase, but doesn't work if
|
|
// contains non-ASCII characters.
|
|
func ToUpperCamelCaseASCII(s string) string {
|
|
if s == "" {
|
|
return ""
|
|
}
|
|
upper := true
|
|
start := 0
|
|
result := make([]byte, 0, len(s))
|
|
var initialism []byte
|
|
for i := 0; i < len(s); i++ {
|
|
c := s[i]
|
|
if c == '_' {
|
|
upper = true
|
|
candidate := result[start:]
|
|
initialism = initialism[:0]
|
|
for _, b := range candidate {
|
|
initialism = append(initialism, toUpperASCII(b))
|
|
}
|
|
if length := commonInitialism.LookupByBytes(initialism); length > 0 {
|
|
result = append(result[:start], initialism...)
|
|
}
|
|
start = len(result)
|
|
continue
|
|
}
|
|
if upper {
|
|
result = append(result, toUpperASCII(c))
|
|
upper = false
|
|
continue
|
|
}
|
|
result = append(result, c)
|
|
}
|
|
candidate := result[start:]
|
|
initialism = initialism[:0]
|
|
for _, b := range candidate {
|
|
initialism = append(initialism, toUpperASCII(b))
|
|
}
|
|
if length := commonInitialism.LookupByBytes(initialism); length > 0 {
|
|
result = append(result[:start], initialism...)
|
|
}
|
|
return string(result)
|
|
}
|
|
|
|
// ToSnakeCase returns a copy of the string s with all Unicode letters mapped to their snake case.
|
|
// It will insert letter of '_' at position of previous letter of uppercase and all
|
|
// letters convert to lower case.
|
|
// ToSnakeCase does not insert '_' letter into a common initialism word like ID, URL and so on.
|
|
func ToSnakeCase(s string) string {
|
|
if s == "" {
|
|
return ""
|
|
}
|
|
result := make([]byte, 0, len(s))
|
|
var runeBuf [utf8.UTFMax]byte
|
|
var j, skipCount int
|
|
for i, c := range s {
|
|
if i < skipCount {
|
|
continue
|
|
}
|
|
if unicode.IsUpper(c) {
|
|
if i != 0 {
|
|
result = append(result, '_')
|
|
}
|
|
next := nextIndex(j, len(s))
|
|
if length := commonInitialism.Lookup(s[j:next]); length > 0 {
|
|
for _, r := range s[j : j+length] {
|
|
if r < utf8.RuneSelf {
|
|
result = append(result, toLowerASCII(byte(r)))
|
|
} else {
|
|
n := utf8.EncodeRune(runeBuf[:], unicode.ToLower(r))
|
|
result = append(result, runeBuf[:n]...)
|
|
}
|
|
}
|
|
j += length - 1
|
|
skipCount = i + length
|
|
continue
|
|
}
|
|
}
|
|
if c < utf8.RuneSelf {
|
|
result = append(result, toLowerASCII(byte(c)))
|
|
} else {
|
|
n := utf8.EncodeRune(runeBuf[:], unicode.ToLower(c))
|
|
result = append(result, runeBuf[:n]...)
|
|
}
|
|
j++
|
|
}
|
|
return string(result)
|
|
}
|
|
|
|
// ToSnakeCaseASCII is similar to ToSnakeCase, but optimized for only the ASCII
|
|
// characters.
|
|
// ToSnakeCaseASCII is faster than ToSnakeCase, but doesn't work correctly if
|
|
// contains non-ASCII characters.
|
|
func ToSnakeCaseASCII(s string) string {
|
|
if s == "" {
|
|
return ""
|
|
}
|
|
result := make([]byte, 0, len(s))
|
|
for i := 0; i < len(s); i++ {
|
|
c := s[i]
|
|
if isUpperASCII(c) {
|
|
if i != 0 {
|
|
result = append(result, '_')
|
|
}
|
|
if k := i + shortestLen - 1; k < len(s) && isUpperASCII(s[k]) {
|
|
if length := commonInitialism.Lookup(s[i:nextIndex(i, len(s))]); length > 0 {
|
|
for j, buf := 0, s[i:i+length]; j < len(buf); j++ {
|
|
result = append(result, toLowerASCII(buf[j]))
|
|
}
|
|
i += length - 1
|
|
continue
|
|
}
|
|
}
|
|
}
|
|
result = append(result, toLowerASCII(c))
|
|
}
|
|
return string(result)
|
|
}
|
|
|
|
// AddCommonInitialism adds ss to list of common initialisms.
|
|
func AddCommonInitialism(ss ...string) {
|
|
mu.Lock()
|
|
defer mu.Unlock()
|
|
for _, s := range ss {
|
|
commonInitialismMap[s] = struct{}{}
|
|
}
|
|
commonInitialisms = keys(commonInitialismMap)
|
|
commonInitialism = mustDoubleArray(newDoubleArray(commonInitialisms))
|
|
longestLen = longestLength(commonInitialisms)
|
|
shortestLen = shortestLength(commonInitialisms, longestLen)
|
|
}
|
|
|
|
// DelCommonInitialism deletes ss from list of common initialisms.
|
|
func DelCommonInitialism(ss ...string) {
|
|
mu.Lock()
|
|
defer mu.Unlock()
|
|
for _, s := range ss {
|
|
delete(commonInitialismMap, s)
|
|
}
|
|
commonInitialisms = keys(commonInitialismMap)
|
|
commonInitialism = mustDoubleArray(newDoubleArray(commonInitialisms))
|
|
longestLen = longestLength(commonInitialisms)
|
|
shortestLen = shortestLength(commonInitialisms, longestLen)
|
|
}
|
|
|
|
// isUpperASCII reports whether c is an ASCII upper-case letter ('A'..'Z').
func isUpperASCII(c byte) bool {
	return c >= 'A' && c <= 'Z'
}
|
|
|
|
// isLowerASCII reports whether c is an ASCII lower-case letter ('a'..'z').
func isLowerASCII(c byte) bool {
	return c >= 'a' && c <= 'z'
}
|
|
|
|
func toUpperASCII(c byte) byte {
|
|
if isLowerASCII(c) {
|
|
return c - ('a' - 'A')
|
|
}
|
|
return c
|
|
}
|
|
|
|
func toLowerASCII(c byte) byte {
|
|
if isUpperASCII(c) {
|
|
return c + 'a' - 'A'
|
|
}
|
|
return c
|
|
}
|
|
|
|
func nextIndex(i, maxlen int) int {
|
|
if n := i + longestLen; n < maxlen {
|
|
return n
|
|
}
|
|
return maxlen
|
|
}
|
|
|
|
// keys returns the keys of m as a new slice. The order of the result follows
// map iteration order and is therefore unspecified.
func keys(m map[string]struct{}) []string {
	out := make([]string, len(m))
	i := 0
	for k := range m {
		out[i] = k
		i++
	}
	return out
}
|
|
|
|
// shortestLength returns the smallest rune count among strs, or shortest
// itself when no string in strs has fewer runes than that. The shortest
// argument therefore acts as the starting upper bound.
func shortestLength(strs []string, shortest int) int {
	for i := range strs {
		n := utf8.RuneCountInString(strs[i])
		if n < shortest {
			shortest = n
		}
	}
	return shortest
}
|
|
|
|
// longestLength returns the largest rune count among strs, or 0 when strs is
// empty.
func longestLength(strs []string) (longest int) {
	for i := range strs {
		n := utf8.RuneCountInString(strs[i])
		if n > longest {
			longest = n
		}
	}
	return longest
}
|