fcache.go 8.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374
  1. /*
  2. * Copyright 2021 ByteDance Inc.
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. package caching
  17. import (
  18. "strings"
  19. "unicode"
  20. "unsafe"
  21. "github.com/bytedance/sonic/internal/envs"
  22. "github.com/bytedance/sonic/internal/native"
  23. "github.com/bytedance/sonic/internal/resolver"
  24. "github.com/bytedance/sonic/internal/rt"
  25. )
  26. const _AlignSize = 32
  27. const _PaddingSize = 32
  28. type FieldLookup interface {
  29. Set(fields []resolver.FieldMeta)
  30. Get(name string, caseSensitive bool) int
  31. }
  32. func isAscii(s string) bool {
  33. for i :=0; i < len(s); i++ {
  34. if s[i] > unicode.MaxASCII {
  35. return false
  36. }
  37. }
  38. return true
  39. }
  40. func NewFieldLookup(fields []resolver.FieldMeta) FieldLookup {
  41. var f FieldLookup
  42. isAsc := true
  43. n := len(fields)
  44. // when field name has non-ascii, use the fallback methods to use strings.ToLower
  45. for _, f := range fields {
  46. if !isAscii(f.Name) {
  47. isAsc = false
  48. break
  49. }
  50. }
  51. if n <= 8 {
  52. f = NewSmallFieldMap(n)
  53. } else if envs.UseFastMap && n <= 128 && isAsc {
  54. f = NewNormalFieldMap(n)
  55. } else {
  56. f = NewFallbackFieldMap(n)
  57. }
  58. f.Set(fields)
  59. return f
  60. }
  61. // Map for keys nums max 8, idx is in [0, 8)
  62. type SmallFieldMap struct {
  63. keys []string
  64. lowerKeys []string
  65. }
  66. func NewSmallFieldMap (hint int) *SmallFieldMap {
  67. return &SmallFieldMap{
  68. keys: make([]string, hint, hint),
  69. lowerKeys: make([]string, hint, hint),
  70. }
  71. }
  72. func (self *SmallFieldMap) Set(fields []resolver.FieldMeta) {
  73. if len(fields) > 8 {
  74. panic("small field map should use in small struct")
  75. }
  76. for i, f := range fields {
  77. self.keys[i] = f.Name
  78. self.lowerKeys[i] = strings.ToLower(f.Name)
  79. }
  80. }
  81. func (self *SmallFieldMap) Get(name string, caseSensitive bool) int {
  82. for i, k := range self.keys {
  83. if len(k) == len(name) && k == name {
  84. return i
  85. }
  86. }
  87. if caseSensitive {
  88. return -1
  89. }
  90. name = strings.ToLower(name)
  91. for i, k := range self.lowerKeys {
  92. if len(k) == len(name) && k == name {
  93. return i
  94. }
  95. }
  96. return -1
  97. }
  98. /*
  99. 1. select by the length: 0 ~ 32 and larger lengths
  100. 2. simd match the aligned prefix of the keys: 4/8/16/32 bytes or larger keys
  101. 3. check the key with strict match
  102. 4. check the key with case-insensitive match
  103. 5. find the index
  104. Mem Layout:
  105. fixed 33 * 5 bytes 165 bytes ||| variable keys ||| variable lowerkeys
  106. | length metadata array[33] ||| key0.0 | u8 | key0.1 | u8 | ... || key1.0 | u8 | key1.1 | u8 | ... ||| lowerkeys info ...
  107. */
  108. // Map for keys nums max 255, idx is in [0, 255), idx 255 means not found.
  109. // keysoffset
  110. // | metadata | aligned key0 | aligned key1 | ... |
  111. // 1 ~ 8
  112. // 8 ~ 16
  113. // 16 ~ 32
  114. // > 32 keys use the long keys entry lists
  115. // use bytes to reduce GC
  116. type NormalFieldMap struct {
  117. keys []byte
  118. longKeys []keyEntry
  119. // offset for lower
  120. lowOffset int
  121. }
  122. type keyEntry struct {
  123. key string
  124. lowerKey string
  125. index uint
  126. }
  127. func NewNormalFieldMap(n int) *NormalFieldMap {
  128. return &NormalFieldMap{
  129. }
  130. }
  131. const _HdrSlot = 33
  132. const _HdrSize = _HdrSlot * 5
  133. // use native SIMD to accelerate it
  134. func (self *NormalFieldMap) Get(name string, caseSensitive bool) int {
  135. // small keys use native C
  136. if len(name) <= 32 {
  137. _ = native.LookupSmallKey
  138. lowOffset := self.lowOffset
  139. if caseSensitive {
  140. lowOffset = -1
  141. }
  142. return native.LookupSmallKey(&name, &self.keys, lowOffset);
  143. }
  144. return self.getLongKey(name, caseSensitive)
  145. }
  146. func (self *NormalFieldMap) getLongKey(name string, caseSensitive bool) int {
  147. for _, k := range self.longKeys {
  148. if len(k.key) != len(name) {
  149. continue;
  150. }
  151. if k.key == name {
  152. return int(k.index)
  153. }
  154. }
  155. if caseSensitive {
  156. return -1
  157. }
  158. lower := strings.ToLower(name)
  159. for _, k := range self.longKeys {
  160. if len(k.key) != len(name) {
  161. continue;
  162. }
  163. if k.lowerKey == lower {
  164. return int(k.index)
  165. }
  166. }
  167. return -1
  168. }
  169. func (self *NormalFieldMap) Getdouble(name string) int {
  170. if len(name) > 32 {
  171. for _, k := range self.longKeys {
  172. if len(k.key) != len(name) {
  173. continue;
  174. }
  175. if k.key == name {
  176. return int(k.index)
  177. }
  178. }
  179. return self.getCaseInsensitive(name)
  180. }
  181. // check the fixed length keys, not found the target length
  182. cnt := int(self.keys[5 * len(name)])
  183. if cnt == 0 {
  184. return -1
  185. }
  186. p := ((*rt.GoSlice)(unsafe.Pointer(&self.keys))).Ptr
  187. offset := int(*(*int32)(unsafe.Pointer(uintptr(p) + uintptr(5 * len(name) + 1)))) + _HdrSize
  188. for i := 0; i < cnt; i++ {
  189. key := rt.Mem2Str(self.keys[offset: offset + len(name)])
  190. if key == name {
  191. return int(self.keys[offset + len(name)])
  192. }
  193. offset += len(name) + 1
  194. }
  195. return self.getCaseInsensitive(name)
  196. }
  197. func (self *NormalFieldMap) getCaseInsensitive(name string) int {
  198. lower := strings.ToLower(name)
  199. if len(name) > 32 {
  200. for _, k := range self.longKeys {
  201. if len(k.key) != len(name) {
  202. continue;
  203. }
  204. if k.lowerKey == lower {
  205. return int(k.index)
  206. }
  207. }
  208. return -1
  209. }
  210. cnt := int(self.keys[5 * len(name)])
  211. p := ((*rt.GoSlice)(unsafe.Pointer(&self.keys))).Ptr
  212. offset := int(*(*int32)(unsafe.Pointer(uintptr(p) + uintptr(5 * len(name) + 1)))) + self.lowOffset
  213. for i := 0; i < cnt; i++ {
  214. key := rt.Mem2Str(self.keys[offset: offset + len(name)])
  215. if key == lower {
  216. return int(self.keys[offset + len(name)])
  217. }
  218. offset += len(name) + 1
  219. }
  220. return -1
  221. }
  222. type keysInfo struct {
  223. counts int
  224. lenSum int
  225. offset int
  226. cur int
  227. }
  228. func (self *NormalFieldMap) Set(fields []resolver.FieldMeta) {
  229. if len(fields) <=8 || len(fields) > 128 {
  230. panic("normal field map should use in small struct")
  231. }
  232. // allocate the flat map in []byte
  233. var keyLenSum [_HdrSlot]keysInfo
  234. for i := 0; i < _HdrSlot; i++ {
  235. keyLenSum[i].offset = 0
  236. keyLenSum[i].counts = 0
  237. keyLenSum[i].lenSum = 0
  238. keyLenSum[i].cur = 0
  239. }
  240. kvLen := 0
  241. for _, f := range(fields) {
  242. len := len(f.Name)
  243. if len <= 32 {
  244. kvLen += len + 1 // key + index
  245. keyLenSum[len].counts++
  246. keyLenSum[len].lenSum += len + 1
  247. }
  248. }
  249. // add a padding size at last to make it friendly for SIMD.
  250. self.keys = make([]byte, _HdrSize + 2 * kvLen, _HdrSize + 2 * kvLen + _PaddingSize)
  251. self.lowOffset = _HdrSize + kvLen
  252. // initialize all keys offset
  253. self.keys[0] = byte(keyLenSum[0].counts)
  254. // self.keys[1:5] = 0 // offset is always zero here.
  255. i := 1
  256. p := ((*rt.GoSlice)(unsafe.Pointer(&self.keys))).Ptr
  257. for i < _HdrSlot {
  258. keyLenSum[i].offset = keyLenSum[i-1].offset + keyLenSum[i-1].lenSum
  259. self.keys[i * 5] = byte(keyLenSum[i].counts)
  260. // write the offset into []byte
  261. *(*int32)(unsafe.Pointer(uintptr(p) + uintptr(i * 5 + 1))) = int32(keyLenSum[i].offset)
  262. i += 1
  263. }
  264. // fill the key into bytes
  265. for i, f := range(fields) {
  266. len := len(f.Name)
  267. if len <= 32 {
  268. offset := keyLenSum[len].offset + keyLenSum[len].cur
  269. copy(self.keys[_HdrSize + offset: ], f.Name)
  270. copy(self.keys[self.lowOffset + offset: ], strings.ToLower(f.Name))
  271. self.keys[_HdrSize + offset + len] = byte(i)
  272. self.keys[self.lowOffset + offset + len] = byte(i)
  273. keyLenSum[len].cur += len + 1
  274. } else {
  275. self.longKeys = append(self.longKeys, keyEntry{f.Name, strings.ToLower(f.Name), uint(i)})
  276. }
  277. }
  278. }
  279. // use hashnap
  280. type FallbackFieldMap struct {
  281. oders []string
  282. inner map[string]int
  283. backup map[string]int
  284. }
  285. func NewFallbackFieldMap(n int) *FallbackFieldMap {
  286. return &FallbackFieldMap{
  287. oders: make([]string, n, n),
  288. inner: make(map[string]int, n*2),
  289. backup: make(map[string]int, n*2),
  290. }
  291. }
  292. func (self *FallbackFieldMap) Get(name string, caseSensitive bool) int {
  293. if i, ok := self.inner[name]; ok {
  294. return i
  295. } else if !caseSensitive {
  296. return self.getCaseInsensitive(name)
  297. } else {
  298. return -1
  299. }
  300. }
  301. func (self *FallbackFieldMap) Set(fields []resolver.FieldMeta) {
  302. for i, f := range(fields) {
  303. name := f.Name
  304. self.oders[i] = name
  305. self.inner[name] = i
  306. /* add the case-insensitive version, prefer the one with smaller field ID */
  307. key := strings.ToLower(name)
  308. if v, ok := self.backup[key]; !ok || i < v {
  309. self.backup[key] = i
  310. }
  311. }
  312. }
  313. func (self *FallbackFieldMap) getCaseInsensitive(name string) int {
  314. if i, ok := self.backup[strings.ToLower(name)]; ok {
  315. return i
  316. } else {
  317. return -1
  318. }
  319. }