You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

segment.go 14KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572
  1. // Copyright (c) 2017 Couchbase, Inc.
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package zap
  15. import (
  16. "bytes"
  17. "encoding/binary"
  18. "fmt"
  19. "io"
  20. "os"
  21. "sync"
  22. "unsafe"
  23. "github.com/RoaringBitmap/roaring"
  24. "github.com/blevesearch/bleve/index/scorch/segment"
  25. "github.com/blevesearch/bleve/size"
  26. "github.com/couchbase/vellum"
  27. mmap "github.com/blevesearch/mmap-go"
  28. "github.com/golang/snappy"
  29. )
  30. var reflectStaticSizeSegmentBase int
  31. func init() {
  32. var sb SegmentBase
  33. reflectStaticSizeSegmentBase = int(unsafe.Sizeof(sb))
  34. }
  35. // Open returns a zap impl of a segment
  36. func (*ZapPlugin) Open(path string) (segment.Segment, error) {
  37. f, err := os.Open(path)
  38. if err != nil {
  39. return nil, err
  40. }
  41. mm, err := mmap.Map(f, mmap.RDONLY, 0)
  42. if err != nil {
  43. // mmap failed, try to close the file
  44. _ = f.Close()
  45. return nil, err
  46. }
  47. rv := &Segment{
  48. SegmentBase: SegmentBase{
  49. mem: mm[0 : len(mm)-FooterSize],
  50. fieldsMap: make(map[string]uint16),
  51. fieldDvReaders: make(map[uint16]*docValueReader),
  52. fieldFSTs: make(map[uint16]*vellum.FST),
  53. },
  54. f: f,
  55. mm: mm,
  56. path: path,
  57. refs: 1,
  58. }
  59. rv.SegmentBase.updateSize()
  60. err = rv.loadConfig()
  61. if err != nil {
  62. _ = rv.Close()
  63. return nil, err
  64. }
  65. err = rv.loadFields()
  66. if err != nil {
  67. _ = rv.Close()
  68. return nil, err
  69. }
  70. err = rv.loadDvReaders()
  71. if err != nil {
  72. _ = rv.Close()
  73. return nil, err
  74. }
  75. return rv, nil
  76. }
  77. // SegmentBase is a memory only, read-only implementation of the
  78. // segment.Segment interface, using zap's data representation.
  79. type SegmentBase struct {
  80. mem []byte
  81. memCRC uint32
  82. chunkMode uint32
  83. fieldsMap map[string]uint16 // fieldName -> fieldID+1
  84. fieldsInv []string // fieldID -> fieldName
  85. numDocs uint64
  86. storedIndexOffset uint64
  87. fieldsIndexOffset uint64
  88. docValueOffset uint64
  89. dictLocs []uint64
  90. fieldDvReaders map[uint16]*docValueReader // naive chunk cache per field
  91. fieldDvNames []string // field names cached in fieldDvReaders
  92. size uint64
  93. m sync.Mutex
  94. fieldFSTs map[uint16]*vellum.FST
  95. }
  96. func (sb *SegmentBase) Size() int {
  97. return int(sb.size)
  98. }
  99. func (sb *SegmentBase) updateSize() {
  100. sizeInBytes := reflectStaticSizeSegmentBase +
  101. cap(sb.mem)
  102. // fieldsMap
  103. for k := range sb.fieldsMap {
  104. sizeInBytes += (len(k) + size.SizeOfString) + size.SizeOfUint16
  105. }
  106. // fieldsInv, dictLocs
  107. for _, entry := range sb.fieldsInv {
  108. sizeInBytes += len(entry) + size.SizeOfString
  109. }
  110. sizeInBytes += len(sb.dictLocs) * size.SizeOfUint64
  111. // fieldDvReaders
  112. for _, v := range sb.fieldDvReaders {
  113. sizeInBytes += size.SizeOfUint16 + size.SizeOfPtr
  114. if v != nil {
  115. sizeInBytes += v.size()
  116. }
  117. }
  118. sb.size = uint64(sizeInBytes)
  119. }
  120. func (sb *SegmentBase) AddRef() {}
  121. func (sb *SegmentBase) DecRef() (err error) { return nil }
  122. func (sb *SegmentBase) Close() (err error) { return nil }
  123. // Segment implements a persisted segment.Segment interface, by
  124. // embedding an mmap()'ed SegmentBase.
  125. type Segment struct {
  126. SegmentBase
  127. f *os.File
  128. mm mmap.MMap
  129. path string
  130. version uint32
  131. crc uint32
  132. m sync.Mutex // Protects the fields that follow.
  133. refs int64
  134. }
  135. func (s *Segment) Size() int {
  136. // 8 /* size of file pointer */
  137. // 4 /* size of version -> uint32 */
  138. // 4 /* size of crc -> uint32 */
  139. sizeOfUints := 16
  140. sizeInBytes := (len(s.path) + size.SizeOfString) + sizeOfUints
  141. // mutex, refs -> int64
  142. sizeInBytes += 16
  143. // do not include the mmap'ed part
  144. return sizeInBytes + s.SegmentBase.Size() - cap(s.mem)
  145. }
  146. func (s *Segment) AddRef() {
  147. s.m.Lock()
  148. s.refs++
  149. s.m.Unlock()
  150. }
  151. func (s *Segment) DecRef() (err error) {
  152. s.m.Lock()
  153. s.refs--
  154. if s.refs == 0 {
  155. err = s.closeActual()
  156. }
  157. s.m.Unlock()
  158. return err
  159. }
  160. func (s *Segment) loadConfig() error {
  161. crcOffset := len(s.mm) - 4
  162. s.crc = binary.BigEndian.Uint32(s.mm[crcOffset : crcOffset+4])
  163. verOffset := crcOffset - 4
  164. s.version = binary.BigEndian.Uint32(s.mm[verOffset : verOffset+4])
  165. if s.version != Version {
  166. return fmt.Errorf("unsupported version %d", s.version)
  167. }
  168. chunkOffset := verOffset - 4
  169. s.chunkMode = binary.BigEndian.Uint32(s.mm[chunkOffset : chunkOffset+4])
  170. docValueOffset := chunkOffset - 8
  171. s.docValueOffset = binary.BigEndian.Uint64(s.mm[docValueOffset : docValueOffset+8])
  172. fieldsIndexOffset := docValueOffset - 8
  173. s.fieldsIndexOffset = binary.BigEndian.Uint64(s.mm[fieldsIndexOffset : fieldsIndexOffset+8])
  174. storedIndexOffset := fieldsIndexOffset - 8
  175. s.storedIndexOffset = binary.BigEndian.Uint64(s.mm[storedIndexOffset : storedIndexOffset+8])
  176. numDocsOffset := storedIndexOffset - 8
  177. s.numDocs = binary.BigEndian.Uint64(s.mm[numDocsOffset : numDocsOffset+8])
  178. return nil
  179. }
  180. func (s *SegmentBase) loadFields() error {
  181. // NOTE for now we assume the fields index immediately precedes
  182. // the footer, and if this changes, need to adjust accordingly (or
  183. // store explicit length), where s.mem was sliced from s.mm in Open().
  184. fieldsIndexEnd := uint64(len(s.mem))
  185. // iterate through fields index
  186. var fieldID uint64
  187. for s.fieldsIndexOffset+(8*fieldID) < fieldsIndexEnd {
  188. addr := binary.BigEndian.Uint64(s.mem[s.fieldsIndexOffset+(8*fieldID) : s.fieldsIndexOffset+(8*fieldID)+8])
  189. dictLoc, read := binary.Uvarint(s.mem[addr:fieldsIndexEnd])
  190. n := uint64(read)
  191. s.dictLocs = append(s.dictLocs, dictLoc)
  192. var nameLen uint64
  193. nameLen, read = binary.Uvarint(s.mem[addr+n : fieldsIndexEnd])
  194. n += uint64(read)
  195. name := string(s.mem[addr+n : addr+n+nameLen])
  196. s.fieldsInv = append(s.fieldsInv, name)
  197. s.fieldsMap[name] = uint16(fieldID + 1)
  198. fieldID++
  199. }
  200. return nil
  201. }
  202. // Dictionary returns the term dictionary for the specified field
  203. func (s *SegmentBase) Dictionary(field string) (segment.TermDictionary, error) {
  204. dict, err := s.dictionary(field)
  205. if err == nil && dict == nil {
  206. return &segment.EmptyDictionary{}, nil
  207. }
  208. return dict, err
  209. }
  210. func (sb *SegmentBase) dictionary(field string) (rv *Dictionary, err error) {
  211. fieldIDPlus1 := sb.fieldsMap[field]
  212. if fieldIDPlus1 > 0 {
  213. rv = &Dictionary{
  214. sb: sb,
  215. field: field,
  216. fieldID: fieldIDPlus1 - 1,
  217. }
  218. dictStart := sb.dictLocs[rv.fieldID]
  219. if dictStart > 0 {
  220. var ok bool
  221. sb.m.Lock()
  222. if rv.fst, ok = sb.fieldFSTs[rv.fieldID]; !ok {
  223. // read the length of the vellum data
  224. vellumLen, read := binary.Uvarint(sb.mem[dictStart : dictStart+binary.MaxVarintLen64])
  225. fstBytes := sb.mem[dictStart+uint64(read) : dictStart+uint64(read)+vellumLen]
  226. rv.fst, err = vellum.Load(fstBytes)
  227. if err != nil {
  228. sb.m.Unlock()
  229. return nil, fmt.Errorf("dictionary field %s vellum err: %v", field, err)
  230. }
  231. sb.fieldFSTs[rv.fieldID] = rv.fst
  232. }
  233. sb.m.Unlock()
  234. rv.fstReader, err = rv.fst.Reader()
  235. if err != nil {
  236. return nil, fmt.Errorf("dictionary field %s vellum reader err: %v", field, err)
  237. }
  238. }
  239. }
  240. return rv, nil
  241. }
  242. // visitDocumentCtx holds data structures that are reusable across
  243. // multiple VisitDocument() calls to avoid memory allocations
  244. type visitDocumentCtx struct {
  245. buf []byte
  246. reader bytes.Reader
  247. arrayPos []uint64
  248. }
  249. var visitDocumentCtxPool = sync.Pool{
  250. New: func() interface{} {
  251. reuse := &visitDocumentCtx{}
  252. return reuse
  253. },
  254. }
  255. // VisitDocument invokes the DocFieldValueVistor for each stored field
  256. // for the specified doc number
  257. func (s *SegmentBase) VisitDocument(num uint64, visitor segment.DocumentFieldValueVisitor) error {
  258. vdc := visitDocumentCtxPool.Get().(*visitDocumentCtx)
  259. defer visitDocumentCtxPool.Put(vdc)
  260. return s.visitDocument(vdc, num, visitor)
  261. }
  262. func (s *SegmentBase) visitDocument(vdc *visitDocumentCtx, num uint64,
  263. visitor segment.DocumentFieldValueVisitor) error {
  264. // first make sure this is a valid number in this segment
  265. if num < s.numDocs {
  266. meta, compressed := s.getDocStoredMetaAndCompressed(num)
  267. vdc.reader.Reset(meta)
  268. // handle _id field special case
  269. idFieldValLen, err := binary.ReadUvarint(&vdc.reader)
  270. if err != nil {
  271. return err
  272. }
  273. idFieldVal := compressed[:idFieldValLen]
  274. keepGoing := visitor("_id", byte('t'), idFieldVal, nil)
  275. if !keepGoing {
  276. visitDocumentCtxPool.Put(vdc)
  277. return nil
  278. }
  279. // handle non-"_id" fields
  280. compressed = compressed[idFieldValLen:]
  281. uncompressed, err := snappy.Decode(vdc.buf[:cap(vdc.buf)], compressed)
  282. if err != nil {
  283. return err
  284. }
  285. for keepGoing {
  286. field, err := binary.ReadUvarint(&vdc.reader)
  287. if err == io.EOF {
  288. break
  289. }
  290. if err != nil {
  291. return err
  292. }
  293. typ, err := binary.ReadUvarint(&vdc.reader)
  294. if err != nil {
  295. return err
  296. }
  297. offset, err := binary.ReadUvarint(&vdc.reader)
  298. if err != nil {
  299. return err
  300. }
  301. l, err := binary.ReadUvarint(&vdc.reader)
  302. if err != nil {
  303. return err
  304. }
  305. numap, err := binary.ReadUvarint(&vdc.reader)
  306. if err != nil {
  307. return err
  308. }
  309. var arrayPos []uint64
  310. if numap > 0 {
  311. if cap(vdc.arrayPos) < int(numap) {
  312. vdc.arrayPos = make([]uint64, numap)
  313. }
  314. arrayPos = vdc.arrayPos[:numap]
  315. for i := 0; i < int(numap); i++ {
  316. ap, err := binary.ReadUvarint(&vdc.reader)
  317. if err != nil {
  318. return err
  319. }
  320. arrayPos[i] = ap
  321. }
  322. }
  323. value := uncompressed[offset : offset+l]
  324. keepGoing = visitor(s.fieldsInv[field], byte(typ), value, arrayPos)
  325. }
  326. vdc.buf = uncompressed
  327. }
  328. return nil
  329. }
  330. // DocID returns the value of the _id field for the given docNum
  331. func (s *SegmentBase) DocID(num uint64) ([]byte, error) {
  332. if num >= s.numDocs {
  333. return nil, nil
  334. }
  335. vdc := visitDocumentCtxPool.Get().(*visitDocumentCtx)
  336. meta, compressed := s.getDocStoredMetaAndCompressed(num)
  337. vdc.reader.Reset(meta)
  338. // handle _id field special case
  339. idFieldValLen, err := binary.ReadUvarint(&vdc.reader)
  340. if err != nil {
  341. return nil, err
  342. }
  343. idFieldVal := compressed[:idFieldValLen]
  344. visitDocumentCtxPool.Put(vdc)
  345. return idFieldVal, nil
  346. }
  347. // Count returns the number of documents in this segment.
  348. func (s *SegmentBase) Count() uint64 {
  349. return s.numDocs
  350. }
  351. // DocNumbers returns a bitset corresponding to the doc numbers of all the
  352. // provided _id strings
  353. func (s *SegmentBase) DocNumbers(ids []string) (*roaring.Bitmap, error) {
  354. rv := roaring.New()
  355. if len(s.fieldsMap) > 0 {
  356. idDict, err := s.dictionary("_id")
  357. if err != nil {
  358. return nil, err
  359. }
  360. postingsList := emptyPostingsList
  361. sMax, err := idDict.fst.GetMaxKey()
  362. if err != nil {
  363. return nil, err
  364. }
  365. sMaxStr := string(sMax)
  366. filteredIds := make([]string, 0, len(ids))
  367. for _, id := range ids {
  368. if id <= sMaxStr {
  369. filteredIds = append(filteredIds, id)
  370. }
  371. }
  372. for _, id := range filteredIds {
  373. postingsList, err = idDict.postingsList([]byte(id), nil, postingsList)
  374. if err != nil {
  375. return nil, err
  376. }
  377. postingsList.OrInto(rv)
  378. }
  379. }
  380. return rv, nil
  381. }
  382. // Fields returns the field names used in this segment
  383. func (s *SegmentBase) Fields() []string {
  384. return s.fieldsInv
  385. }
  386. // Path returns the path of this segment on disk
  387. func (s *Segment) Path() string {
  388. return s.path
  389. }
  390. // Close releases all resources associated with this segment
  391. func (s *Segment) Close() (err error) {
  392. return s.DecRef()
  393. }
  394. func (s *Segment) closeActual() (err error) {
  395. if s.mm != nil {
  396. err = s.mm.Unmap()
  397. }
  398. // try to close file even if unmap failed
  399. if s.f != nil {
  400. err2 := s.f.Close()
  401. if err == nil {
  402. // try to return first error
  403. err = err2
  404. }
  405. }
  406. return
  407. }
  408. // some helpers i started adding for the command-line utility
  409. // Data returns the underlying mmaped data slice
  410. func (s *Segment) Data() []byte {
  411. return s.mm
  412. }
  413. // CRC returns the CRC value stored in the file footer
  414. func (s *Segment) CRC() uint32 {
  415. return s.crc
  416. }
  417. // Version returns the file version in the file footer
  418. func (s *Segment) Version() uint32 {
  419. return s.version
  420. }
  421. // ChunkFactor returns the chunk factor in the file footer
  422. func (s *Segment) ChunkMode() uint32 {
  423. return s.chunkMode
  424. }
  425. // FieldsIndexOffset returns the fields index offset in the file footer
  426. func (s *Segment) FieldsIndexOffset() uint64 {
  427. return s.fieldsIndexOffset
  428. }
  429. // StoredIndexOffset returns the stored value index offset in the file footer
  430. func (s *Segment) StoredIndexOffset() uint64 {
  431. return s.storedIndexOffset
  432. }
  433. // DocValueOffset returns the docValue offset in the file footer
  434. func (s *Segment) DocValueOffset() uint64 {
  435. return s.docValueOffset
  436. }
  437. // NumDocs returns the number of documents in the file footer
  438. func (s *Segment) NumDocs() uint64 {
  439. return s.numDocs
  440. }
  441. // DictAddr is a helper function to compute the file offset where the
  442. // dictionary is stored for the specified field.
  443. func (s *Segment) DictAddr(field string) (uint64, error) {
  444. fieldIDPlus1, ok := s.fieldsMap[field]
  445. if !ok {
  446. return 0, fmt.Errorf("no such field '%s'", field)
  447. }
  448. return s.dictLocs[fieldIDPlus1-1], nil
  449. }
  450. func (s *SegmentBase) loadDvReaders() error {
  451. if s.docValueOffset == fieldNotUninverted || s.numDocs == 0 {
  452. return nil
  453. }
  454. var read uint64
  455. for fieldID, field := range s.fieldsInv {
  456. var fieldLocStart, fieldLocEnd uint64
  457. var n int
  458. fieldLocStart, n = binary.Uvarint(s.mem[s.docValueOffset+read : s.docValueOffset+read+binary.MaxVarintLen64])
  459. if n <= 0 {
  460. return fmt.Errorf("loadDvReaders: failed to read the docvalue offset start for field %d", fieldID)
  461. }
  462. read += uint64(n)
  463. fieldLocEnd, n = binary.Uvarint(s.mem[s.docValueOffset+read : s.docValueOffset+read+binary.MaxVarintLen64])
  464. if n <= 0 {
  465. return fmt.Errorf("loadDvReaders: failed to read the docvalue offset end for field %d", fieldID)
  466. }
  467. read += uint64(n)
  468. fieldDvReader, err := s.loadFieldDocValueReader(field, fieldLocStart, fieldLocEnd)
  469. if err != nil {
  470. return err
  471. }
  472. if fieldDvReader != nil {
  473. s.fieldDvReaders[uint16(fieldID)] = fieldDvReader
  474. s.fieldDvNames = append(s.fieldDvNames, field)
  475. }
  476. }
  477. return nil
  478. }