document_writer.h 5.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134
  1. /*
  2. * Tencent is pleased to support the open source community by making wwsearch
  3. * available.
  4. *
  5. * Copyright (C) 2018-present Tencent. All Rights Reserved.
  6. *
  7. * Licensed under the Apache License, Version 2.0 (the "License"); you may not
  8. * use this file except in compliance with the License. You may obtain a copy of
  9. * the License at
  10. *
  11. * https://opensource.org/licenses/Apache-2.0
  12. *
  13. * Unless required by applicable law or agreed to in writing, software
  14. * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
  15. * WARRANTIES OF ANY KIND, either express or implied. See the License for the
  16. * specific language governing permissions and limitations under the License.
  17. */
  18. #pragma once
  19. #include "document.h"
  20. #include "index_config.h"
  21. #include "search_status.h"
  22. #include "storage_type.h"
  23. #include "tracer.h"
  24. namespace wwsearch {
  25. using TermFlagPairList = std::map<std::string, unsigned char>;
  26. using TermFlagPairListPtr = std::unique_ptr<TermFlagPairList>;
  27. class DocumentWriter {
  28. private:
  29. IndexConfig* config_;
  30. public:
  31. DocumentWriter();
  32. ~DocumentWriter();
  33. bool SetConfig(IndexConfig* config);
  34. // Update each document pair
  35. // Find the differences between old document and new document.Write document
  36. // to store field ,write inverted term index,write document value...
  37. SearchStatus UpdateDocuments(const TableID& table,
  38. std::vector<DocumentUpdater*>& documents,
  39. std::string* store_buffer,
  40. SearchTracer* tracer = nullptr);
  41. SearchStatus DeleteDocs(const TableID& table,
  42. std::vector<DocumentID>& document_ids,
  43. SearchTracer* tracer = nullptr);
  44. SearchStatus IngestInvertIndex(const TableID& table,
  45. InvertIndexItemList& indices,
  46. std::string* store_buffer,
  47. SearchTracer* tracer = nullptr);
  48. typedef struct AllocSequence {
  49. std::string user_id;
  50. uint64_t sequence;
  51. SearchStatus status;
  52. AllocSequence() { sequence = 0; }
  53. } AllocSequence;
  54. SearchStatus AcquireCurrentSequence(const TableID& table,
  55. uint64_t& current_max,
  56. std::vector<AllocSequence>& sequence_list,
  57. SearchTracer* tracer = nullptr);
  58. SearchStatus AcquireNewSequence(const TableID& table,
  59. std::vector<AllocSequence>& sequence_list,
  60. std::string* store_buffer,
  61. SearchTracer* tracer = nullptr);
  62. SearchStatus DropTable(const TableID& table, std::string* store_buffer,
  63. SearchTracer* tracer = nullptr);
  64. private:
  65. SearchStatus WriteStoredField(const TableID& table,
  66. std::vector<DocumentUpdater*>& documents,
  67. WriteBuffer& write_buffer,
  68. SearchTracer* tracer = nullptr);
  69. SearchStatus WriteDocValue(const TableID& table,
  70. std::vector<DocumentUpdater*>& documents,
  71. WriteBuffer& write_buffer,
  72. SearchTracer* tracer = nullptr);
  73. SearchStatus WriteInvertedIndex(const TableID& table,
  74. std::vector<DocumentUpdater*>& documents,
  75. WriteBuffer& write_buffer,
  76. SearchTracer* tracer = nullptr);
  77. SearchStatus WriteTableMeta(const TableID& table,
  78. std::vector<DocumentUpdater*>& documents,
  79. WriteBuffer& write_buffer,
  80. SearchTracer* tracer = nullptr);
  81. SearchStatus WriteDictionaryMeta(const TableID& table,
  82. std::vector<DocumentUpdater*>& documents,
  83. WriteBuffer& write_buffer,
  84. SearchTracer* tracer = nullptr);
  85. SearchStatus RunTokenizer(std::vector<DocumentUpdater*>& documents,
  86. SearchTracer* tracer = nullptr);
  87. SearchStatus MergeOldField(std::vector<DocumentUpdater*>& documents,
  88. SearchTracer* tracer = nullptr);
  89. void MergeDocvalue(Document& old_docvalue_document,
  90. Document* new_docvalue_document);
  91. SearchStatus WriteStoreFieldForDropTable(const TableID& table,
  92. WriteBuffer& write_buffer,
  93. SearchTracer* tracer = nullptr);
  94. SearchStatus WriteInvertedIndexForDropTable(const TableID& table,
  95. WriteBuffer& write_buffer,
  96. SearchTracer* tracer = nullptr);
  97. SearchStatus WriteDocvalueForDropTable(const TableID& table,
  98. WriteBuffer& write_buffer,
  99. SearchTracer* tracer = nullptr);
  100. SearchStatus WriteTableMetaForDropTable(const TableID& table,
  101. WriteBuffer& write_buffer,
  102. SearchTracer* tracer = nullptr);
  103. SearchStatus WriteDictionaryMetaForDropTable(const TableID& table,
  104. WriteBuffer& write_buffer,
  105. SearchTracer* tracer = nullptr);
  106. };
  107. } // namespace wwsearch