plain_table_db_test.cc 47 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375
  1. // Copyright (c) 2011-present, Facebook, Inc. All rights reserved.
  2. // This source code is licensed under both the GPLv2 (found in the
  3. // COPYING file in the root directory) and Apache 2.0 License
  4. // (found in the LICENSE.Apache file in the root directory).
  5. //
  6. // Copyright (c) 2011 The LevelDB Authors. All rights reserved.
  7. // Use of this source code is governed by a BSD-style license that can be
  8. // found in the LICENSE file. See the AUTHORS file for names of contributors.
  9. #ifndef ROCKSDB_LITE
  10. #include <algorithm>
  11. #include <set>
  12. #include "db/db_impl/db_impl.h"
  13. #include "db/version_set.h"
  14. #include "db/write_batch_internal.h"
  15. #include "file/filename.h"
  16. #include "logging/logging.h"
  17. #include "rocksdb/cache.h"
  18. #include "rocksdb/compaction_filter.h"
  19. #include "rocksdb/db.h"
  20. #include "rocksdb/env.h"
  21. #include "rocksdb/filter_policy.h"
  22. #include "rocksdb/slice_transform.h"
  23. #include "rocksdb/table.h"
  24. #include "table/meta_blocks.h"
  25. #include "table/plain/plain_table_bloom.h"
  26. #include "table/plain/plain_table_factory.h"
  27. #include "table/plain/plain_table_key_coding.h"
  28. #include "table/plain/plain_table_reader.h"
  29. #include "table/table_builder.h"
  30. #include "test_util/testharness.h"
  31. #include "test_util/testutil.h"
  32. #include "util/hash.h"
  33. #include "util/mutexlock.h"
  34. #include "util/string_util.h"
  35. #include "utilities/merge_operators.h"
  36. using std::unique_ptr;
  37. namespace ROCKSDB_NAMESPACE {
  38. class PlainTableKeyDecoderTest : public testing::Test {};
  39. TEST_F(PlainTableKeyDecoderTest, ReadNonMmap) {
  40. std::string tmp;
  41. Random rnd(301);
  42. const uint32_t kLength = 2222;
  43. Slice contents = test::RandomString(&rnd, kLength, &tmp);
  44. test::StringSource* string_source =
  45. new test::StringSource(contents, 0, false);
  46. std::unique_ptr<RandomAccessFileReader> file_reader(
  47. test::GetRandomAccessFileReader(string_source));
  48. std::unique_ptr<PlainTableReaderFileInfo> file_info(
  49. new PlainTableReaderFileInfo(std::move(file_reader), EnvOptions(),
  50. kLength));
  51. {
  52. PlainTableFileReader reader(file_info.get());
  53. const uint32_t kReadSize = 77;
  54. for (uint32_t pos = 0; pos < kLength; pos += kReadSize) {
  55. uint32_t read_size = std::min(kLength - pos, kReadSize);
  56. Slice out;
  57. ASSERT_TRUE(reader.Read(pos, read_size, &out));
  58. ASSERT_EQ(0, out.compare(tmp.substr(pos, read_size)));
  59. }
  60. ASSERT_LT(uint32_t(string_source->total_reads()), kLength / kReadSize / 2);
  61. }
  62. std::vector<std::vector<std::pair<uint32_t, uint32_t>>> reads = {
  63. {{600, 30}, {590, 30}, {600, 20}, {600, 40}},
  64. {{800, 20}, {100, 20}, {500, 20}, {1500, 20}, {100, 20}, {80, 20}},
  65. {{1000, 20}, {500, 20}, {1000, 50}},
  66. {{1000, 20}, {500, 20}, {500, 20}},
  67. {{1000, 20}, {500, 20}, {200, 20}, {500, 20}},
  68. {{1000, 20}, {500, 20}, {200, 20}, {1000, 50}},
  69. {{600, 500}, {610, 20}, {100, 20}},
  70. {{500, 100}, {490, 100}, {550, 50}},
  71. };
  72. std::vector<int> num_file_reads = {2, 6, 2, 2, 4, 3, 2, 2};
  73. for (size_t i = 0; i < reads.size(); i++) {
  74. string_source->set_total_reads(0);
  75. PlainTableFileReader reader(file_info.get());
  76. for (auto p : reads[i]) {
  77. Slice out;
  78. ASSERT_TRUE(reader.Read(p.first, p.second, &out));
  79. ASSERT_EQ(0, out.compare(tmp.substr(p.first, p.second)));
  80. }
  81. ASSERT_EQ(num_file_reads[i], string_source->total_reads());
  82. }
  83. }
  84. class PlainTableDBTest : public testing::Test,
  85. public testing::WithParamInterface<bool> {
  86. protected:
  87. private:
  88. std::string dbname_;
  89. Env* env_;
  90. DB* db_;
  91. bool mmap_mode_;
  92. Options last_options_;
  93. public:
  94. PlainTableDBTest() : env_(Env::Default()) {}
  95. ~PlainTableDBTest() override {
  96. delete db_;
  97. EXPECT_OK(DestroyDB(dbname_, Options()));
  98. }
  99. void SetUp() override {
  100. mmap_mode_ = GetParam();
  101. dbname_ = test::PerThreadDBPath("plain_table_db_test");
  102. EXPECT_OK(DestroyDB(dbname_, Options()));
  103. db_ = nullptr;
  104. Reopen();
  105. }
  106. // Return the current option configuration.
  107. Options CurrentOptions() {
  108. Options options;
  109. PlainTableOptions plain_table_options;
  110. plain_table_options.user_key_len = 0;
  111. plain_table_options.bloom_bits_per_key = 2;
  112. plain_table_options.hash_table_ratio = 0.8;
  113. plain_table_options.index_sparseness = 3;
  114. plain_table_options.huge_page_tlb_size = 0;
  115. plain_table_options.encoding_type = kPrefix;
  116. plain_table_options.full_scan_mode = false;
  117. plain_table_options.store_index_in_file = false;
  118. options.table_factory.reset(NewPlainTableFactory(plain_table_options));
  119. options.memtable_factory.reset(NewHashLinkListRepFactory(4, 0, 3, true));
  120. options.prefix_extractor.reset(NewFixedPrefixTransform(8));
  121. options.allow_mmap_reads = mmap_mode_;
  122. options.allow_concurrent_memtable_write = false;
  123. options.unordered_write = false;
  124. return options;
  125. }
  126. DBImpl* dbfull() {
  127. return reinterpret_cast<DBImpl*>(db_);
  128. }
  129. void Reopen(Options* options = nullptr) {
  130. ASSERT_OK(TryReopen(options));
  131. }
  132. void Close() {
  133. delete db_;
  134. db_ = nullptr;
  135. }
  136. bool mmap_mode() const { return mmap_mode_; }
  137. void DestroyAndReopen(Options* options = nullptr) {
  138. //Destroy using last options
  139. Destroy(&last_options_);
  140. ASSERT_OK(TryReopen(options));
  141. }
  142. void Destroy(Options* options) {
  143. delete db_;
  144. db_ = nullptr;
  145. ASSERT_OK(DestroyDB(dbname_, *options));
  146. }
  147. Status PureReopen(Options* options, DB** db) {
  148. return DB::Open(*options, dbname_, db);
  149. }
  150. Status ReopenForReadOnly(Options* options) {
  151. delete db_;
  152. db_ = nullptr;
  153. return DB::OpenForReadOnly(*options, dbname_, &db_);
  154. }
  155. Status TryReopen(Options* options = nullptr) {
  156. delete db_;
  157. db_ = nullptr;
  158. Options opts;
  159. if (options != nullptr) {
  160. opts = *options;
  161. } else {
  162. opts = CurrentOptions();
  163. opts.create_if_missing = true;
  164. }
  165. last_options_ = opts;
  166. return DB::Open(opts, dbname_, &db_);
  167. }
  168. Status Put(const Slice& k, const Slice& v) {
  169. return db_->Put(WriteOptions(), k, v);
  170. }
  171. Status Delete(const std::string& k) {
  172. return db_->Delete(WriteOptions(), k);
  173. }
  174. std::string Get(const std::string& k, const Snapshot* snapshot = nullptr) {
  175. ReadOptions options;
  176. options.snapshot = snapshot;
  177. std::string result;
  178. Status s = db_->Get(options, k, &result);
  179. if (s.IsNotFound()) {
  180. result = "NOT_FOUND";
  181. } else if (!s.ok()) {
  182. result = s.ToString();
  183. }
  184. return result;
  185. }
  186. int NumTableFilesAtLevel(int level) {
  187. std::string property;
  188. EXPECT_TRUE(db_->GetProperty(
  189. "rocksdb.num-files-at-level" + NumberToString(level), &property));
  190. return atoi(property.c_str());
  191. }
  192. // Return spread of files per level
  193. std::string FilesPerLevel() {
  194. std::string result;
  195. size_t last_non_zero_offset = 0;
  196. for (int level = 0; level < db_->NumberLevels(); level++) {
  197. int f = NumTableFilesAtLevel(level);
  198. char buf[100];
  199. snprintf(buf, sizeof(buf), "%s%d", (level ? "," : ""), f);
  200. result += buf;
  201. if (f > 0) {
  202. last_non_zero_offset = result.size();
  203. }
  204. }
  205. result.resize(last_non_zero_offset);
  206. return result;
  207. }
  208. std::string IterStatus(Iterator* iter) {
  209. std::string result;
  210. if (iter->Valid()) {
  211. result = iter->key().ToString() + "->" + iter->value().ToString();
  212. } else {
  213. result = "(invalid)";
  214. }
  215. return result;
  216. }
  217. };
  218. TEST_P(PlainTableDBTest, Empty) {
  219. ASSERT_TRUE(dbfull() != nullptr);
  220. ASSERT_EQ("NOT_FOUND", Get("0000000000000foo"));
  221. }
  222. extern const uint64_t kPlainTableMagicNumber;
  223. class TestPlainTableReader : public PlainTableReader {
  224. public:
  225. TestPlainTableReader(const EnvOptions& env_options,
  226. const InternalKeyComparator& icomparator,
  227. EncodingType encoding_type, uint64_t file_size,
  228. int bloom_bits_per_key, double hash_table_ratio,
  229. size_t index_sparseness,
  230. const TableProperties* table_properties,
  231. std::unique_ptr<RandomAccessFileReader>&& file,
  232. const ImmutableCFOptions& ioptions,
  233. const SliceTransform* prefix_extractor,
  234. bool* expect_bloom_not_match, bool store_index_in_file,
  235. uint32_t column_family_id,
  236. const std::string& column_family_name)
  237. : PlainTableReader(ioptions, std::move(file), env_options, icomparator,
  238. encoding_type, file_size, table_properties,
  239. prefix_extractor),
  240. expect_bloom_not_match_(expect_bloom_not_match) {
  241. Status s = MmapDataIfNeeded();
  242. EXPECT_TRUE(s.ok());
  243. s = PopulateIndex(const_cast<TableProperties*>(table_properties),
  244. bloom_bits_per_key, hash_table_ratio, index_sparseness,
  245. 2 * 1024 * 1024);
  246. EXPECT_TRUE(s.ok());
  247. TableProperties* props = const_cast<TableProperties*>(table_properties);
  248. EXPECT_EQ(column_family_id, static_cast<uint32_t>(props->column_family_id));
  249. EXPECT_EQ(column_family_name, props->column_family_name);
  250. if (store_index_in_file) {
  251. auto bloom_version_ptr = props->user_collected_properties.find(
  252. PlainTablePropertyNames::kBloomVersion);
  253. EXPECT_TRUE(bloom_version_ptr != props->user_collected_properties.end());
  254. EXPECT_EQ(bloom_version_ptr->second, std::string("1"));
  255. if (ioptions.bloom_locality > 0) {
  256. auto num_blocks_ptr = props->user_collected_properties.find(
  257. PlainTablePropertyNames::kNumBloomBlocks);
  258. EXPECT_TRUE(num_blocks_ptr != props->user_collected_properties.end());
  259. }
  260. }
  261. table_properties_.reset(props);
  262. }
  263. ~TestPlainTableReader() override {}
  264. private:
  265. bool MatchBloom(uint32_t hash) const override {
  266. bool ret = PlainTableReader::MatchBloom(hash);
  267. if (*expect_bloom_not_match_) {
  268. EXPECT_TRUE(!ret);
  269. } else {
  270. EXPECT_TRUE(ret);
  271. }
  272. return ret;
  273. }
  274. bool* expect_bloom_not_match_;
  275. };
  276. extern const uint64_t kPlainTableMagicNumber;
  277. class TestPlainTableFactory : public PlainTableFactory {
  278. public:
  279. explicit TestPlainTableFactory(bool* expect_bloom_not_match,
  280. const PlainTableOptions& options,
  281. uint32_t column_family_id,
  282. std::string column_family_name)
  283. : PlainTableFactory(options),
  284. bloom_bits_per_key_(options.bloom_bits_per_key),
  285. hash_table_ratio_(options.hash_table_ratio),
  286. index_sparseness_(options.index_sparseness),
  287. store_index_in_file_(options.store_index_in_file),
  288. expect_bloom_not_match_(expect_bloom_not_match),
  289. column_family_id_(column_family_id),
  290. column_family_name_(std::move(column_family_name)) {}
  291. Status NewTableReader(
  292. const TableReaderOptions& table_reader_options,
  293. std::unique_ptr<RandomAccessFileReader>&& file, uint64_t file_size,
  294. std::unique_ptr<TableReader>* table,
  295. bool /*prefetch_index_and_filter_in_cache*/) const override {
  296. TableProperties* props = nullptr;
  297. auto s =
  298. ReadTableProperties(file.get(), file_size, kPlainTableMagicNumber,
  299. table_reader_options.ioptions, &props,
  300. true /* compression_type_missing */);
  301. EXPECT_TRUE(s.ok());
  302. if (store_index_in_file_) {
  303. BlockHandle bloom_block_handle;
  304. s = FindMetaBlock(file.get(), file_size, kPlainTableMagicNumber,
  305. table_reader_options.ioptions,
  306. BloomBlockBuilder::kBloomBlock, &bloom_block_handle,
  307. /* compression_type_missing */ true);
  308. EXPECT_TRUE(s.ok());
  309. BlockHandle index_block_handle;
  310. s = FindMetaBlock(file.get(), file_size, kPlainTableMagicNumber,
  311. table_reader_options.ioptions,
  312. PlainTableIndexBuilder::kPlainTableIndexBlock,
  313. &index_block_handle, /* compression_type_missing */ true);
  314. EXPECT_TRUE(s.ok());
  315. }
  316. auto& user_props = props->user_collected_properties;
  317. auto encoding_type_prop =
  318. user_props.find(PlainTablePropertyNames::kEncodingType);
  319. assert(encoding_type_prop != user_props.end());
  320. EncodingType encoding_type = static_cast<EncodingType>(
  321. DecodeFixed32(encoding_type_prop->second.c_str()));
  322. std::unique_ptr<PlainTableReader> new_reader(new TestPlainTableReader(
  323. table_reader_options.env_options,
  324. table_reader_options.internal_comparator, encoding_type, file_size,
  325. bloom_bits_per_key_, hash_table_ratio_, index_sparseness_, props,
  326. std::move(file), table_reader_options.ioptions,
  327. table_reader_options.prefix_extractor, expect_bloom_not_match_,
  328. store_index_in_file_, column_family_id_, column_family_name_));
  329. *table = std::move(new_reader);
  330. return s;
  331. }
  332. private:
  333. int bloom_bits_per_key_;
  334. double hash_table_ratio_;
  335. size_t index_sparseness_;
  336. bool store_index_in_file_;
  337. bool* expect_bloom_not_match_;
  338. const uint32_t column_family_id_;
  339. const std::string column_family_name_;
  340. };
  341. TEST_P(PlainTableDBTest, BadOptions1) {
  342. // Build with a prefix extractor
  343. ASSERT_OK(Put("1000000000000foo", "v1"));
  344. dbfull()->TEST_FlushMemTable();
  345. // Bad attempt to re-open without a prefix extractor
  346. Options options = CurrentOptions();
  347. options.prefix_extractor.reset();
  348. ASSERT_EQ(
  349. "Invalid argument: Prefix extractor is missing when opening a PlainTable "
  350. "built using a prefix extractor",
  351. TryReopen(&options).ToString());
  352. // Bad attempt to re-open with different prefix extractor
  353. options.prefix_extractor.reset(NewFixedPrefixTransform(6));
  354. ASSERT_EQ(
  355. "Invalid argument: Prefix extractor given doesn't match the one used to "
  356. "build PlainTable",
  357. TryReopen(&options).ToString());
  358. // Correct prefix extractor
  359. options.prefix_extractor.reset(NewFixedPrefixTransform(8));
  360. Reopen(&options);
  361. ASSERT_EQ("v1", Get("1000000000000foo"));
  362. }
  363. TEST_P(PlainTableDBTest, BadOptions2) {
  364. Options options = CurrentOptions();
  365. options.prefix_extractor.reset();
  366. options.create_if_missing = true;
  367. DestroyAndReopen(&options);
  368. // Build without a prefix extractor
  369. // (apparently works even if hash_table_ratio > 0)
  370. ASSERT_OK(Put("1000000000000foo", "v1"));
  371. dbfull()->TEST_FlushMemTable();
  372. // Bad attempt to re-open with hash_table_ratio > 0 and no prefix extractor
  373. Status s = TryReopen(&options);
  374. ASSERT_EQ(
  375. "Not implemented: PlainTable requires a prefix extractor enable prefix "
  376. "hash mode.",
  377. s.ToString());
  378. // OK to open with hash_table_ratio == 0 and no prefix extractor
  379. PlainTableOptions plain_table_options;
  380. plain_table_options.hash_table_ratio = 0;
  381. options.table_factory.reset(NewPlainTableFactory(plain_table_options));
  382. Reopen(&options);
  383. ASSERT_EQ("v1", Get("1000000000000foo"));
  384. // OK to open newly with a prefix_extractor and hash table; builds index
  385. // in memory.
  386. options = CurrentOptions();
  387. Reopen(&options);
  388. ASSERT_EQ("v1", Get("1000000000000foo"));
  389. }
  390. TEST_P(PlainTableDBTest, Flush) {
  391. for (size_t huge_page_tlb_size = 0; huge_page_tlb_size <= 2 * 1024 * 1024;
  392. huge_page_tlb_size += 2 * 1024 * 1024) {
  393. for (EncodingType encoding_type : {kPlain, kPrefix}) {
  394. for (int bloom = -1; bloom <= 117; bloom += 117) {
  395. const int bloom_bits = std::max(bloom, 0);
  396. const bool full_scan_mode = bloom < 0;
  397. for (int total_order = 0; total_order <= 1; total_order++) {
  398. for (int store_index_in_file = 0; store_index_in_file <= 1;
  399. ++store_index_in_file) {
  400. Options options = CurrentOptions();
  401. options.create_if_missing = true;
  402. // Set only one bucket to force bucket conflict.
  403. // Test index interval for the same prefix to be 1, 2 and 4
  404. if (total_order) {
  405. options.prefix_extractor.reset();
  406. PlainTableOptions plain_table_options;
  407. plain_table_options.user_key_len = 0;
  408. plain_table_options.bloom_bits_per_key = bloom_bits;
  409. plain_table_options.hash_table_ratio = 0;
  410. plain_table_options.index_sparseness = 2;
  411. plain_table_options.huge_page_tlb_size = huge_page_tlb_size;
  412. plain_table_options.encoding_type = encoding_type;
  413. plain_table_options.full_scan_mode = full_scan_mode;
  414. plain_table_options.store_index_in_file = store_index_in_file;
  415. options.table_factory.reset(
  416. NewPlainTableFactory(plain_table_options));
  417. } else {
  418. PlainTableOptions plain_table_options;
  419. plain_table_options.user_key_len = 0;
  420. plain_table_options.bloom_bits_per_key = bloom_bits;
  421. plain_table_options.hash_table_ratio = 0.75;
  422. plain_table_options.index_sparseness = 16;
  423. plain_table_options.huge_page_tlb_size = huge_page_tlb_size;
  424. plain_table_options.encoding_type = encoding_type;
  425. plain_table_options.full_scan_mode = full_scan_mode;
  426. plain_table_options.store_index_in_file = store_index_in_file;
  427. options.table_factory.reset(
  428. NewPlainTableFactory(plain_table_options));
  429. }
  430. DestroyAndReopen(&options);
  431. uint64_t int_num;
  432. ASSERT_TRUE(dbfull()->GetIntProperty(
  433. "rocksdb.estimate-table-readers-mem", &int_num));
  434. ASSERT_EQ(int_num, 0U);
  435. ASSERT_OK(Put("1000000000000foo", "v1"));
  436. ASSERT_OK(Put("0000000000000bar", "v2"));
  437. ASSERT_OK(Put("1000000000000foo", "v3"));
  438. dbfull()->TEST_FlushMemTable();
  439. ASSERT_TRUE(dbfull()->GetIntProperty(
  440. "rocksdb.estimate-table-readers-mem", &int_num));
  441. ASSERT_GT(int_num, 0U);
  442. TablePropertiesCollection ptc;
  443. reinterpret_cast<DB*>(dbfull())->GetPropertiesOfAllTables(&ptc);
  444. ASSERT_EQ(1U, ptc.size());
  445. auto row = ptc.begin();
  446. auto tp = row->second;
  447. if (full_scan_mode) {
  448. // Does not support Get/Seek
  449. std::unique_ptr<Iterator> iter(dbfull()->NewIterator(ReadOptions()));
  450. iter->SeekToFirst();
  451. ASSERT_TRUE(iter->Valid());
  452. ASSERT_EQ("0000000000000bar", iter->key().ToString());
  453. ASSERT_EQ("v2", iter->value().ToString());
  454. iter->Next();
  455. ASSERT_TRUE(iter->Valid());
  456. ASSERT_EQ("1000000000000foo", iter->key().ToString());
  457. ASSERT_EQ("v3", iter->value().ToString());
  458. iter->Next();
  459. ASSERT_TRUE(!iter->Valid());
  460. ASSERT_TRUE(iter->status().ok());
  461. } else {
  462. if (!store_index_in_file) {
  463. ASSERT_EQ(total_order ? "4" : "12",
  464. (tp->user_collected_properties)
  465. .at("plain_table_hash_table_size"));
  466. ASSERT_EQ("0", (tp->user_collected_properties)
  467. .at("plain_table_sub_index_size"));
  468. } else {
  469. ASSERT_EQ("0", (tp->user_collected_properties)
  470. .at("plain_table_hash_table_size"));
  471. ASSERT_EQ("0", (tp->user_collected_properties)
  472. .at("plain_table_sub_index_size"));
  473. }
  474. ASSERT_EQ("v3", Get("1000000000000foo"));
  475. ASSERT_EQ("v2", Get("0000000000000bar"));
  476. }
  477. }
  478. }
  479. }
  480. }
  481. }
  482. }
  483. TEST_P(PlainTableDBTest, Flush2) {
  484. for (size_t huge_page_tlb_size = 0; huge_page_tlb_size <= 2 * 1024 * 1024;
  485. huge_page_tlb_size += 2 * 1024 * 1024) {
  486. for (EncodingType encoding_type : {kPlain, kPrefix}) {
  487. for (int bloom_bits = 0; bloom_bits <= 117; bloom_bits += 117) {
  488. for (int total_order = 0; total_order <= 1; total_order++) {
  489. for (int store_index_in_file = 0; store_index_in_file <= 1;
  490. ++store_index_in_file) {
  491. if (encoding_type == kPrefix && total_order) {
  492. continue;
  493. }
  494. if (!bloom_bits && store_index_in_file) {
  495. continue;
  496. }
  497. if (total_order && store_index_in_file) {
  498. continue;
  499. }
  500. bool expect_bloom_not_match = false;
  501. Options options = CurrentOptions();
  502. options.create_if_missing = true;
  503. // Set only one bucket to force bucket conflict.
  504. // Test index interval for the same prefix to be 1, 2 and 4
  505. PlainTableOptions plain_table_options;
  506. if (total_order) {
  507. options.prefix_extractor = nullptr;
  508. plain_table_options.hash_table_ratio = 0;
  509. plain_table_options.index_sparseness = 2;
  510. } else {
  511. plain_table_options.hash_table_ratio = 0.75;
  512. plain_table_options.index_sparseness = 16;
  513. }
  514. plain_table_options.user_key_len = kPlainTableVariableLength;
  515. plain_table_options.bloom_bits_per_key = bloom_bits;
  516. plain_table_options.huge_page_tlb_size = huge_page_tlb_size;
  517. plain_table_options.encoding_type = encoding_type;
  518. plain_table_options.store_index_in_file = store_index_in_file;
  519. options.table_factory.reset(new TestPlainTableFactory(
  520. &expect_bloom_not_match, plain_table_options,
  521. 0 /* column_family_id */, kDefaultColumnFamilyName));
  522. DestroyAndReopen(&options);
  523. ASSERT_OK(Put("0000000000000bar", "b"));
  524. ASSERT_OK(Put("1000000000000foo", "v1"));
  525. dbfull()->TEST_FlushMemTable();
  526. ASSERT_OK(Put("1000000000000foo", "v2"));
  527. dbfull()->TEST_FlushMemTable();
  528. ASSERT_EQ("v2", Get("1000000000000foo"));
  529. ASSERT_OK(Put("0000000000000eee", "v3"));
  530. dbfull()->TEST_FlushMemTable();
  531. ASSERT_EQ("v3", Get("0000000000000eee"));
  532. ASSERT_OK(Delete("0000000000000bar"));
  533. dbfull()->TEST_FlushMemTable();
  534. ASSERT_EQ("NOT_FOUND", Get("0000000000000bar"));
  535. ASSERT_OK(Put("0000000000000eee", "v5"));
  536. ASSERT_OK(Put("9000000000000eee", "v5"));
  537. dbfull()->TEST_FlushMemTable();
  538. ASSERT_EQ("v5", Get("0000000000000eee"));
  539. // Test Bloom Filter
  540. if (bloom_bits > 0) {
  541. // Neither key nor value should exist.
  542. expect_bloom_not_match = true;
  543. ASSERT_EQ("NOT_FOUND", Get("5_not00000000bar"));
  544. // Key doesn't exist any more but prefix exists.
  545. if (total_order) {
  546. ASSERT_EQ("NOT_FOUND", Get("1000000000000not"));
  547. ASSERT_EQ("NOT_FOUND", Get("0000000000000not"));
  548. }
  549. expect_bloom_not_match = false;
  550. }
  551. }
  552. }
  553. }
  554. }
  555. }
  556. }
  557. TEST_P(PlainTableDBTest, Immortal) {
  558. for (EncodingType encoding_type : {kPlain, kPrefix}) {
  559. Options options = CurrentOptions();
  560. options.create_if_missing = true;
  561. options.max_open_files = -1;
  562. // Set only one bucket to force bucket conflict.
  563. // Test index interval for the same prefix to be 1, 2 and 4
  564. PlainTableOptions plain_table_options;
  565. plain_table_options.hash_table_ratio = 0.75;
  566. plain_table_options.index_sparseness = 16;
  567. plain_table_options.user_key_len = kPlainTableVariableLength;
  568. plain_table_options.bloom_bits_per_key = 10;
  569. plain_table_options.encoding_type = encoding_type;
  570. options.table_factory.reset(NewPlainTableFactory(plain_table_options));
  571. DestroyAndReopen(&options);
  572. ASSERT_OK(Put("0000000000000bar", "b"));
  573. ASSERT_OK(Put("1000000000000foo", "v1"));
  574. dbfull()->TEST_FlushMemTable();
  575. int copied = 0;
  576. ROCKSDB_NAMESPACE::SyncPoint::GetInstance()->SetCallBack(
  577. "GetContext::SaveValue::PinSelf", [&](void* /*arg*/) { copied++; });
  578. ROCKSDB_NAMESPACE::SyncPoint::GetInstance()->EnableProcessing();
  579. ASSERT_EQ("b", Get("0000000000000bar"));
  580. ASSERT_EQ("v1", Get("1000000000000foo"));
  581. ASSERT_EQ(2, copied);
  582. copied = 0;
  583. Close();
  584. ASSERT_OK(ReopenForReadOnly(&options));
  585. ASSERT_EQ("b", Get("0000000000000bar"));
  586. ASSERT_EQ("v1", Get("1000000000000foo"));
  587. ASSERT_EQ("NOT_FOUND", Get("1000000000000bar"));
  588. if (mmap_mode()) {
  589. ASSERT_EQ(0, copied);
  590. } else {
  591. ASSERT_EQ(2, copied);
  592. }
  593. ROCKSDB_NAMESPACE::SyncPoint::GetInstance()->DisableProcessing();
  594. }
  595. }
  596. TEST_P(PlainTableDBTest, Iterator) {
  597. for (size_t huge_page_tlb_size = 0; huge_page_tlb_size <= 2 * 1024 * 1024;
  598. huge_page_tlb_size += 2 * 1024 * 1024) {
  599. for (EncodingType encoding_type : {kPlain, kPrefix}) {
  600. for (int bloom_bits = 0; bloom_bits <= 117; bloom_bits += 117) {
  601. for (int total_order = 0; total_order <= 1; total_order++) {
  602. if (encoding_type == kPrefix && total_order == 1) {
  603. continue;
  604. }
  605. bool expect_bloom_not_match = false;
  606. Options options = CurrentOptions();
  607. options.create_if_missing = true;
  608. // Set only one bucket to force bucket conflict.
  609. // Test index interval for the same prefix to be 1, 2 and 4
  610. if (total_order) {
  611. options.prefix_extractor = nullptr;
  612. PlainTableOptions plain_table_options;
  613. plain_table_options.user_key_len = 16;
  614. plain_table_options.bloom_bits_per_key = bloom_bits;
  615. plain_table_options.hash_table_ratio = 0;
  616. plain_table_options.index_sparseness = 2;
  617. plain_table_options.huge_page_tlb_size = huge_page_tlb_size;
  618. plain_table_options.encoding_type = encoding_type;
  619. options.table_factory.reset(new TestPlainTableFactory(
  620. &expect_bloom_not_match, plain_table_options,
  621. 0 /* column_family_id */, kDefaultColumnFamilyName));
  622. } else {
  623. PlainTableOptions plain_table_options;
  624. plain_table_options.user_key_len = 16;
  625. plain_table_options.bloom_bits_per_key = bloom_bits;
  626. plain_table_options.hash_table_ratio = 0.75;
  627. plain_table_options.index_sparseness = 16;
  628. plain_table_options.huge_page_tlb_size = huge_page_tlb_size;
  629. plain_table_options.encoding_type = encoding_type;
  630. options.table_factory.reset(new TestPlainTableFactory(
  631. &expect_bloom_not_match, plain_table_options,
  632. 0 /* column_family_id */, kDefaultColumnFamilyName));
  633. }
  634. DestroyAndReopen(&options);
  635. ASSERT_OK(Put("1000000000foo002", "v_2"));
  636. ASSERT_OK(Put("0000000000000bar", "random"));
  637. ASSERT_OK(Put("1000000000foo001", "v1"));
  638. ASSERT_OK(Put("3000000000000bar", "bar_v"));
  639. ASSERT_OK(Put("1000000000foo003", "v__3"));
  640. ASSERT_OK(Put("1000000000foo004", "v__4"));
  641. ASSERT_OK(Put("1000000000foo005", "v__5"));
  642. ASSERT_OK(Put("1000000000foo007", "v__7"));
  643. ASSERT_OK(Put("1000000000foo008", "v__8"));
  644. dbfull()->TEST_FlushMemTable();
  645. ASSERT_EQ("v1", Get("1000000000foo001"));
  646. ASSERT_EQ("v__3", Get("1000000000foo003"));
  647. Iterator* iter = dbfull()->NewIterator(ReadOptions());
  648. iter->Seek("1000000000foo000");
  649. ASSERT_TRUE(iter->Valid());
  650. ASSERT_EQ("1000000000foo001", iter->key().ToString());
  651. ASSERT_EQ("v1", iter->value().ToString());
  652. iter->Next();
  653. ASSERT_TRUE(iter->Valid());
  654. ASSERT_EQ("1000000000foo002", iter->key().ToString());
  655. ASSERT_EQ("v_2", iter->value().ToString());
  656. iter->Next();
  657. ASSERT_TRUE(iter->Valid());
  658. ASSERT_EQ("1000000000foo003", iter->key().ToString());
  659. ASSERT_EQ("v__3", iter->value().ToString());
  660. iter->Next();
  661. ASSERT_TRUE(iter->Valid());
  662. ASSERT_EQ("1000000000foo004", iter->key().ToString());
  663. ASSERT_EQ("v__4", iter->value().ToString());
  664. iter->Seek("3000000000000bar");
  665. ASSERT_TRUE(iter->Valid());
  666. ASSERT_EQ("3000000000000bar", iter->key().ToString());
  667. ASSERT_EQ("bar_v", iter->value().ToString());
  668. iter->Seek("1000000000foo000");
  669. ASSERT_TRUE(iter->Valid());
  670. ASSERT_EQ("1000000000foo001", iter->key().ToString());
  671. ASSERT_EQ("v1", iter->value().ToString());
  672. iter->Seek("1000000000foo005");
  673. ASSERT_TRUE(iter->Valid());
  674. ASSERT_EQ("1000000000foo005", iter->key().ToString());
  675. ASSERT_EQ("v__5", iter->value().ToString());
  676. iter->Seek("1000000000foo006");
  677. ASSERT_TRUE(iter->Valid());
  678. ASSERT_EQ("1000000000foo007", iter->key().ToString());
  679. ASSERT_EQ("v__7", iter->value().ToString());
  680. iter->Seek("1000000000foo008");
  681. ASSERT_TRUE(iter->Valid());
  682. ASSERT_EQ("1000000000foo008", iter->key().ToString());
  683. ASSERT_EQ("v__8", iter->value().ToString());
  684. if (total_order == 0) {
  685. iter->Seek("1000000000foo009");
  686. ASSERT_TRUE(iter->Valid());
  687. ASSERT_EQ("3000000000000bar", iter->key().ToString());
  688. }
  689. // Test Bloom Filter
  690. if (bloom_bits > 0) {
  691. if (!total_order) {
  692. // Neither key nor value should exist.
  693. expect_bloom_not_match = true;
  694. iter->Seek("2not000000000bar");
  695. ASSERT_TRUE(!iter->Valid());
  696. ASSERT_EQ("NOT_FOUND", Get("2not000000000bar"));
  697. expect_bloom_not_match = false;
  698. } else {
  699. expect_bloom_not_match = true;
  700. ASSERT_EQ("NOT_FOUND", Get("2not000000000bar"));
  701. expect_bloom_not_match = false;
  702. }
  703. }
  704. delete iter;
  705. }
  706. }
  707. }
  708. }
  709. }
  namespace {
  // Builds a 16-byte key for index `n`. Bytes 0..3 hold the four low-order
  // decimal digits of `n`, least significant first, stored as raw values 0-9
  // (not as ASCII digit characters). The remaining 12 bytes are `filler`.
  std::string NthKey(size_t n, char filler) {
    std::string key(16, filler);
    size_t remaining = n;
    for (size_t pos = 0; pos < 4; ++pos) {
      key[pos] = static_cast<char>(remaining % 10);
      remaining /= 10;
    }
    return key;
  }
  }  // anonymous namespace
  720. TEST_P(PlainTableDBTest, BloomSchema) {
  721. Options options = CurrentOptions();
  722. options.create_if_missing = true;
  723. for (int bloom_locality = 0; bloom_locality <= 1; bloom_locality++) {
  724. options.bloom_locality = bloom_locality;
  725. PlainTableOptions plain_table_options;
  726. plain_table_options.user_key_len = 16;
  727. plain_table_options.bloom_bits_per_key = 3; // high FP rate for test
  728. plain_table_options.hash_table_ratio = 0.75;
  729. plain_table_options.index_sparseness = 16;
  730. plain_table_options.huge_page_tlb_size = 0;
  731. plain_table_options.encoding_type = kPlain;
  732. bool expect_bloom_not_match = false;
  733. options.table_factory.reset(new TestPlainTableFactory(
  734. &expect_bloom_not_match, plain_table_options, 0 /* column_family_id */,
  735. kDefaultColumnFamilyName));
  736. DestroyAndReopen(&options);
  737. for (unsigned i = 0; i < 2345; ++i) {
  738. ASSERT_OK(Put(NthKey(i, 'y'), "added"));
  739. }
  740. dbfull()->TEST_FlushMemTable();
  741. ASSERT_EQ("added", Get(NthKey(42, 'y')));
  742. for (unsigned i = 0; i < 32; ++i) {
  743. // Known pattern of Bloom filter false positives can detect schema change
  744. // with high probability. Known FPs stuffed into bits:
  745. uint32_t pattern;
  746. if (!bloom_locality) {
  747. pattern = 1785868347UL;
  748. } else if (CACHE_LINE_SIZE == 64U) {
  749. pattern = 2421694657UL;
  750. } else if (CACHE_LINE_SIZE == 128U) {
  751. pattern = 788710956UL;
  752. } else {
  753. ASSERT_EQ(CACHE_LINE_SIZE, 256U);
  754. pattern = 163905UL;
  755. }
  756. bool expect_fp = pattern & (1UL << i);
  757. // fprintf(stderr, "expect_fp@%u: %d\n", i, (int)expect_fp);
  758. expect_bloom_not_match = !expect_fp;
  759. ASSERT_EQ("NOT_FOUND", Get(NthKey(i, 'n')));
  760. }
  761. }
  762. }
  namespace {
  // Returns a key made of `length` copies of the character `c`.
  std::string MakeLongKey(size_t length, char c) {
    std::string key;
    key.assign(length, c);
    return key;
  }
  }  // namespace
  768. TEST_P(PlainTableDBTest, IteratorLargeKeys) {
  769. Options options = CurrentOptions();
  770. PlainTableOptions plain_table_options;
  771. plain_table_options.user_key_len = 0;
  772. plain_table_options.bloom_bits_per_key = 0;
  773. plain_table_options.hash_table_ratio = 0;
  774. options.table_factory.reset(NewPlainTableFactory(plain_table_options));
  775. options.create_if_missing = true;
  776. options.prefix_extractor.reset();
  777. DestroyAndReopen(&options);
  778. std::string key_list[] = {
  779. MakeLongKey(30, '0'),
  780. MakeLongKey(16, '1'),
  781. MakeLongKey(32, '2'),
  782. MakeLongKey(60, '3'),
  783. MakeLongKey(90, '4'),
  784. MakeLongKey(50, '5'),
  785. MakeLongKey(26, '6')
  786. };
  787. for (size_t i = 0; i < 7; i++) {
  788. ASSERT_OK(Put(key_list[i], ToString(i)));
  789. }
  790. dbfull()->TEST_FlushMemTable();
  791. Iterator* iter = dbfull()->NewIterator(ReadOptions());
  792. iter->Seek(key_list[0]);
  793. for (size_t i = 0; i < 7; i++) {
  794. ASSERT_TRUE(iter->Valid());
  795. ASSERT_EQ(key_list[i], iter->key().ToString());
  796. ASSERT_EQ(ToString(i), iter->value().ToString());
  797. iter->Next();
  798. }
  799. ASSERT_TRUE(!iter->Valid());
  800. delete iter;
  801. }
  namespace {
  // Returns a key of total size `length`: the fixed 8-character prefix
  // "00000000" followed by `length - 8` copies of `c`. Callers in this file
  // always pass a length of at least 16.
  std::string MakeLongKeyWithPrefix(size_t length, char c) {
    std::string key("00000000");
    key.append(length - 8, c);
    return key;
  }
  }  // namespace
  807. TEST_P(PlainTableDBTest, IteratorLargeKeysWithPrefix) {
  808. Options options = CurrentOptions();
  809. PlainTableOptions plain_table_options;
  810. plain_table_options.user_key_len = 16;
  811. plain_table_options.bloom_bits_per_key = 0;
  812. plain_table_options.hash_table_ratio = 0.8;
  813. plain_table_options.index_sparseness = 3;
  814. plain_table_options.huge_page_tlb_size = 0;
  815. plain_table_options.encoding_type = kPrefix;
  816. options.table_factory.reset(NewPlainTableFactory(plain_table_options));
  817. options.create_if_missing = true;
  818. DestroyAndReopen(&options);
  819. std::string key_list[] = {
  820. MakeLongKeyWithPrefix(30, '0'), MakeLongKeyWithPrefix(16, '1'),
  821. MakeLongKeyWithPrefix(32, '2'), MakeLongKeyWithPrefix(60, '3'),
  822. MakeLongKeyWithPrefix(90, '4'), MakeLongKeyWithPrefix(50, '5'),
  823. MakeLongKeyWithPrefix(26, '6')};
  824. for (size_t i = 0; i < 7; i++) {
  825. ASSERT_OK(Put(key_list[i], ToString(i)));
  826. }
  827. dbfull()->TEST_FlushMemTable();
  828. Iterator* iter = dbfull()->NewIterator(ReadOptions());
  829. iter->Seek(key_list[0]);
  830. for (size_t i = 0; i < 7; i++) {
  831. ASSERT_TRUE(iter->Valid());
  832. ASSERT_EQ(key_list[i], iter->key().ToString());
  833. ASSERT_EQ(ToString(i), iter->value().ToString());
  834. iter->Next();
  835. }
  836. ASSERT_TRUE(!iter->Valid());
  837. delete iter;
  838. }
  839. TEST_P(PlainTableDBTest, IteratorReverseSuffixComparator) {
  840. Options options = CurrentOptions();
  841. options.create_if_missing = true;
  842. // Set only one bucket to force bucket conflict.
  843. // Test index interval for the same prefix to be 1, 2 and 4
  844. test::SimpleSuffixReverseComparator comp;
  845. options.comparator = &comp;
  846. DestroyAndReopen(&options);
  847. ASSERT_OK(Put("1000000000foo002", "v_2"));
  848. ASSERT_OK(Put("0000000000000bar", "random"));
  849. ASSERT_OK(Put("1000000000foo001", "v1"));
  850. ASSERT_OK(Put("3000000000000bar", "bar_v"));
  851. ASSERT_OK(Put("1000000000foo003", "v__3"));
  852. ASSERT_OK(Put("1000000000foo004", "v__4"));
  853. ASSERT_OK(Put("1000000000foo005", "v__5"));
  854. ASSERT_OK(Put("1000000000foo007", "v__7"));
  855. ASSERT_OK(Put("1000000000foo008", "v__8"));
  856. dbfull()->TEST_FlushMemTable();
  857. ASSERT_EQ("v1", Get("1000000000foo001"));
  858. ASSERT_EQ("v__3", Get("1000000000foo003"));
  859. Iterator* iter = dbfull()->NewIterator(ReadOptions());
  860. iter->Seek("1000000000foo009");
  861. ASSERT_TRUE(iter->Valid());
  862. ASSERT_EQ("1000000000foo008", iter->key().ToString());
  863. ASSERT_EQ("v__8", iter->value().ToString());
  864. iter->Next();
  865. ASSERT_TRUE(iter->Valid());
  866. ASSERT_EQ("1000000000foo007", iter->key().ToString());
  867. ASSERT_EQ("v__7", iter->value().ToString());
  868. iter->Next();
  869. ASSERT_TRUE(iter->Valid());
  870. ASSERT_EQ("1000000000foo005", iter->key().ToString());
  871. ASSERT_EQ("v__5", iter->value().ToString());
  872. iter->Next();
  873. ASSERT_TRUE(iter->Valid());
  874. ASSERT_EQ("1000000000foo004", iter->key().ToString());
  875. ASSERT_EQ("v__4", iter->value().ToString());
  876. iter->Seek("3000000000000bar");
  877. ASSERT_TRUE(iter->Valid());
  878. ASSERT_EQ("3000000000000bar", iter->key().ToString());
  879. ASSERT_EQ("bar_v", iter->value().ToString());
  880. iter->Seek("1000000000foo005");
  881. ASSERT_TRUE(iter->Valid());
  882. ASSERT_EQ("1000000000foo005", iter->key().ToString());
  883. ASSERT_EQ("v__5", iter->value().ToString());
  884. iter->Seek("1000000000foo006");
  885. ASSERT_TRUE(iter->Valid());
  886. ASSERT_EQ("1000000000foo005", iter->key().ToString());
  887. ASSERT_EQ("v__5", iter->value().ToString());
  888. iter->Seek("1000000000foo008");
  889. ASSERT_TRUE(iter->Valid());
  890. ASSERT_EQ("1000000000foo008", iter->key().ToString());
  891. ASSERT_EQ("v__8", iter->value().ToString());
  892. iter->Seek("1000000000foo000");
  893. ASSERT_TRUE(iter->Valid());
  894. ASSERT_EQ("3000000000000bar", iter->key().ToString());
  895. delete iter;
  896. }
  897. TEST_P(PlainTableDBTest, HashBucketConflict) {
  898. for (size_t huge_page_tlb_size = 0; huge_page_tlb_size <= 2 * 1024 * 1024;
  899. huge_page_tlb_size += 2 * 1024 * 1024) {
  900. for (unsigned char i = 1; i <= 3; i++) {
  901. Options options = CurrentOptions();
  902. options.create_if_missing = true;
  903. // Set only one bucket to force bucket conflict.
  904. // Test index interval for the same prefix to be 1, 2 and 4
  905. PlainTableOptions plain_table_options;
  906. plain_table_options.user_key_len = 16;
  907. plain_table_options.bloom_bits_per_key = 0;
  908. plain_table_options.hash_table_ratio = 0;
  909. plain_table_options.index_sparseness = 2 ^ i;
  910. plain_table_options.huge_page_tlb_size = huge_page_tlb_size;
  911. options.table_factory.reset(NewPlainTableFactory(plain_table_options));
  912. DestroyAndReopen(&options);
  913. ASSERT_OK(Put("5000000000000fo0", "v1"));
  914. ASSERT_OK(Put("5000000000000fo1", "v2"));
  915. ASSERT_OK(Put("5000000000000fo2", "v"));
  916. ASSERT_OK(Put("2000000000000fo0", "v3"));
  917. ASSERT_OK(Put("2000000000000fo1", "v4"));
  918. ASSERT_OK(Put("2000000000000fo2", "v"));
  919. ASSERT_OK(Put("2000000000000fo3", "v"));
  920. dbfull()->TEST_FlushMemTable();
  921. ASSERT_EQ("v1", Get("5000000000000fo0"));
  922. ASSERT_EQ("v2", Get("5000000000000fo1"));
  923. ASSERT_EQ("v3", Get("2000000000000fo0"));
  924. ASSERT_EQ("v4", Get("2000000000000fo1"));
  925. ASSERT_EQ("NOT_FOUND", Get("5000000000000bar"));
  926. ASSERT_EQ("NOT_FOUND", Get("2000000000000bar"));
  927. ASSERT_EQ("NOT_FOUND", Get("5000000000000fo8"));
  928. ASSERT_EQ("NOT_FOUND", Get("2000000000000fo8"));
  929. ReadOptions ro;
  930. Iterator* iter = dbfull()->NewIterator(ro);
  931. iter->Seek("5000000000000fo0");
  932. ASSERT_TRUE(iter->Valid());
  933. ASSERT_EQ("5000000000000fo0", iter->key().ToString());
  934. iter->Next();
  935. ASSERT_TRUE(iter->Valid());
  936. ASSERT_EQ("5000000000000fo1", iter->key().ToString());
  937. iter->Seek("5000000000000fo1");
  938. ASSERT_TRUE(iter->Valid());
  939. ASSERT_EQ("5000000000000fo1", iter->key().ToString());
  940. iter->Seek("2000000000000fo0");
  941. ASSERT_TRUE(iter->Valid());
  942. ASSERT_EQ("2000000000000fo0", iter->key().ToString());
  943. iter->Next();
  944. ASSERT_TRUE(iter->Valid());
  945. ASSERT_EQ("2000000000000fo1", iter->key().ToString());
  946. iter->Seek("2000000000000fo1");
  947. ASSERT_TRUE(iter->Valid());
  948. ASSERT_EQ("2000000000000fo1", iter->key().ToString());
  949. iter->Seek("2000000000000bar");
  950. ASSERT_TRUE(iter->Valid());
  951. ASSERT_EQ("2000000000000fo0", iter->key().ToString());
  952. iter->Seek("5000000000000bar");
  953. ASSERT_TRUE(iter->Valid());
  954. ASSERT_EQ("5000000000000fo0", iter->key().ToString());
  955. iter->Seek("2000000000000fo8");
  956. ASSERT_TRUE(!iter->Valid() ||
  957. options.comparator->Compare(iter->key(), "20000001") > 0);
  958. iter->Seek("5000000000000fo8");
  959. ASSERT_TRUE(!iter->Valid());
  960. iter->Seek("1000000000000fo2");
  961. ASSERT_TRUE(!iter->Valid());
  962. iter->Seek("3000000000000fo2");
  963. ASSERT_TRUE(!iter->Valid());
  964. iter->Seek("8000000000000fo2");
  965. ASSERT_TRUE(!iter->Valid());
  966. delete iter;
  967. }
  968. }
  969. }
  970. TEST_P(PlainTableDBTest, HashBucketConflictReverseSuffixComparator) {
  971. for (size_t huge_page_tlb_size = 0; huge_page_tlb_size <= 2 * 1024 * 1024;
  972. huge_page_tlb_size += 2 * 1024 * 1024) {
  973. for (unsigned char i = 1; i <= 3; i++) {
  974. Options options = CurrentOptions();
  975. options.create_if_missing = true;
  976. test::SimpleSuffixReverseComparator comp;
  977. options.comparator = &comp;
  978. // Set only one bucket to force bucket conflict.
  979. // Test index interval for the same prefix to be 1, 2 and 4
  980. PlainTableOptions plain_table_options;
  981. plain_table_options.user_key_len = 16;
  982. plain_table_options.bloom_bits_per_key = 0;
  983. plain_table_options.hash_table_ratio = 0;
  984. plain_table_options.index_sparseness = 2 ^ i;
  985. plain_table_options.huge_page_tlb_size = huge_page_tlb_size;
  986. options.table_factory.reset(NewPlainTableFactory(plain_table_options));
  987. DestroyAndReopen(&options);
  988. ASSERT_OK(Put("5000000000000fo0", "v1"));
  989. ASSERT_OK(Put("5000000000000fo1", "v2"));
  990. ASSERT_OK(Put("5000000000000fo2", "v"));
  991. ASSERT_OK(Put("2000000000000fo0", "v3"));
  992. ASSERT_OK(Put("2000000000000fo1", "v4"));
  993. ASSERT_OK(Put("2000000000000fo2", "v"));
  994. ASSERT_OK(Put("2000000000000fo3", "v"));
  995. dbfull()->TEST_FlushMemTable();
  996. ASSERT_EQ("v1", Get("5000000000000fo0"));
  997. ASSERT_EQ("v2", Get("5000000000000fo1"));
  998. ASSERT_EQ("v3", Get("2000000000000fo0"));
  999. ASSERT_EQ("v4", Get("2000000000000fo1"));
  1000. ASSERT_EQ("NOT_FOUND", Get("5000000000000bar"));
  1001. ASSERT_EQ("NOT_FOUND", Get("2000000000000bar"));
  1002. ASSERT_EQ("NOT_FOUND", Get("5000000000000fo8"));
  1003. ASSERT_EQ("NOT_FOUND", Get("2000000000000fo8"));
  1004. ReadOptions ro;
  1005. Iterator* iter = dbfull()->NewIterator(ro);
  1006. iter->Seek("5000000000000fo1");
  1007. ASSERT_TRUE(iter->Valid());
  1008. ASSERT_EQ("5000000000000fo1", iter->key().ToString());
  1009. iter->Next();
  1010. ASSERT_TRUE(iter->Valid());
  1011. ASSERT_EQ("5000000000000fo0", iter->key().ToString());
  1012. iter->Seek("5000000000000fo1");
  1013. ASSERT_TRUE(iter->Valid());
  1014. ASSERT_EQ("5000000000000fo1", iter->key().ToString());
  1015. iter->Seek("2000000000000fo1");
  1016. ASSERT_TRUE(iter->Valid());
  1017. ASSERT_EQ("2000000000000fo1", iter->key().ToString());
  1018. iter->Next();
  1019. ASSERT_TRUE(iter->Valid());
  1020. ASSERT_EQ("2000000000000fo0", iter->key().ToString());
  1021. iter->Seek("2000000000000fo1");
  1022. ASSERT_TRUE(iter->Valid());
  1023. ASSERT_EQ("2000000000000fo1", iter->key().ToString());
  1024. iter->Seek("2000000000000var");
  1025. ASSERT_TRUE(iter->Valid());
  1026. ASSERT_EQ("2000000000000fo3", iter->key().ToString());
  1027. iter->Seek("5000000000000var");
  1028. ASSERT_TRUE(iter->Valid());
  1029. ASSERT_EQ("5000000000000fo2", iter->key().ToString());
  1030. std::string seek_key = "2000000000000bar";
  1031. iter->Seek(seek_key);
  1032. ASSERT_TRUE(!iter->Valid() ||
  1033. options.prefix_extractor->Transform(iter->key()) !=
  1034. options.prefix_extractor->Transform(seek_key));
  1035. iter->Seek("1000000000000fo2");
  1036. ASSERT_TRUE(!iter->Valid());
  1037. iter->Seek("3000000000000fo2");
  1038. ASSERT_TRUE(!iter->Valid());
  1039. iter->Seek("8000000000000fo2");
  1040. ASSERT_TRUE(!iter->Valid());
  1041. delete iter;
  1042. }
  1043. }
  1044. }
  1045. TEST_P(PlainTableDBTest, NonExistingKeyToNonEmptyBucket) {
  1046. Options options = CurrentOptions();
  1047. options.create_if_missing = true;
  1048. // Set only one bucket to force bucket conflict.
  1049. // Test index interval for the same prefix to be 1, 2 and 4
  1050. PlainTableOptions plain_table_options;
  1051. plain_table_options.user_key_len = 16;
  1052. plain_table_options.bloom_bits_per_key = 0;
  1053. plain_table_options.hash_table_ratio = 0;
  1054. plain_table_options.index_sparseness = 5;
  1055. options.table_factory.reset(NewPlainTableFactory(plain_table_options));
  1056. DestroyAndReopen(&options);
  1057. ASSERT_OK(Put("5000000000000fo0", "v1"));
  1058. ASSERT_OK(Put("5000000000000fo1", "v2"));
  1059. ASSERT_OK(Put("5000000000000fo2", "v3"));
  1060. dbfull()->TEST_FlushMemTable();
  1061. ASSERT_EQ("v1", Get("5000000000000fo0"));
  1062. ASSERT_EQ("v2", Get("5000000000000fo1"));
  1063. ASSERT_EQ("v3", Get("5000000000000fo2"));
  1064. ASSERT_EQ("NOT_FOUND", Get("8000000000000bar"));
  1065. ASSERT_EQ("NOT_FOUND", Get("1000000000000bar"));
  1066. Iterator* iter = dbfull()->NewIterator(ReadOptions());
  1067. iter->Seek("5000000000000bar");
  1068. ASSERT_TRUE(iter->Valid());
  1069. ASSERT_EQ("5000000000000fo0", iter->key().ToString());
  1070. iter->Seek("5000000000000fo8");
  1071. ASSERT_TRUE(!iter->Valid());
  1072. iter->Seek("1000000000000fo2");
  1073. ASSERT_TRUE(!iter->Valid());
  1074. iter->Seek("8000000000000fo2");
  1075. ASSERT_TRUE(!iter->Valid());
  1076. delete iter;
  1077. }
  // Formats `i` as a test key: the literal "key_______" followed by `i`
  // zero-padded to a minimum width of six characters.
  static std::string Key(int i) {
    char formatted[100];
    snprintf(formatted, sizeof(formatted), "key_______%06d", i);
    std::string key(formatted);
    return key;
  }
  1083. static std::string RandomString(Random* rnd, int len) {
  1084. std::string r;
  1085. test::RandomString(rnd, len, &r);
  1086. return r;
  1087. }
  1088. TEST_P(PlainTableDBTest, CompactionTrigger) {
  1089. Options options = CurrentOptions();
  1090. options.write_buffer_size = 120 << 10; // 100KB
  1091. options.num_levels = 3;
  1092. options.level0_file_num_compaction_trigger = 3;
  1093. Reopen(&options);
  1094. Random rnd(301);
  1095. for (int num = 0; num < options.level0_file_num_compaction_trigger - 1;
  1096. num++) {
  1097. std::vector<std::string> values;
  1098. // Write 120KB (10 values, each 12K)
  1099. for (int i = 0; i < 10; i++) {
  1100. values.push_back(RandomString(&rnd, 12000));
  1101. ASSERT_OK(Put(Key(i), values[i]));
  1102. }
  1103. ASSERT_OK(Put(Key(999), ""));
  1104. dbfull()->TEST_WaitForFlushMemTable();
  1105. ASSERT_EQ(NumTableFilesAtLevel(0), num + 1);
  1106. }
  1107. //generate one more file in level-0, and should trigger level-0 compaction
  1108. std::vector<std::string> values;
  1109. for (int i = 0; i < 12; i++) {
  1110. values.push_back(RandomString(&rnd, 10000));
  1111. ASSERT_OK(Put(Key(i), values[i]));
  1112. }
  1113. ASSERT_OK(Put(Key(999), ""));
  1114. dbfull()->TEST_WaitForCompact();
  1115. ASSERT_EQ(NumTableFilesAtLevel(0), 0);
  1116. ASSERT_EQ(NumTableFilesAtLevel(1), 1);
  1117. }
  1118. TEST_P(PlainTableDBTest, AdaptiveTable) {
  1119. Options options = CurrentOptions();
  1120. options.create_if_missing = true;
  1121. options.table_factory.reset(NewPlainTableFactory());
  1122. DestroyAndReopen(&options);
  1123. ASSERT_OK(Put("1000000000000foo", "v1"));
  1124. ASSERT_OK(Put("0000000000000bar", "v2"));
  1125. ASSERT_OK(Put("1000000000000foo", "v3"));
  1126. dbfull()->TEST_FlushMemTable();
  1127. options.create_if_missing = false;
  1128. std::shared_ptr<TableFactory> block_based_factory(
  1129. NewBlockBasedTableFactory());
  1130. std::shared_ptr<TableFactory> plain_table_factory(
  1131. NewPlainTableFactory());
  1132. std::shared_ptr<TableFactory> dummy_factory;
  1133. options.table_factory.reset(NewAdaptiveTableFactory(
  1134. block_based_factory, block_based_factory, plain_table_factory));
  1135. Reopen(&options);
  1136. ASSERT_EQ("v3", Get("1000000000000foo"));
  1137. ASSERT_EQ("v2", Get("0000000000000bar"));
  1138. ASSERT_OK(Put("2000000000000foo", "v4"));
  1139. ASSERT_OK(Put("3000000000000bar", "v5"));
  1140. dbfull()->TEST_FlushMemTable();
  1141. ASSERT_EQ("v4", Get("2000000000000foo"));
  1142. ASSERT_EQ("v5", Get("3000000000000bar"));
  1143. Reopen(&options);
  1144. ASSERT_EQ("v3", Get("1000000000000foo"));
  1145. ASSERT_EQ("v2", Get("0000000000000bar"));
  1146. ASSERT_EQ("v4", Get("2000000000000foo"));
  1147. ASSERT_EQ("v5", Get("3000000000000bar"));
  1148. options.paranoid_checks = false;
  1149. options.table_factory.reset(NewBlockBasedTableFactory());
  1150. Reopen(&options);
  1151. ASSERT_NE("v3", Get("1000000000000foo"));
  1152. options.paranoid_checks = false;
  1153. options.table_factory.reset(NewPlainTableFactory());
  1154. Reopen(&options);
  1155. ASSERT_NE("v5", Get("3000000000000bar"));
  1156. }
  1157. INSTANTIATE_TEST_CASE_P(PlainTableDBTest, PlainTableDBTest, ::testing::Bool());
  1158. } // namespace ROCKSDB_NAMESPACE
  1159. int main(int argc, char** argv) {
  1160. ::testing::InitGoogleTest(&argc, argv);
  1161. return RUN_ALL_TESTS();
  1162. }
  1163. #else
  1164. #include <stdio.h>
  // Stub entry point for the #else branch of the ROCKSDB_LITE guard: reports on
  // stderr that the tests were skipped and exits successfully.
  int main(int /*argc*/, char** /*argv*/) {
    fputs("SKIPPED as plain table is not supported in ROCKSDB_LITE\n", stderr);
    return 0;
  }
  1169. #endif // !ROCKSDB_LITE