// cassandra_format_test.cc
  1. // Copyright (c) 2017-present, Facebook, Inc. All rights reserved.
  2. // This source code is licensed under both the GPLv2 (found in the
  3. // COPYING file in the root directory) and Apache 2.0 License
  4. // (found in the LICENSE.Apache file in the root directory).
  5. #include <cstring>
  6. #include <memory>
  7. #include "test_util/testharness.h"
  8. #include "utilities/cassandra/format.h"
  9. #include "utilities/cassandra/serialize.h"
  10. #include "utilities/cassandra/test_utils.h"
  11. namespace ROCKSDB_NAMESPACE::cassandra {
  12. TEST(ColumnTest, Column) {
  13. char data[4] = {'d', 'a', 't', 'a'};
  14. int8_t mask = 0;
  15. int8_t index = 1;
  16. int64_t timestamp = 1494022807044;
  17. Column c = Column(mask, index, timestamp, sizeof(data), data);
  18. EXPECT_EQ(c.Index(), index);
  19. EXPECT_EQ(c.Timestamp(), timestamp);
  20. EXPECT_EQ(c.Size(), 14 + sizeof(data));
  21. // Verify the serialization.
  22. std::string dest;
  23. dest.reserve(c.Size() * 2);
  24. c.Serialize(&dest);
  25. EXPECT_EQ(dest.size(), c.Size());
  26. std::size_t offset = 0;
  27. EXPECT_EQ(Deserialize<int8_t>(dest.c_str(), offset), mask);
  28. offset += sizeof(int8_t);
  29. EXPECT_EQ(Deserialize<int8_t>(dest.c_str(), offset), index);
  30. offset += sizeof(int8_t);
  31. EXPECT_EQ(Deserialize<int64_t>(dest.c_str(), offset), timestamp);
  32. offset += sizeof(int64_t);
  33. EXPECT_EQ(Deserialize<int32_t>(dest.c_str(), offset), sizeof(data));
  34. offset += sizeof(int32_t);
  35. EXPECT_TRUE(std::memcmp(data, dest.c_str() + offset, sizeof(data)) == 0);
  36. // Verify the deserialization.
  37. std::string saved_dest = dest;
  38. std::shared_ptr<Column> c1 = Column::Deserialize(saved_dest.c_str(), 0);
  39. EXPECT_EQ(c1->Index(), index);
  40. EXPECT_EQ(c1->Timestamp(), timestamp);
  41. EXPECT_EQ(c1->Size(), 14 + sizeof(data));
  42. c1->Serialize(&dest);
  43. EXPECT_EQ(dest.size(), 2 * c.Size());
  44. EXPECT_TRUE(std::memcmp(dest.c_str(), dest.c_str() + c.Size(), c.Size()) ==
  45. 0);
  46. // Verify the ColumnBase::Deserialization.
  47. saved_dest = dest;
  48. std::shared_ptr<ColumnBase> c2 =
  49. ColumnBase::Deserialize(saved_dest.c_str(), c.Size());
  50. c2->Serialize(&dest);
  51. EXPECT_EQ(dest.size(), 3 * c.Size());
  52. EXPECT_TRUE(std::memcmp(dest.c_str() + c.Size(), dest.c_str() + c.Size() * 2,
  53. c.Size()) == 0);
  54. }
  55. TEST(ExpiringColumnTest, ExpiringColumn) {
  56. char data[4] = {'d', 'a', 't', 'a'};
  57. int8_t mask = ColumnTypeMask::EXPIRATION_MASK;
  58. int8_t index = 3;
  59. int64_t timestamp = 1494022807044;
  60. int32_t ttl = 3600;
  61. ExpiringColumn c =
  62. ExpiringColumn(mask, index, timestamp, sizeof(data), data, ttl);
  63. EXPECT_EQ(c.Index(), index);
  64. EXPECT_EQ(c.Timestamp(), timestamp);
  65. EXPECT_EQ(c.Size(), 18 + sizeof(data));
  66. // Verify the serialization.
  67. std::string dest;
  68. dest.reserve(c.Size() * 2);
  69. c.Serialize(&dest);
  70. EXPECT_EQ(dest.size(), c.Size());
  71. std::size_t offset = 0;
  72. EXPECT_EQ(Deserialize<int8_t>(dest.c_str(), offset), mask);
  73. offset += sizeof(int8_t);
  74. EXPECT_EQ(Deserialize<int8_t>(dest.c_str(), offset), index);
  75. offset += sizeof(int8_t);
  76. EXPECT_EQ(Deserialize<int64_t>(dest.c_str(), offset), timestamp);
  77. offset += sizeof(int64_t);
  78. EXPECT_EQ(Deserialize<int32_t>(dest.c_str(), offset), sizeof(data));
  79. offset += sizeof(int32_t);
  80. EXPECT_TRUE(std::memcmp(data, dest.c_str() + offset, sizeof(data)) == 0);
  81. offset += sizeof(data);
  82. EXPECT_EQ(Deserialize<int32_t>(dest.c_str(), offset), ttl);
  83. // Verify the deserialization.
  84. std::string saved_dest = dest;
  85. std::shared_ptr<ExpiringColumn> c1 =
  86. ExpiringColumn::Deserialize(saved_dest.c_str(), 0);
  87. EXPECT_EQ(c1->Index(), index);
  88. EXPECT_EQ(c1->Timestamp(), timestamp);
  89. EXPECT_EQ(c1->Size(), 18 + sizeof(data));
  90. c1->Serialize(&dest);
  91. EXPECT_EQ(dest.size(), 2 * c.Size());
  92. EXPECT_TRUE(std::memcmp(dest.c_str(), dest.c_str() + c.Size(), c.Size()) ==
  93. 0);
  94. // Verify the ColumnBase::Deserialization.
  95. saved_dest = dest;
  96. std::shared_ptr<ColumnBase> c2 =
  97. ColumnBase::Deserialize(saved_dest.c_str(), c.Size());
  98. c2->Serialize(&dest);
  99. EXPECT_EQ(dest.size(), 3 * c.Size());
  100. EXPECT_TRUE(std::memcmp(dest.c_str() + c.Size(), dest.c_str() + c.Size() * 2,
  101. c.Size()) == 0);
  102. }
  103. TEST(TombstoneTest, TombstoneCollectable) {
  104. int32_t now = (int32_t)time(nullptr);
  105. int32_t gc_grace_seconds = 16440;
  106. int32_t time_delta_seconds = 10;
  107. EXPECT_TRUE(
  108. Tombstone(ColumnTypeMask::DELETION_MASK, 0,
  109. now - gc_grace_seconds - time_delta_seconds,
  110. ToMicroSeconds(now - gc_grace_seconds - time_delta_seconds))
  111. .Collectable(gc_grace_seconds));
  112. EXPECT_FALSE(
  113. Tombstone(ColumnTypeMask::DELETION_MASK, 0,
  114. now - gc_grace_seconds + time_delta_seconds,
  115. ToMicroSeconds(now - gc_grace_seconds + time_delta_seconds))
  116. .Collectable(gc_grace_seconds));
  117. }
  118. TEST(TombstoneTest, Tombstone) {
  119. int8_t mask = ColumnTypeMask::DELETION_MASK;
  120. int8_t index = 2;
  121. int32_t local_deletion_time = 1494022807;
  122. int64_t marked_for_delete_at = 1494022807044;
  123. Tombstone c =
  124. Tombstone(mask, index, local_deletion_time, marked_for_delete_at);
  125. EXPECT_EQ(c.Index(), index);
  126. EXPECT_EQ(c.Timestamp(), marked_for_delete_at);
  127. EXPECT_EQ(c.Size(), 14);
  128. // Verify the serialization.
  129. std::string dest;
  130. dest.reserve(c.Size() * 2);
  131. c.Serialize(&dest);
  132. EXPECT_EQ(dest.size(), c.Size());
  133. std::size_t offset = 0;
  134. EXPECT_EQ(Deserialize<int8_t>(dest.c_str(), offset), mask);
  135. offset += sizeof(int8_t);
  136. EXPECT_EQ(Deserialize<int8_t>(dest.c_str(), offset), index);
  137. offset += sizeof(int8_t);
  138. EXPECT_EQ(Deserialize<int32_t>(dest.c_str(), offset), local_deletion_time);
  139. offset += sizeof(int32_t);
  140. EXPECT_EQ(Deserialize<int64_t>(dest.c_str(), offset), marked_for_delete_at);
  141. // Verify the deserialization.
  142. std::shared_ptr<Tombstone> c1 = Tombstone::Deserialize(dest.c_str(), 0);
  143. EXPECT_EQ(c1->Index(), index);
  144. EXPECT_EQ(c1->Timestamp(), marked_for_delete_at);
  145. EXPECT_EQ(c1->Size(), 14);
  146. c1->Serialize(&dest);
  147. EXPECT_EQ(dest.size(), 2 * c.Size());
  148. EXPECT_TRUE(std::memcmp(dest.c_str(), dest.c_str() + c.Size(), c.Size()) ==
  149. 0);
  150. // Verify the ColumnBase::Deserialization.
  151. std::shared_ptr<ColumnBase> c2 =
  152. ColumnBase::Deserialize(dest.c_str(), c.Size());
  153. c2->Serialize(&dest);
  154. EXPECT_EQ(dest.size(), 3 * c.Size());
  155. EXPECT_TRUE(std::memcmp(dest.c_str() + c.Size(), dest.c_str() + c.Size() * 2,
  156. c.Size()) == 0);
  157. }
  158. class RowValueTest : public testing::Test {};
  159. TEST(RowValueTest, RowTombstone) {
  160. int32_t local_deletion_time = 1494022807;
  161. int64_t marked_for_delete_at = 1494022807044;
  162. RowValue r = RowValue(local_deletion_time, marked_for_delete_at);
  163. EXPECT_EQ(r.Size(), 12);
  164. EXPECT_EQ(r.IsTombstone(), true);
  165. EXPECT_EQ(r.LastModifiedTime(), marked_for_delete_at);
  166. // Verify the serialization.
  167. std::string dest;
  168. dest.reserve(r.Size() * 2);
  169. r.Serialize(&dest);
  170. EXPECT_EQ(dest.size(), r.Size());
  171. std::size_t offset = 0;
  172. EXPECT_EQ(Deserialize<int32_t>(dest.c_str(), offset), local_deletion_time);
  173. offset += sizeof(int32_t);
  174. EXPECT_EQ(Deserialize<int64_t>(dest.c_str(), offset), marked_for_delete_at);
  175. // Verify the deserialization.
  176. RowValue r1 = RowValue::Deserialize(dest.c_str(), r.Size());
  177. EXPECT_EQ(r1.Size(), 12);
  178. EXPECT_EQ(r1.IsTombstone(), true);
  179. EXPECT_EQ(r1.LastModifiedTime(), marked_for_delete_at);
  180. r1.Serialize(&dest);
  181. EXPECT_EQ(dest.size(), 2 * r.Size());
  182. EXPECT_TRUE(std::memcmp(dest.c_str(), dest.c_str() + r.Size(), r.Size()) ==
  183. 0);
  184. }
  185. TEST(RowValueTest, RowWithColumns) {
  186. std::vector<std::shared_ptr<ColumnBase>> columns;
  187. int64_t last_modified_time = 1494022807048;
  188. std::size_t columns_data_size = 0;
  189. char e_data[5] = {'e', 'd', 'a', 't', 'a'};
  190. int8_t e_index = 0;
  191. int64_t e_timestamp = 1494022807044;
  192. int32_t e_ttl = 3600;
  193. columns.push_back(std::shared_ptr<ExpiringColumn>(
  194. new ExpiringColumn(ColumnTypeMask::EXPIRATION_MASK, e_index, e_timestamp,
  195. sizeof(e_data), e_data, e_ttl)));
  196. columns_data_size += columns[0]->Size();
  197. char c_data[4] = {'d', 'a', 't', 'a'};
  198. int8_t c_index = 1;
  199. int64_t c_timestamp = 1494022807048;
  200. columns.push_back(std::shared_ptr<Column>(
  201. new Column(0, c_index, c_timestamp, sizeof(c_data), c_data)));
  202. columns_data_size += columns[1]->Size();
  203. int8_t t_index = 2;
  204. int32_t t_local_deletion_time = 1494022801;
  205. int64_t t_marked_for_delete_at = 1494022807043;
  206. columns.push_back(std::shared_ptr<Tombstone>(
  207. new Tombstone(ColumnTypeMask::DELETION_MASK, t_index,
  208. t_local_deletion_time, t_marked_for_delete_at)));
  209. columns_data_size += columns[2]->Size();
  210. RowValue r = RowValue(std::move(columns), last_modified_time);
  211. EXPECT_EQ(r.Size(), columns_data_size + 12);
  212. EXPECT_EQ(r.IsTombstone(), false);
  213. EXPECT_EQ(r.LastModifiedTime(), last_modified_time);
  214. // Verify the serialization.
  215. std::string dest;
  216. dest.reserve(r.Size() * 2);
  217. r.Serialize(&dest);
  218. EXPECT_EQ(dest.size(), r.Size());
  219. std::size_t offset = 0;
  220. EXPECT_EQ(Deserialize<int32_t>(dest.c_str(), offset),
  221. std::numeric_limits<int32_t>::max());
  222. offset += sizeof(int32_t);
  223. EXPECT_EQ(Deserialize<int64_t>(dest.c_str(), offset),
  224. std::numeric_limits<int64_t>::min());
  225. offset += sizeof(int64_t);
  226. // Column0: ExpiringColumn
  227. EXPECT_EQ(Deserialize<int8_t>(dest.c_str(), offset),
  228. ColumnTypeMask::EXPIRATION_MASK);
  229. offset += sizeof(int8_t);
  230. EXPECT_EQ(Deserialize<int8_t>(dest.c_str(), offset), e_index);
  231. offset += sizeof(int8_t);
  232. EXPECT_EQ(Deserialize<int64_t>(dest.c_str(), offset), e_timestamp);
  233. offset += sizeof(int64_t);
  234. EXPECT_EQ(Deserialize<int32_t>(dest.c_str(), offset), sizeof(e_data));
  235. offset += sizeof(int32_t);
  236. EXPECT_TRUE(std::memcmp(e_data, dest.c_str() + offset, sizeof(e_data)) == 0);
  237. offset += sizeof(e_data);
  238. EXPECT_EQ(Deserialize<int32_t>(dest.c_str(), offset), e_ttl);
  239. offset += sizeof(int32_t);
  240. // Column1: Column
  241. EXPECT_EQ(Deserialize<int8_t>(dest.c_str(), offset), 0);
  242. offset += sizeof(int8_t);
  243. EXPECT_EQ(Deserialize<int8_t>(dest.c_str(), offset), c_index);
  244. offset += sizeof(int8_t);
  245. EXPECT_EQ(Deserialize<int64_t>(dest.c_str(), offset), c_timestamp);
  246. offset += sizeof(int64_t);
  247. EXPECT_EQ(Deserialize<int32_t>(dest.c_str(), offset), sizeof(c_data));
  248. offset += sizeof(int32_t);
  249. EXPECT_TRUE(std::memcmp(c_data, dest.c_str() + offset, sizeof(c_data)) == 0);
  250. offset += sizeof(c_data);
  251. // Column2: Tombstone
  252. EXPECT_EQ(Deserialize<int8_t>(dest.c_str(), offset),
  253. ColumnTypeMask::DELETION_MASK);
  254. offset += sizeof(int8_t);
  255. EXPECT_EQ(Deserialize<int8_t>(dest.c_str(), offset), t_index);
  256. offset += sizeof(int8_t);
  257. EXPECT_EQ(Deserialize<int32_t>(dest.c_str(), offset), t_local_deletion_time);
  258. offset += sizeof(int32_t);
  259. EXPECT_EQ(Deserialize<int64_t>(dest.c_str(), offset), t_marked_for_delete_at);
  260. // Verify the deserialization.
  261. RowValue r1 = RowValue::Deserialize(dest.c_str(), r.Size());
  262. EXPECT_EQ(r1.Size(), columns_data_size + 12);
  263. EXPECT_EQ(r1.IsTombstone(), false);
  264. EXPECT_EQ(r1.LastModifiedTime(), last_modified_time);
  265. r1.Serialize(&dest);
  266. EXPECT_EQ(dest.size(), 2 * r.Size());
  267. EXPECT_TRUE(std::memcmp(dest.c_str(), dest.c_str() + r.Size(), r.Size()) ==
  268. 0);
  269. }
  270. TEST(RowValueTest, PurgeTtlShouldRemvoeAllColumnsExpired) {
  271. int64_t now = time(nullptr);
  272. auto row_value = CreateTestRowValue(
  273. {CreateTestColumnSpec(kColumn, 0, ToMicroSeconds(now)),
  274. CreateTestColumnSpec(kExpiringColumn, 1,
  275. ToMicroSeconds(now - kTtl - 10)), // expired
  276. CreateTestColumnSpec(kExpiringColumn, 2,
  277. ToMicroSeconds(now)), // not expired
  278. CreateTestColumnSpec(kTombstone, 3, ToMicroSeconds(now))});
  279. bool changed = false;
  280. auto purged = row_value.RemoveExpiredColumns(&changed);
  281. EXPECT_TRUE(changed);
  282. EXPECT_EQ(purged.get_columns().size(), 3);
  283. VerifyRowValueColumns(purged.get_columns(), 0, kColumn, 0,
  284. ToMicroSeconds(now));
  285. VerifyRowValueColumns(purged.get_columns(), 1, kExpiringColumn, 2,
  286. ToMicroSeconds(now));
  287. VerifyRowValueColumns(purged.get_columns(), 2, kTombstone, 3,
  288. ToMicroSeconds(now));
  289. purged.RemoveExpiredColumns(&changed);
  290. EXPECT_FALSE(changed);
  291. }
  292. TEST(RowValueTest, ExpireTtlShouldConvertExpiredColumnsToTombstones) {
  293. int64_t now = time(nullptr);
  294. auto row_value = CreateTestRowValue(
  295. {CreateTestColumnSpec(kColumn, 0, ToMicroSeconds(now)),
  296. CreateTestColumnSpec(kExpiringColumn, 1,
  297. ToMicroSeconds(now - kTtl - 10)), // expired
  298. CreateTestColumnSpec(kExpiringColumn, 2,
  299. ToMicroSeconds(now)), // not expired
  300. CreateTestColumnSpec(kTombstone, 3, ToMicroSeconds(now))});
  301. bool changed = false;
  302. auto compacted = row_value.ConvertExpiredColumnsToTombstones(&changed);
  303. EXPECT_TRUE(changed);
  304. EXPECT_EQ(compacted.get_columns().size(), 4);
  305. VerifyRowValueColumns(compacted.get_columns(), 0, kColumn, 0,
  306. ToMicroSeconds(now));
  307. VerifyRowValueColumns(compacted.get_columns(), 1, kTombstone, 1,
  308. ToMicroSeconds(now - 10));
  309. VerifyRowValueColumns(compacted.get_columns(), 2, kExpiringColumn, 2,
  310. ToMicroSeconds(now));
  311. VerifyRowValueColumns(compacted.get_columns(), 3, kTombstone, 3,
  312. ToMicroSeconds(now));
  313. compacted.ConvertExpiredColumnsToTombstones(&changed);
  314. EXPECT_FALSE(changed);
  315. }
  316. } // namespace ROCKSDB_NAMESPACE::cassandra
  317. int main(int argc, char** argv) {
  318. ROCKSDB_NAMESPACE::port::InstallStackTraceHandler();
  319. ::testing::InitGoogleTest(&argc, argv);
  320. return RUN_ALL_TESTS();
  321. }