/* * Copyright 2018, Oath Inc. Licensed under the terms of the * Apache License 2.0. See LICENSE file at the project root for terms. */ #include "hll.hpp" #include "CouponHashSet.hpp" #include "HllSketch.hpp" #include "HllUtil.hpp" #include #include #include #include #include #include namespace datasketches { class CouponHashSetTest : public CppUnit::TestFixture { CPPUNIT_TEST_SUITE(CouponHashSetTest); CPPUNIT_TEST(checkCorruptBytearray); CPPUNIT_TEST(checkCorruptStream); CPPUNIT_TEST_SUITE_END(); void checkCorruptBytearray() { int lgK = 8; hll_sketch sk1 = HllSketch::newInstance(lgK); for (int i = 0; i < 24; ++i) { sk1->update(i); } std::pair, size_t> sketchBytes = sk1->serializeUpdatable(); uint8_t* bytes = sketchBytes.first.get(); bytes[HllUtil::PREAMBLE_INTS_BYTE] = 0; // fail in HllSketchImpl CPPUNIT_ASSERT_THROW_MESSAGE("Failed to detect error in preInts byte", HllSketch::deserialize(bytes, sketchBytes.second), std::invalid_argument); // fail in CouponHashSet CPPUNIT_ASSERT_THROW_MESSAGE("Failed to detect error in preInts byte", CouponHashSet::newSet(bytes, sketchBytes.second), std::invalid_argument); bytes[HllUtil::PREAMBLE_INTS_BYTE] = HllUtil::HASH_SET_PREINTS; bytes[HllUtil::SER_VER_BYTE] = 0; CPPUNIT_ASSERT_THROW_MESSAGE("Failed to detect error in serialization version byte", HllSketch::deserialize(bytes, sketchBytes.second), std::invalid_argument); bytes[HllUtil::SER_VER_BYTE] = HllUtil::SER_VER; bytes[HllUtil::FAMILY_BYTE] = 0; CPPUNIT_ASSERT_THROW_MESSAGE("Failed to detect error in family id byte", HllSketch::deserialize(bytes, sketchBytes.second), std::invalid_argument); bytes[HllUtil::FAMILY_BYTE] = HllUtil::FAMILY_ID; bytes[HllUtil::LG_K_BYTE] = 6; CPPUNIT_ASSERT_THROW_MESSAGE("Failed to detect too small a lgK for Set mode", HllSketch::deserialize(bytes, sketchBytes.second), std::invalid_argument); bytes[HllUtil::LG_K_BYTE] = lgK; uint8_t tmp = bytes[HllUtil::MODE_BYTE]; bytes[HllUtil::MODE_BYTE] = 0x10; // HLL_6, LIST CPPUNIT_ASSERT_THROW_MESSAGE("Failed to detect error in mode byte", HllSketch::deserialize(bytes, sketchBytes.second), std::invalid_argument); bytes[HllUtil::MODE_BYTE] = tmp; tmp = bytes[HllUtil::LG_ARR_BYTE]; bytes[HllUtil::LG_ARR_BYTE] = 0; HllSketch::deserialize(bytes, sketchBytes.second); // should work fine despite the corruption bytes[HllUtil::LG_ARR_BYTE] = tmp; CPPUNIT_ASSERT_THROW_MESSAGE("Failed to detect error in serialized length", HllSketch::deserialize(bytes, sketchBytes.second - 1), std::invalid_argument); CPPUNIT_ASSERT_THROW_MESSAGE("Failed to detect error in serialized length", HllSketch::deserialize(bytes, 3), std::invalid_argument); } void checkCorruptStream() { int lgK = 9; hll_sketch sk1 = HllSketch::newInstance(lgK); for (int i = 0; i < 24; ++i) { sk1->update(i); } std::stringstream ss; sk1->serializeCompact(ss); ss.seekp(HllUtil::PREAMBLE_INTS_BYTE); ss.put(0); ss.seekg(0); // fail in HllSketchImpl CPPUNIT_ASSERT_THROW_MESSAGE("Failed to detect error in preInts byte", HllSketch::deserialize(ss), std::invalid_argument); // fail in CouponHashSet CPPUNIT_ASSERT_THROW_MESSAGE("Failed to detect error in preInts byte", CouponHashSet::newSet(ss), std::invalid_argument); ss.seekp(HllUtil::PREAMBLE_INTS_BYTE); ss.put(HllUtil::HASH_SET_PREINTS); ss.seekp(HllUtil::SER_VER_BYTE); ss.put(0); ss.seekg(0); CPPUNIT_ASSERT_THROW_MESSAGE("Failed to detect error in serialization version byte", HllSketch::deserialize(ss), std::invalid_argument); ss.seekp(HllUtil::SER_VER_BYTE); ss.put(HllUtil::SER_VER); ss.seekp(HllUtil::FAMILY_BYTE); ss.put(0); ss.seekg(0); CPPUNIT_ASSERT_THROW_MESSAGE("Failed to detect error in family id byte", HllSketch::deserialize(ss), std::invalid_argument); ss.seekp(HllUtil::FAMILY_BYTE); ss.put(HllUtil::FAMILY_ID); ss.seekg(HllUtil::MODE_BYTE); uint8_t tmp = ss.get(); ss.seekp(HllUtil::MODE_BYTE); ss.put(0x22); // HLL_8, HLL ss.seekg(0); CPPUNIT_ASSERT_THROW_MESSAGE("Failed to detect error in mode byte", HllSketch::deserialize(ss), std::invalid_argument); ss.seekp(HllUtil::MODE_BYTE); ss.put(tmp); ss.seekg(HllUtil::LG_ARR_BYTE); tmp = ss.get(); ss.seekp(HllUtil::LG_ARR_BYTE); ss.put(0); ss.seekg(0); HllSketch::deserialize(ss); // should work fine despite the corruption ss.seekp(HllUtil::LG_ARR_BYTE); ss.put(tmp); } }; CPPUNIT_TEST_SUITE_REGISTRATION(CouponHashSetTest); } // namespace datasketches