/* * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY * KIND, either express or implied. See the License for the * specific language governing permissions and limitations * under the License. */ #include #include #include namespace datasketches { // assume the binary sketches for this test have been generated by datasketches-java code // in the subdirectory called "java" in the root directory of this project static std::string testBinaryInputPath = std::string(TEST_BINARY_INPUT_PATH) + "../../java/"; TEST_CASE("var opt sketch long", "[serde_compat]") { const unsigned n_arr[] = {0, 1, 10, 100, 1000, 10000, 100000, 1000000}; for (const unsigned n: n_arr) { std::ifstream is; is.exceptions(std::ios::failbit | std::ios::badbit); is.open(testBinaryInputPath + "varopt_sketch_long_n" + std::to_string(n) + "_java.sk", std::ios::binary); const auto sketch = var_opt_sketch::deserialize(is); REQUIRE(sketch.is_empty() == (n == 0)); REQUIRE(sketch.get_num_samples() == (n > 10 ? 32 : n)); } } TEST_CASE("var opt sketch: deserialize exact from java", "[serde_compat]") { const double EPS = 1e-13; std::ifstream is; is.exceptions(std::ios::failbit | std::ios::badbit); is.open(testBinaryInputPath + "varopt_sketch_string_exact_java.sk", std::ios::binary); const auto sketch = var_opt_sketch::deserialize(is); REQUIRE_FALSE(sketch.is_empty()); REQUIRE(sketch.get_k() == 1024); REQUIRE(sketch.get_n() == 200); REQUIRE(sketch.get_num_samples() == 200); const subset_summary ss = sketch.estimate_subset_sum([](std::string){ return true; }); double tgt_wt = 0.0; for (int i = 1; i <= 200; ++i) { tgt_wt += 1000.0 / i; } REQUIRE(ss.total_sketch_weight == Approx(tgt_wt).margin(EPS)); } TEST_CASE("var opt sketch: deserialize sampling from java", "[serde_compat]") { const double EPS = 1e-13; std::ifstream is; is.exceptions(std::ios::failbit | std::ios::badbit); is.open(testBinaryInputPath + "varopt_sketch_long_sampling_java.sk", std::ios::binary); const auto sketch = var_opt_sketch::deserialize(is); REQUIRE_FALSE(sketch.is_empty()); REQUIRE(sketch.get_k() == 1024); REQUIRE(sketch.get_n() == 2003); REQUIRE(sketch.get_num_samples() == sketch.get_k()); subset_summary ss = sketch.estimate_subset_sum([](int64_t){ return true; }); REQUIRE(ss.estimate == Approx(332000.0).margin(EPS)); REQUIRE(ss.total_sketch_weight == Approx(332000.0).margin(EPS)); ss = sketch.estimate_subset_sum([](int64_t x){ return x < 0; }); REQUIRE(ss.estimate == 330000.0); // heavy item, weight is exact ss = sketch.estimate_subset_sum([](int64_t x){ return x >= 0; }); REQUIRE(ss.estimate == Approx(2000.0).margin(EPS)); } } /* namespace datasketches */