Skip to content

Commit

Permalink
Add Enumeration support for Array v2 Serialization
Browse files Browse the repository at this point in the history
This adds the new Array::serialize_enumerations() method that indicates
whether enumerations should be loaded and returned for v2 serialization.
  • Loading branch information
davisp committed Aug 31, 2023
1 parent 84172df commit 682a838
Show file tree
Hide file tree
Showing 4 changed files with 93 additions and 2 deletions.
76 changes: 74 additions & 2 deletions test/src/unit-enumerations.cc
Original file line number Diff line number Diff line change
Expand Up @@ -53,6 +53,7 @@

#ifdef TILEDB_SERIALIZATION
#include "tiledb/sm/enums/serialization_type.h"
#include "tiledb/sm/serialization/array.h"
#include "tiledb/sm/serialization/array_schema.h"
#include "tiledb/sm/serialization/array_schema_evolution.h"
#include "tiledb/sm/serialization/query.h"
Expand Down Expand Up @@ -114,6 +115,13 @@ struct EnumerationFx {
void ser_des_query(
Query* q_in, Query* q_out, bool client_side, SerializationType stype);

/**
 * Round-trips an Array through serialization: `in` is serialized into a
 * buffer which is then deserialized into `out`.
 *
 * @param ctx Context whose storage manager is used for deserialization.
 * @param in The array to serialize.
 * @param out The array that receives the deserialized state.
 * @param client_side Forwarded to the array serializer.
 * @param stype The serialization format to use.
 */
void ser_des_array(
    Context& ctx,
    Array* in,
    Array* out,
    bool client_side,
    SerializationType stype);

template <typename T>
bool vec_cmp(std::vector<T> v1, std::vector<T> v2);

Expand Down Expand Up @@ -1550,6 +1558,44 @@ TEST_CASE_METHOD(
REQUIRE(node2->use_enumeration() == true);
}

// Verifies that array (de)serialization with the refactored array open only
// carries loaded enumerations when rest.load_enumerations_on_array_open is
// enabled in the config.
TEST_CASE_METHOD(
    EnumerationFx,
    "Cap'N Proto - Basic Array v2 Serialization",
    "[enumeration][capnp][serialization][v2][array]") {
  auto client_side = GENERATE(true, false);
  auto ser_type = GENERATE(SerializationType::CAPNP, SerializationType::JSON);
  auto do_load = GENERATE(std::string("true"), std::string("false"));

  // The config value is a string; this is the boolean it should map to.
  const bool expect_loaded = (do_load == "true");

  create_array();

  Config cfg;
  throw_if_not_ok(cfg.set("rest.use_refactored_array_open", "true"));
  throw_if_not_ok(cfg.set("rest.load_enumerations_on_array_open", do_load));
  Context ctx(cfg);

  // Open the source array; nothing should be loaded before serialization.
  auto array_in = make_shared<Array>(HERE(), uri_, ctx.storage_manager());
  throw_if_not_ok(array_in->open(
      QueryType::READ, EncryptionType::NO_ENCRYPTION, nullptr, 0));
  REQUIRE(array_in->serialize_enumerations() == expect_loaded);
  REQUIRE(array_in->array_schema_latest_ptr()
              ->get_loaded_enumeration_names()
              .empty());

  // Round-trip into a second, unopened array.
  auto array_out = make_shared<Array>(HERE(), uri_, ctx.storage_manager());
  ser_des_array(ctx, array_in.get(), array_out.get(), client_side, ser_type);

  auto schema = array_out->array_schema_latest_ptr();
  auto all_names = schema->get_enumeration_names();
  auto loaded_names = schema->get_loaded_enumeration_names();

  if (!expect_loaded) {
    REQUIRE(loaded_names.empty());
  } else {
    REQUIRE(vec_cmp(loaded_names, all_names));
  }
}

#endif // ifdef TILEDB_SERIALIZATION

/* ********************************* */
Expand Down Expand Up @@ -1839,9 +1885,9 @@ shared_ptr<ArraySchema> EnumerationFx::create_schema() {
throw_if_not_ok(schema->set_domain(dom));

std::vector<std::string> values = {"ant", "bat", "cat", "dog", "emu"};
auto enmr =
auto enmr1 =
create_enumeration(values, false, Datatype::STRING_ASCII, "test_enmr");
schema->add_enumeration(enmr);
schema->add_enumeration(enmr1);

auto attr1 = make_shared<Attribute>(HERE(), "attr1", Datatype::INT32);
attr1->set_enumeration_name("test_enmr");
Expand All @@ -1850,6 +1896,15 @@ shared_ptr<ArraySchema> EnumerationFx::create_schema() {
auto attr2 = make_shared<Attribute>(HERE(), "attr2", Datatype::STRING_ASCII);
throw_if_not_ok(schema->add_attribute(attr2));

std::vector<std::string> names = {"fred", "wilma", "barney", "betty"};
auto enmr2 =
create_enumeration(names, false, Datatype::STRING_UTF8, "flintstones");
schema->add_enumeration(enmr2);

auto attr3 = make_shared<Attribute>(HERE(), "attr3", Datatype::UINT8);
attr3->set_enumeration_name("flintstones");
throw_if_not_ok(schema->add_attribute(attr3));

return schema;
}

Expand Down Expand Up @@ -1923,6 +1978,18 @@ void EnumerationFx::ser_des_query(
&(ctx_.resources().compute_tp())));
}

/**
 * Serializes `in` into a temporary buffer and deserializes that buffer into
 * `out`. A failed status from either step is passed to throw_if_not_ok.
 */
void EnumerationFx::ser_des_array(
    Context& ctx,
    Array* in,
    Array* out,
    bool client_side,
    SerializationType stype) {
  Buffer wire;

  const auto ser_status =
      serialization::array_serialize(in, stype, &wire, client_side);
  throw_if_not_ok(ser_status);

  const auto des_status = serialization::array_deserialize(
      out, stype, wire, ctx.storage_manager());
  throw_if_not_ok(des_status);
}

#else // No TILEDB_SERIALIZATION

ArraySchema EnumerationFx::ser_des_array_schema(
Expand All @@ -1939,6 +2006,11 @@ void EnumerationFx::ser_des_query(Query*, Query*, bool, SerializationType) {
throw std::logic_error("Serialization not enabled.");
}

void EnumerataionFx::ser_des_array(

Check failure on line 2009 in test/src/unit-enumerations.cc

View workflow job for this annotation

GitHub Actions / ci4 / ubuntu-22.04 - HDFS

‘EnumerataionFx’ has not been declared

Check failure on line 2009 in test/src/unit-enumerations.cc

View workflow job for this annotation

GitHub Actions / ci6 / macos-11 - GCS

use of undeclared identifier 'EnumerataionFx'; did you mean 'EnumerationFx'?

Check failure on line 2009 in test/src/unit-enumerations.cc

View workflow job for this annotation

GitHub Actions / ci6 / macos-11 - GCS

out-of-line definition of 'ser_des_array' does not match any declaration in 'EnumerationFx'

Check failure on line 2009 in test/src/unit-enumerations.cc

View workflow job for this annotation

GitHub Actions / ci10 / macos-11 - AZURE

use of undeclared identifier 'EnumerataionFx'; did you mean 'EnumerationFx'?

Check failure on line 2009 in test/src/unit-enumerations.cc

View workflow job for this annotation

GitHub Actions / ci10 / macos-11 - AZURE

out-of-line definition of 'ser_des_array' does not match any declaration in 'EnumerationFx'

Check failure on line 2009 in test/src/unit-enumerations.cc

View workflow job for this annotation

GitHub Actions / ci1 / ubuntu-22.04 - AZURE

‘EnumerataionFx’ has not been declared

Check failure on line 2009 in test/src/unit-enumerations.cc

View workflow job for this annotation

GitHub Actions / ci2 / ubuntu-20.04 - GCS

‘EnumerataionFx’ has not been declared
Context&, Array*, Array* bool, SerializationType) {

Check failure on line 2010 in test/src/unit-enumerations.cc

View workflow job for this annotation

GitHub Actions / ci4 / ubuntu-22.04 - HDFS

expected ‘,’ or ‘...’ before ‘bool’

Check failure on line 2010 in test/src/unit-enumerations.cc

View workflow job for this annotation

GitHub Actions / ci6 / macos-11 - GCS

invalid parameter name: 'bool' is a keyword

Check failure on line 2010 in test/src/unit-enumerations.cc

View workflow job for this annotation

GitHub Actions / ci10 / macos-11 - AZURE

invalid parameter name: 'bool' is a keyword

Check failure on line 2010 in test/src/unit-enumerations.cc

View workflow job for this annotation

GitHub Actions / ci1 / ubuntu-22.04 - AZURE

expected ‘,’ or ‘...’ before ‘bool’

Check failure on line 2010 in test/src/unit-enumerations.cc

View workflow job for this annotation

GitHub Actions / ci2 / ubuntu-20.04 - GCS

expected ‘,’ or ‘...’ before ‘bool’
throw std::logic_error("Serialization not enabled.");
}

#endif // TILEDB_SERIALIZATION

template <typename T>
Expand Down
10 changes: 10 additions & 0 deletions tiledb/sm/array/array.cc
Original file line number Diff line number Diff line change
Expand Up @@ -1103,6 +1103,16 @@ bool Array::serialize_non_empty_domain() const {
return serialize_ned_array_open;
}

/**
 * Reads the boolean config option rest.load_enumerations_on_array_open.
 *
 * @return The configured value.
 * @throws std::runtime_error if the option has no value in the config.
 */
bool Array::serialize_enumerations() const {
  const auto load_on_open =
      config_.get<bool>("rest.load_enumerations_on_array_open");
  if (load_on_open.has_value()) {
    return load_on_open.value();
  }
  throw std::runtime_error(
      "Cannot get rest.load_enumerations_on_array_open configuration option "
      "from config");
}

bool Array::serialize_metadata() const {
auto found = false;
auto serialize_metadata_array_open = false;
Expand Down
5 changes: 5 additions & 0 deletions tiledb/sm/array/array.h
Original file line number Diff line number Diff line change
Expand Up @@ -536,6 +536,11 @@ class Array {
* open. */
bool serialize_non_empty_domain() const;

/**
* Checks the config to see if enumerations should be serialized on array open.
*/
bool serialize_enumerations() const;

/**
* Checks the config to see if metadata should be serialized on array open.
*/
Expand Down
4 changes: 4 additions & 0 deletions tiledb/sm/serialization/array.cc
Original file line number Diff line number Diff line change
Expand Up @@ -134,6 +134,10 @@ Status array_to_capnp(

array_builder->setQueryType(query_type_str(array->get_query_type()));

if (array->use_refactored_array_open() && array->serialize_enumerations()) {
array->load_all_enumerations();
}

const auto& array_schema_latest = array->array_schema_latest();
auto array_schema_latest_builder = array_builder->initArraySchemaLatest();
RETURN_NOT_OK(array_schema_to_capnp(
Expand Down

0 comments on commit 682a838

Please sign in to comment.