From 0cdeb5afcf3cc8b4645822c69e0eb88b2f815502 Mon Sep 17 00:00:00 2001 From: Tao He Date: Sat, 20 Jan 2024 15:33:51 +0800 Subject: [PATCH] Enable date and time types support in vineyard-graph (and GIE) Signed-off-by: Tao He --- .../build-graphscope-wheels-macos.yml | 2 +- .github/workflows/gae.yml | 2 +- .../networkx-forward-algo-nightly.yml | 2 +- .github/workflows/nightly.yml | 2 +- .../core/object/fragment_wrapper.h | 72 ++++ .../groot/common/meta/DataType.java | 15 + .../groot/common/meta/InternalDataType.java | 13 +- .../groot/common/schema/wrapper/DataType.java | 6 + .../gremlin/result/ParserUtils.java | 38 +- .../src/adapters/gs_store/details.rs | 15 + .../executor/store/global_query/Cargo.toml | 1 + .../store_impl/v6d/native/global_store_ffi.cc | 46 +++ .../store_impl/v6d/native/global_store_ffi.h | 32 ++ .../src/store_impl/v6d/native/htap_ds_impl.cc | 229 ++++++++++- .../src/store_impl/v6d/native/htap_ds_impl.h | 18 + .../src/store_impl/v6d/read_ffi.rs | 367 +++++++++++++++++- k8s/Makefile | 2 +- .../manylinux/Makefile | 2 +- k8s/internal/Makefile | 2 +- proto/schema_common.proto | 14 + python/graphscope/framework/utils.py | 28 ++ python/graphscope/tests/minitest/test_min.py | 99 +++++ scripts/install_deps.sh | 4 +- 23 files changed, 983 insertions(+), 28 deletions(-) diff --git a/.github/workflows/build-graphscope-wheels-macos.yml b/.github/workflows/build-graphscope-wheels-macos.yml index b1df3832cb03..d235887fcd00 100644 --- a/.github/workflows/build-graphscope-wheels-macos.yml +++ b/.github/workflows/build-graphscope-wheels-macos.yml @@ -185,7 +185,7 @@ jobs: run: | . ~/.graphscope_env python3 -m pip install libclang - git clone --single-branch -b v0.18.2 --depth=1 https://github.com/v6d-io/v6d.git /tmp/v6d + git clone --single-branch -b v0.20.1 --depth=1 https://github.com/v6d-io/v6d.git /tmp/v6d cd /tmp/v6d git submodule update --init cmake . -DCMAKE_INSTALL_PREFIX=/usr/local \ diff --git a/.github/workflows/gae.yml b/.github/workflows/gae.yml index 004ba6b9f314..eaec5434ea5d 100644 --- a/.github/workflows/gae.yml +++ b/.github/workflows/gae.yml @@ -30,7 +30,7 @@ jobs: runs-on: ubuntu-20.04 if: ${{ github.repository == 'alibaba/GraphScope' }} container: - image: registry.cn-hongkong.aliyuncs.com/graphscope/graphscope-dev:v0.18.2 + image: registry.cn-hongkong.aliyuncs.com/graphscope/graphscope-dev:v0.20.1 steps: - uses: actions/checkout@v3 diff --git a/.github/workflows/networkx-forward-algo-nightly.yml b/.github/workflows/networkx-forward-algo-nightly.yml index 80ef55087777..977c0d82c0e3 100644 --- a/.github/workflows/networkx-forward-algo-nightly.yml +++ b/.github/workflows/networkx-forward-algo-nightly.yml @@ -17,7 +17,7 @@ jobs: run: shell: bash --noprofile --norc -eo pipefail {0} container: - image: registry.cn-hongkong.aliyuncs.com/graphscope/graphscope-dev:v0.18.2 + image: registry.cn-hongkong.aliyuncs.com/graphscope/graphscope-dev:v0.20.1 options: --shm-size 4096m diff --git a/.github/workflows/nightly.yml b/.github/workflows/nightly.yml index 9b52d81dd960..122f5d709379 100644 --- a/.github/workflows/nightly.yml +++ b/.github/workflows/nightly.yml @@ -44,7 +44,7 @@ jobs: sudo mkdir /opt/graphscope sudo chown -R $(id -u):$(id -g) /opt/graphscope python3 -m pip install click - python3 gsctl.py install-deps dev --v6d-version v0.18.2 + python3 gsctl.py install-deps dev --v6d-version v0.20.1 - name: Setup tmate session if: false diff --git a/analytical_engine/core/object/fragment_wrapper.h b/analytical_engine/core/object/fragment_wrapper.h index 0ade61758f8a..f35c6f04bffc 100644 --- a/analytical_engine/core/object/fragment_wrapper.h +++ b/analytical_engine/core/object/fragment_wrapper.h @@ -93,6 +93,46 @@ gs::rpc::graph::DataTypePb PropertyTypeToPb(vineyard::PropertyType type) { return gs::rpc::graph::DataTypePb::STRING; } else if (arrow::large_utf8()->Equals(type)) { return gs::rpc::graph::DataTypePb::STRING; + } else if (arrow::date32()->Equals(type)) { + return gs::rpc::graph::DataTypePb::DATE32; + } else if (arrow::date64()->Equals(type)) { + return gs::rpc::graph::DataTypePb::DATE64; + } else if (type->id() == arrow::Type::TIME32) { + auto time32_type = std::dynamic_pointer_cast(type); + switch (time32_type->unit()) { + case arrow::TimeUnit::SECOND: + return gs::rpc::graph::DataTypePb::TIME32_S; + case arrow::TimeUnit::MILLI: + return gs::rpc::graph::DataTypePb::TIME32_MS; + case arrow::TimeUnit::MICRO: + return gs::rpc::graph::DataTypePb::TIME32_US; + case arrow::TimeUnit::NANO: + return gs::rpc::graph::DataTypePb::TIME32_NS; + } + } else if (type->id() == arrow::Type::TIME64) { + auto time64_type = std::dynamic_pointer_cast(type); + switch (time64_type->unit()) { + case arrow::TimeUnit::SECOND: + return gs::rpc::graph::DataTypePb::TIME64_S; + case arrow::TimeUnit::MILLI: + return gs::rpc::graph::DataTypePb::TIME64_MS; + case arrow::TimeUnit::MICRO: + return gs::rpc::graph::DataTypePb::TIME64_US; + case arrow::TimeUnit::NANO: + return gs::rpc::graph::DataTypePb::TIME64_NS; + } + } else if (type->id() == arrow::Type::TIMESTAMP) { + auto timestamp_type = std::dynamic_pointer_cast(type); + switch (timestamp_type->unit()) { + case arrow::TimeUnit::SECOND: + return gs::rpc::graph::DataTypePb::TIMESTAMP_S; + case arrow::TimeUnit::MILLI: + return gs::rpc::graph::DataTypePb::TIMESTAMP_MS; + case arrow::TimeUnit::MICRO: + return gs::rpc::graph::DataTypePb::TIMESTAMP_US; + case arrow::TimeUnit::NANO: + return gs::rpc::graph::DataTypePb::TIMESTAMP_NS; + } } else if (arrow::large_list(arrow::int32())->Equals(type)) { return gs::rpc::graph::DataTypePb::INT_LIST; } else if (arrow::large_list(arrow::int64())->Equals(type)) { @@ -138,6 +178,38 @@ gs::rpc::graph::DataTypePb PropertyTypeToPb(const std::string& type) { return gs::rpc::graph::DataTypePb::LONG_LIST; } else if (type == "float_list") { return gs::rpc::graph::DataTypePb::FLOAT_LIST; + } else if (type == "date32[day]") { + return gs::rpc::graph::DataTypePb::DATE32; + } else if (type == "date64[ms]") { + return gs::rpc::graph::DataTypePb::DATE64; + } else if (type == "time32[s]") { + return gs::rpc::graph::DataTypePb::TIME32_S; + } else if (type == "time32[ms]") { + return gs::rpc::graph::DataTypePb::TIME32_MS; + } else if (type == "time32[us]") { + return gs::rpc::graph::DataTypePb::TIME32_US; + } else if (type == "time32[ns]") { + return gs::rpc::graph::DataTypePb::TIME32_NS; + } else if (type == "time64[s]") { + return gs::rpc::graph::DataTypePb::TIME64_S; + } else if (type == "time64[ms]") { + return gs::rpc::graph::DataTypePb::TIME64_MS; + } else if (type == "time64[us]") { + return gs::rpc::graph::DataTypePb::TIME64_US; + } else if (type == "time64[ns]") { + return gs::rpc::graph::DataTypePb::TIME64_NS; + } else if (type.substr(0, std::string("timestamp[s]").length()) == + "timestamp[s]") { + return gs::rpc::graph::DataTypePb::TIMESTAMP_S; + } else if (type.substr(0, std::string("timestamp[ms]").length()) == + "timestamp[ms]") { + return gs::rpc::graph::DataTypePb::TIMESTAMP_MS; + } else if (type.substr(0, std::string("timestamp[us]").length()) == + "timestamp[us]") { + return gs::rpc::graph::DataTypePb::TIMESTAMP_US; + } else if (type.substr(0, std::string("timestamp[ns]").length()) == + "timestamp[ns]") { + return gs::rpc::graph::DataTypePb::TIMESTAMP_NS; } else if (type == "double_list") { return gs::rpc::graph::DataTypePb::DOUBLE_LIST; } else if (type == "string_list" || type == "str_list") { diff --git a/interactive_engine/common/src/main/java/com/alibaba/graphscope/groot/common/meta/DataType.java b/interactive_engine/common/src/main/java/com/alibaba/graphscope/groot/common/meta/DataType.java index 5ab1f4c9cba1..009bdabe6947 100644 --- a/interactive_engine/common/src/main/java/com/alibaba/graphscope/groot/common/meta/DataType.java +++ b/interactive_engine/common/src/main/java/com/alibaba/graphscope/groot/common/meta/DataType.java @@ -43,7 +43,13 @@ public class DataType { public static final DataType DOUBLE = new DataType(InternalDataType.DOUBLE); public static final DataType BYTES = new DataType(InternalDataType.BYTES); public static final DataType STRING = new DataType(InternalDataType.STRING); + + // See also: `Date32` in common.proto. public static final DataType DATE = new DataType(InternalDataType.DATE); + // See also: `Time32` in common.proto. + public static final DataType TIME = new DataType(InternalDataType.TIME); + // See also: `Timestamp` in common.proto. + public static final DataType TIMESTAMP = new DataType(InternalDataType.TIMESTAMP); // For LIST, SET and MAP @JsonProperty private String expression; @@ -58,6 +64,15 @@ public static DataType toDataType(int i) { } public static DataType valueOf(String typeName) { + if (typeName.startsWith("DATE")) { + return DATE; + } + if (typeName.startsWith("TIME")) { + return TIME; + } + if (typeName.startsWith("TIMESTAMP")) { + return TIMESTAMP; + } return new DataType(InternalDataType.valueOf(typeName)); } diff --git a/interactive_engine/common/src/main/java/com/alibaba/graphscope/groot/common/meta/InternalDataType.java b/interactive_engine/common/src/main/java/com/alibaba/graphscope/groot/common/meta/InternalDataType.java index 1ced3999de93..4cc8b352f77c 100644 --- a/interactive_engine/common/src/main/java/com/alibaba/graphscope/groot/common/meta/InternalDataType.java +++ b/interactive_engine/common/src/main/java/com/alibaba/graphscope/groot/common/meta/InternalDataType.java @@ -56,10 +56,19 @@ public enum InternalDataType { * STRING data type in InteractiveEngine, map to String in Java */ STRING, + /** - * INT data type in InteractiveEngine, map to Integer(int) in Java + * Date data type in InteractiveEngine, map to DateValue in Java */ DATE, + /** + * Date data type in InteractiveEngine, map to TimeValue in Java + */ + TIME, + /** + * Date data type in InteractiveEngine, map to DateTimeValue in Java + */ + TIMESTAMP, /** * SET data type, Collection Type, can mixed with list and map, example:Set, value: List,List>> @@ -94,6 +103,8 @@ public enum InternalDataType { && value != UNKNOWN && value != CHAR && value != DATE + && value != TIME + && value != TIMESTAMP && value != SHORT) { primitiveTypes.add(value.name()); } diff --git a/interactive_engine/common/src/main/java/com/alibaba/graphscope/groot/common/schema/wrapper/DataType.java b/interactive_engine/common/src/main/java/com/alibaba/graphscope/groot/common/schema/wrapper/DataType.java index 33d52ffa0431..3b90f8eebfc0 100644 --- a/interactive_engine/common/src/main/java/com/alibaba/graphscope/groot/common/schema/wrapper/DataType.java +++ b/interactive_engine/common/src/main/java/com/alibaba/graphscope/groot/common/schema/wrapper/DataType.java @@ -147,6 +147,12 @@ public static DataType parseFromDataType( case DATE: return DataType.STRING; + case TIME: + return DataType.STRING; + + case TIMESTAMP: + return DataType.STRING; + case BYTES: return DataType.BYTES; diff --git a/interactive_engine/compiler/src/main/java/com/alibaba/graphscope/gremlin/result/ParserUtils.java b/interactive_engine/compiler/src/main/java/com/alibaba/graphscope/gremlin/result/ParserUtils.java index a08d6729f588..5250c9df033c 100644 --- a/interactive_engine/compiler/src/main/java/com/alibaba/graphscope/gremlin/result/ParserUtils.java +++ b/interactive_engine/compiler/src/main/java/com/alibaba/graphscope/gremlin/result/ParserUtils.java @@ -22,6 +22,7 @@ import com.alibaba.graphscope.gaia.proto.IrResult; import com.alibaba.graphscope.gremlin.exception.GremlinResultParserException; +import com.google.common.base.Preconditions; import org.apache.tinkerpop.gremlin.structure.Edge; import org.apache.tinkerpop.gremlin.structure.Vertex; import org.apache.tinkerpop.gremlin.structure.util.detached.DetachedEdge; @@ -29,10 +30,9 @@ import org.slf4j.Logger; import org.slf4j.LoggerFactory; -import java.util.HashMap; -import java.util.LinkedHashMap; -import java.util.List; -import java.util.Map; +import java.sql.Timestamp; +import java.time.*; +import java.util.*; import java.util.stream.Collectors; public class ParserUtils { @@ -91,6 +91,36 @@ private static Object parseCommonValue(Common.Value value) { return value.getF64(); case STR: return value.getStr(); + case DATE: + Preconditions.checkArgument(value.getDate().getItem() >= 0, + "Date prior to 1970-00-00 is not supported, got %d", value.getDate().getItem()); + return new Date(((long) value.getDate().getItem()) * 24 * 60 * 60 * 1000); + case TIME: + Preconditions.checkArgument(value.getTime().getItem() >= 0, + "Time of day must be greater than 00:00:00, got %d", value.getTime().getItem()); + // gremlin-python doesn't support local time + // + // see also: https://github.com/apache/tinkerpop/blob/master/gremlin-python/src/main/python/gremlin_python/structure/io/graphbinaryV1.py#L105-L107 + OffsetTime time = LocalTime.ofNanoOfDay(((long) value.getTime().getItem()) * 1000_000L).atOffset(ZoneOffset.UTC); + // to ISO-8601 formats: HH:mm:ss.SSSSSS + // + // see also: + // - https://docs.oracle.com/javase/8/docs/api/java/time/LocalTime.html#toString-- + // - https://docs.oracle.com/javase/8/docs/api/java/time/OffsetTime.html#toString-- + return time.toString(); + case TIMESTAMP: + Preconditions.checkArgument(value.getTimestamp().getItem() >= 0, + "Timestamp prior to 1970-00-00 00:00:00 is not supported, got %d", value.getTimestamp().getItem()); + // gremlin-python will convert timestamp to float, that isn't what we want + // + // see also: https://github.com/apache/tinkerpop/blob/master/gremlin-python/src/main/python/gremlin_python/statics.py#L48 + // + // We use java.util.Instant rather than java.sql.Timestamp for a UTC timestamp value + OffsetDateTime ts = Instant.ofEpochSecond(value.getTimestamp().getItem() / 1000L, value.getTimestamp().getItem() % 1000L * 1000_000L).atOffset(ZoneOffset.UTC); + // to ISO-8601 format: uuuu-MM-dd'T'HH:mm:ss.SSSSSSXXXXX + // + // see also: https://docs.oracle.com/javase/8/docs/api/java/time/OffsetDateTime.html#toString-- + return ts.toString(); case PAIR_ARRAY: Common.PairArray pairs = value.getPairArray(); Map pairInMap = new HashMap(); diff --git a/interactive_engine/executor/ir/graph_proxy/src/adapters/gs_store/details.rs b/interactive_engine/executor/ir/graph_proxy/src/adapters/gs_store/details.rs index 909f7189644e..007fd1049aa3 100644 --- a/interactive_engine/executor/ir/graph_proxy/src/adapters/gs_store/details.rs +++ b/interactive_engine/executor/ir/graph_proxy/src/adapters/gs_store/details.rs @@ -16,6 +16,9 @@ use std::fmt; use ahash::HashMap; +use chrono::{NaiveDate, NaiveDateTime, NaiveTime, Datelike, Timelike}; + +use dyn_type::DateTimeFormats; use dyn_type::Object; use dyn_type::Primitives; use global_query::store_api::prelude::Property; @@ -52,6 +55,18 @@ fn encode_runtime_prop_val(prop_val: Property) -> Object { Property::Double(d) => Object::Primitive(Primitives::Float(d)), Property::Bytes(v) => Object::Blob(v.into_boxed_slice()), Property::String(s) => Object::String(s), + Property::Date(s) => { + match NaiveDate::parse_from_str(&s, "%Y-%m-%d") { + Ok(date) => Object::DateFormat(DateTimeFormats::Date(date)), + Err(_) => match NaiveTime::parse_from_str(&s, "%H:%M:%S.%6f") { + Ok(time) => Object::DateFormat(DateTimeFormats::Time(time)), + Err(_) => match NaiveDateTime::parse_from_str(&s, "%Y-%m-%d %H:%M:%S.%6f") { + Ok(datetime) => Object::DateFormat(DateTimeFormats::DateTime(datetime)), + Err(_) => unimplemented!("Failed to parse the datetime/timestamp property value: '{}'", s), + } + } + } + }, _ => unimplemented!(), } } diff --git a/interactive_engine/executor/store/global_query/Cargo.toml b/interactive_engine/executor/store/global_query/Cargo.toml index c3611fbadade..0f4c429ae833 100644 --- a/interactive_engine/executor/store/global_query/Cargo.toml +++ b/interactive_engine/executor/store/global_query/Cargo.toml @@ -6,6 +6,7 @@ edition = "2021" # See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html [dependencies] +chrono = "0.4" log = "0.4" itertools = "0.10" byteorder = "1.4.3" diff --git a/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/global_store_ffi.cc b/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/global_store_ffi.cc index 2204aaf02160..52bc69f9031b 100644 --- a/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/global_store_ffi.cc +++ b/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/global_store_ffi.cc @@ -570,6 +570,52 @@ int v6d_get_property_as_string_list(Property* property, const char*** out, return htap_impl::get_property_as_string_list(property, out, out_len, out_num); } +int v6d_get_property_as_date32(struct Property* property, int32_t *out) { + return htap_impl::get_property_as_date32(property, out); +} +int v6d_get_property_as_date64(struct Property* property, int64_t *out) { + return htap_impl::get_property_as_date64(property, out); +} +int v6d_get_property_as_time32_s(struct Property* property, int32_t *out) { + return htap_impl::get_property_as_time32_s(property, out); +} +int v6d_get_property_as_time32_ms(struct Property* property, int32_t *out) { + return htap_impl::get_property_as_time32_ms(property, out); +} +int v6d_get_property_as_time32_us(struct Property* property, int32_t *out) { + return htap_impl::get_property_as_time32_us(property, out); +} +int v6d_get_property_as_time32_ns(struct Property* property, int32_t *out) { + return htap_impl::get_property_as_time32_ns(property, out); +} +int v6d_get_property_as_time64_s(struct Property* property, int64_t *out) { + return htap_impl::get_property_as_time64_s(property, out); +} +int v6d_get_property_as_time64_ms(struct Property* property, int64_t *out) { + return htap_impl::get_property_as_time64_ms(property, out); +} +int v6d_get_property_as_time64_us(struct Property* property, int64_t *out) { + return htap_impl::get_property_as_time64_us(property, out); +} +int v6d_get_property_as_time64_ns(struct Property* property, int64_t *out) { + return htap_impl::get_property_as_time64_ns(property, out); +} +int v6d_get_property_as_timestamp_s(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len) { + return htap_impl::get_property_as_timestamp_s(property, out, out_timezone, out_timezone_len); +} +int v6d_get_property_as_timestamp_ms(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len) { + return htap_impl::get_property_as_timestamp_ms(property, out, out_timezone, out_timezone_len); +} +int v6d_get_property_as_timestamp_us(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len) { + return htap_impl::get_property_as_timestamp_us(property, out, out_timezone, out_timezone_len); +} +int v6d_get_property_as_timestamp_ns(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len) { + return htap_impl::get_property_as_timestamp_ns(property, out, out_timezone, out_timezone_len); +} void v6d_free_property(Property* property) {} diff --git a/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/global_store_ffi.h b/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/global_store_ffi.h index a9af4e275310..ac1fd52868e4 100644 --- a/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/global_store_ffi.h +++ b/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/global_store_ffi.h @@ -63,6 +63,20 @@ enum PropertyType { FLOAT_LIST = 12, DOUBLE_LIST = 13, STRING_LIST = 14, + DATE32 = 15, + DATE64 = 16, + TIME32_S = 17, + TIME32_MS = 18, + TIME32_US = 19, + TIME32_NS = 20, + TIME64_S = 21, + TIME64_MS = 22, + TIME64_US = 23, + TIME64_NS = 24, + TIMESTAMP_S = 25, + TIMESTAMP_MS = 26, + TIMESTAMP_US = 27, + TIMESTAMP_NS = 28, }; struct Property { @@ -240,6 +254,24 @@ int v6d_get_property_as_double_list(struct Property* property, const double** ou int* out_len); int v6d_get_property_as_string_list(struct Property* property, const char*** out, const int** out_len, int* out_num); +int v6d_get_property_as_date32(struct Property* property, int32_t *out); +int v6d_get_property_as_date64(struct Property* property, int64_t *out); +int v6d_get_property_as_time32_s(struct Property* property, int32_t *out); +int v6d_get_property_as_time32_ms(struct Property* property, int32_t *out); +int v6d_get_property_as_time32_us(struct Property* property, int32_t *out); +int v6d_get_property_as_time32_ns(struct Property* property, int32_t *out); +int v6d_get_property_as_time64_s(struct Property* property, int64_t *out); +int v6d_get_property_as_time64_ms(struct Property* property, int64_t *out); +int v6d_get_property_as_time64_us(struct Property* property, int64_t *out); +int v6d_get_property_as_time64_ns(struct Property* property, int64_t *out); +int v6d_get_property_as_timestamp_s(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len); +int v6d_get_property_as_timestamp_ms(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len); +int v6d_get_property_as_timestamp_us(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len); +int v6d_get_property_as_timestamp_ns(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len); // *out_num为string的个数 // (*out_len)[i]为第i个string的长度 diff --git a/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/htap_ds_impl.cc b/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/htap_ds_impl.cc index f9459f5dcd75..aedffff7bd56 100644 --- a/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/htap_ds_impl.cc +++ b/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/htap_ds_impl.cc @@ -271,44 +271,107 @@ static int get_property_from_table(arrow::Table* table, int64_t row_id, if (dt == arrow::boolean()) { p_out->type = BOOL; pp.bool_value = - std::dynamic_pointer_cast(array)->Value(row_id); + static_cast(array.get())->Value(row_id); } else if (dt == arrow::int8()) { p_out->type = CHAR; pp.char_value = - std::dynamic_pointer_cast(array)->Value(row_id); + static_cast(array.get())->Value(row_id); } else if (dt == arrow::int16()) { p_out->type = SHORT; pp.int16_value = - std::dynamic_pointer_cast(array)->Value(row_id); + static_cast(array.get())->Value(row_id); } else if (dt == arrow::int32()) { p_out->type = INT; pp.int_value = - std::dynamic_pointer_cast(array)->Value(row_id); + static_cast(array.get())->Value(row_id); } else if (dt == arrow::int64()) { p_out->type = LONG; pp.long_value = - std::dynamic_pointer_cast(array)->Value(row_id); + static_cast(array.get())->Value(row_id); } else if (dt == arrow::float32()) { p_out->type = FLOAT; pp.float_value = - std::dynamic_pointer_cast(array)->Value(row_id); + static_cast(array.get())->Value(row_id); } else if (dt == arrow::float64()) { p_out->type = DOUBLE; pp.double_value = - std::dynamic_pointer_cast(array)->Value(row_id); + static_cast(array.get())->Value(row_id); } else if (dt == arrow::utf8()) { p_out->type = STRING; auto view = - std::dynamic_pointer_cast(array)->GetView(row_id); + static_cast(array.get())->GetView(row_id); pp.long_value = view.length(); p_out->data = const_cast(static_cast(view.data())); } else if (dt == arrow::large_utf8()) { p_out->type = STRING; auto view = - std::dynamic_pointer_cast(array)->GetView( + static_cast(array.get())->GetView( row_id); pp.long_value = view.length(); p_out->data = const_cast(static_cast(view.data())); + } else if (dt == arrow::date32()) { + p_out->type = DATE32; + pp.int_value = + static_cast(array.get())->GetView(row_id); + } else if (dt == arrow::date64()) { + p_out->type = DATE64; + pp.long_value = + static_cast(array.get())->GetView(row_id); + } else if (dt->id() == arrow::Type::TIME32) { + auto time32_type = static_cast(dt.get()); + switch (time32_type->unit()) { + case arrow::TimeUnit::SECOND: + p_out->type = TIME32_S; + break; + case arrow::TimeUnit::MILLI: + p_out->type = TIME32_MS; + break; + case arrow::TimeUnit::MICRO: + p_out->type = TIME32_US; + break; + case arrow::TimeUnit::NANO: + p_out->type = TIME32_NS; + break; + } + pp.int_value = + static_cast(array.get())->GetView(row_id); + } else if (dt->id() == arrow::Type::TIME64) { + auto time64_type = static_cast(dt.get()); + switch (time64_type->unit()) { + case arrow::TimeUnit::SECOND: + p_out->type = TIME64_S; + break; + case arrow::TimeUnit::MILLI: + p_out->type = TIME64_MS; + break; + case arrow::TimeUnit::MICRO: + p_out->type = TIME64_US; + break; + case arrow::TimeUnit::NANO: + p_out->type = TIME64_NS; + break; + } + pp.long_value = + static_cast(array.get())->GetView(row_id); + } else if (dt->id() == arrow::Type::TIMESTAMP) { + auto timestamp_type = static_cast(dt.get()); + switch (timestamp_type->unit()) { + case arrow::TimeUnit::SECOND: + p_out->type = TIMESTAMP_S; + break; + case arrow::TimeUnit::MILLI: + p_out->type = TIMESTAMP_MS; + break; + case arrow::TimeUnit::MICRO: + p_out->type = TIMESTAMP_US; + break; + case arrow::TimeUnit::NANO: + p_out->type = TIMESTAMP_NS; + break; + } + pp.long_value = + static_cast(array.get())->GetView(row_id); + // TODO: the timezone is not supported yet, and ignored during returning. } else { LOG(ERROR) << "invalid dt is = " << dt->ToString(); return -1; @@ -1322,6 +1385,154 @@ int get_property_as_string_list(Property* property, const char*** out, return -1; // FIXME } +int get_property_as_date32(struct Property* property, int32_t *out) { + if (property->type != DATE32) { + return -1; + } + PodProperties pp; + pp.long_value = property->len; + *out = pp.int_value; + return 0; +} + +int get_property_as_date64(struct Property* property, int64_t *out) { + if (property->type != DATE64) { + return -1; + } + PodProperties pp; + pp.long_value = property->len; + *out = pp.long_value; + return 0; +} + +int get_property_as_time32_s(struct Property* property, int32_t *out) { + if (property->type != TIME32_S) { + return -1; + } + PodProperties pp; + pp.long_value = property->len; + *out = pp.int_value; + return 0; +} + +int get_property_as_time32_ms(struct Property* property, int32_t *out) { + if (property->type != TIME32_MS) { + return -1; + } + PodProperties pp; + pp.long_value = property->len; + *out = pp.int_value; + return 0; +} + +int get_property_as_time32_us(struct Property* property, int32_t *out) { + if (property->type != TIME32_US) { + return -1; + } + PodProperties pp; + pp.long_value = property->len; + *out = pp.int_value; + return 0; +} + +int get_property_as_time32_ns(struct Property* property, int32_t *out) { + if (property->type != TIME32_NS) { + return -1; + } + PodProperties pp; + pp.long_value = property->len; + *out = pp.int_value; + return 0; +} + +int get_property_as_time64_s(struct Property* property, int64_t *out) { + if (property->type != TIME64_S) { + return -1; + } + PodProperties pp; + pp.long_value = property->len; + *out = pp.long_value; + return 0; +} + +int get_property_as_time64_ms(struct Property* property, int64_t *out) { + if (property->type != TIME64_MS) { + return -1; + } + PodProperties pp; + pp.long_value = property->len; + *out = pp.long_value; + return 0; +} + +int get_property_as_time64_us(struct Property* property, int64_t *out) { + if (property->type != TIME64_US) { + return -1; + } + PodProperties pp; + pp.long_value = property->len; + *out = pp.long_value; + return 0; +} + +int get_property_as_time64_ns(struct Property* property, int64_t *out) { + if (property->type != TIME64_NS) { + return -1; + } + PodProperties pp; + pp.long_value = property->len; + *out = pp.long_value; + return 0; +} + +int get_property_as_timestamp_s(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len) { + if (property->type != TIMESTAMP_S) { + return -1; + } + PodProperties pp; + pp.long_value = property->len; + *out = pp.long_value; + // TODO: add timezone info to return value + return 0; +} + +int get_property_as_timestamp_ms(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len) { + if (property->type != TIMESTAMP_MS) { + return -1; + } + PodProperties pp; + pp.long_value = property->len; + *out = pp.long_value; + // TODO: add timezone info to return value + return 0; +} + +int get_property_as_timestamp_us(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len) { + if (property->type != TIMESTAMP_US) { + return -1; + } + PodProperties pp; + pp.long_value = property->len; + *out = pp.long_value; + // TODO: add timezone info to return value + return 0; +} + +int get_property_as_timestamp_ns(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len) { + if (property->type != TIMESTAMP_NS) { + return -1; + } + PodProperties pp; + pp.long_value = property->len; + *out = pp.long_value; + // TODO: add timezone info to return value + return 0; +} + void free_property(Property* property) {} } // namespace htap_impl diff --git a/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/htap_ds_impl.h b/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/htap_ds_impl.h index b6fbf27a8533..a516c3ab22e1 100644 --- a/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/htap_ds_impl.h +++ b/interactive_engine/executor/store/global_query/src/store_impl/v6d/native/htap_ds_impl.h @@ -252,6 +252,24 @@ int get_property_as_double_list(Property* property, const double** out, int* out_len); int get_property_as_string_list(Property* property, const char*** out, const int** out_len, int* out_num); +int get_property_as_date32(struct Property* property, int32_t *out); +int get_property_as_date64(struct Property* property, int64_t *out); +int get_property_as_time32_s(struct Property* property, int32_t *out); +int get_property_as_time32_ms(struct Property* property, int32_t *out); +int get_property_as_time32_us(struct Property* property, int32_t *out); +int get_property_as_time32_ns(struct Property* property, int32_t *out); +int get_property_as_time64_s(struct Property* property, int64_t *out); +int get_property_as_time64_ms(struct Property* property, int64_t *out); +int get_property_as_time64_us(struct Property* property, int64_t *out); +int get_property_as_time64_ns(struct Property* property, int64_t *out); +int get_property_as_timestamp_s(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len); +int get_property_as_timestamp_ms(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len); +int get_property_as_timestamp_us(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len); +int get_property_as_timestamp_ns(struct Property* property, int64_t *out, + const char **out_timezone, int *out_timezone_len); void free_property(Property* property); diff --git a/interactive_engine/executor/store/global_query/src/store_impl/v6d/read_ffi.rs b/interactive_engine/executor/store/global_query/src/store_impl/v6d/read_ffi.rs index 50d0ff42450e..c5ed611df9d2 100644 --- a/interactive_engine/executor/store/global_query/src/store_impl/v6d/read_ffi.rs +++ b/interactive_engine/executor/store/global_query/src/store_impl/v6d/read_ffi.rs @@ -1,6 +1,8 @@ use std::ffi::{CStr, CString}; use std::sync::Arc; +use chrono::{NaiveDate, NaiveDateTime, NaiveTime, Datelike, Timelike, Days}; + use crate::store_api::*; pub type GraphId = i64; type GetVertexIterator = *const ::libc::c_void; @@ -14,9 +16,7 @@ type InEdgeIterator = *const ::libc::c_void; type GetAllEdgesIterator = *const ::libc::c_void; // these are for path directly to GAIA -use dyn_type::object::Primitives; -use dyn_type::object::RawType; -use dyn_type::Object; +use dyn_type::object::{Object, Primitives, RawType, DateTimeFormats}; use ir_common::generated::common as common_pb; use ir_common::KeyId; @@ -66,6 +66,20 @@ pub enum PropertyType { FloatList = 12, DoubleList = 13, StringList = 14, + Date32 = 15, + Date64 = 16, + Time32S = 17, + Time32MS = 18, + Time32US = 19, + Time32NS = 20, + Time64S = 21, + Time64MS = 22, + Time64US = 23, + Time64NS = 24, + TimestampS = 25, + TimestampMS = 26, + TimestampUS = 27, + TimestampNS = 28, } #[repr(C)] @@ -174,6 +188,52 @@ extern "C" { property: *const NativeProperty, out: *mut *const *const u8, out_len: *mut *const i32, out_num: *mut i32, ) -> FFIState; + fn v6d_get_property_as_date32( + property: *const NativeProperty, out: *mut i32 + ) -> FFIState; + fn v6d_get_property_as_date64( + property: *const NativeProperty, out: *mut i64 + ) -> FFIState; + fn v6d_get_property_as_time32_s( + property: *const NativeProperty, out: *mut i32 + ) -> FFIState; + fn v6d_get_property_as_time32_ms( + property: *const NativeProperty, out: *mut i32 + ) -> FFIState; + fn v6d_get_property_as_time32_us( + property: *const NativeProperty, out: *mut i32 + ) -> FFIState; + fn v6d_get_property_as_time32_ns( + property: *const NativeProperty, out: *mut i32 + ) -> FFIState; + fn v6d_get_property_as_time64_s( + property: *const NativeProperty, out: *mut i64 + ) -> FFIState; + fn v6d_get_property_as_time64_ms( + property: *const NativeProperty, out: *mut i64 + ) -> FFIState; + fn v6d_get_property_as_time64_us( + property: *const NativeProperty, out: *mut i64 + ) -> FFIState; + fn v6d_get_property_as_time64_ns( + property: *const NativeProperty, out: *mut i64 + ) -> FFIState; + fn v6d_get_property_as_timestamp_s( + property: *const NativeProperty, out: *mut i64, + out_timezone: *mut *const u8, out_timezone_len: *mut i32 + ) -> FFIState; + fn v6d_get_property_as_timestamp_ms( + property: *const NativeProperty, out: *mut i64, + out_timezone: *mut *const u8, out_timezone_len: *mut i32 + ) -> FFIState; + fn v6d_get_property_as_timestamp_us( + property: *const NativeProperty, out: *mut i64, + out_timezone: *mut *const u8, out_timezone_len: *mut i32 + ) -> FFIState; + fn v6d_get_property_as_timestamp_ns( + property: *const NativeProperty, out: *mut i64, + out_timezone: *mut *const u8, out_timezone_len: *mut i32 + ) -> FFIState; fn v6d_free_property(p: *const NativeProperty); @@ -318,7 +378,116 @@ impl NativeProperty { return Some(Object::Blob(ret.into_boxed_slice())); } } - _ => (), + PropertyType::Date32 => { + let mut v: i32 = 0; + let res = unsafe { v6d_get_property_as_date32(property, &mut v as *mut i32) }; + if res == STATE_SUCCESS { + return NaiveDate::from_num_days_from_ce_opt(v).map(|v| Object::DateFormat(DateTimeFormats::Date(v))); + } + } + PropertyType::Date64 => { + let mut v: i64 = 0; + let res = unsafe { v6d_get_property_as_date64(property, &mut v as *mut i64) }; + if res == STATE_SUCCESS { + return NaiveDateTime::from_timestamp_millis(v).map(|v| Object::DateFormat(DateTimeFormats::DateTime(v))); + } + } + PropertyType::Time32S => { + let mut v: i32 = 0; + let res = unsafe { v6d_get_property_as_time32_s(property, &mut v as *mut i32) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt(v as u32, 0).map(|v| Object::DateFormat(DateTimeFormats::Time(v))); + } + } + PropertyType::Time32MS => { + let mut v: i32 = 0; + let res = unsafe { v6d_get_property_as_time32_ms(property, &mut v as *mut i32) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt((v / 1000) as u32, (v % 1000 * 1000000) as u32).map(|v| Object::DateFormat(DateTimeFormats::Time(v))); + } + } + PropertyType::Time32US => { + let mut v: i32 = 0; + let res = unsafe { v6d_get_property_as_time32_us(property, &mut v as *mut i32) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt((v / 1000000) as u32, (v % 1000000 * 1000) as u32).map(|v| Object::DateFormat(DateTimeFormats::Time(v))); + } + } + PropertyType::Time32NS => { + let mut v: i32 = 0; + let res = unsafe { v6d_get_property_as_time32_ns(property, &mut v as *mut i32) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt((v / 1000000000) as u32, (v % 1000000000) as u32).map(|v| Object::DateFormat(DateTimeFormats::Time(v))); + } + } + PropertyType::Time64S => { + let mut v: i64 = 0; + let res = unsafe { v6d_get_property_as_time64_s(property, &mut v as *mut i64) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt(v as u32, 0).map(|v| Object::DateFormat(DateTimeFormats::Time(v))); + } + } + PropertyType::Time64MS => { + let mut v: i64 = 0; + let res = unsafe { v6d_get_property_as_time64_ms(property, &mut v as *mut i64) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt((v / 1000) as u32, (v % 1000 * 1000000) as u32).map(|v| Object::DateFormat(DateTimeFormats::Time(v))); + } + } + PropertyType::Time64US => { + let mut v: i64 = 0; + let res = unsafe { v6d_get_property_as_time64_us(property, &mut v as *mut i64) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt((v / 1000000) as u32, (v % 1000000 * 1000) as u32).map(|v| Object::DateFormat(DateTimeFormats::Time(v))); + } + } + PropertyType::Time64NS => { + let mut v: i64 = 0; + let res = unsafe { v6d_get_property_as_time64_ns(property, &mut v as *mut i64) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt((v / 1000000000) as u32, (v % 1000000000) as u32).map(|v| Object::DateFormat(DateTimeFormats::Time(v))); + } + } + PropertyType::TimestampS => { + let mut v: i64 = 0; + let mut tz_v: *const u8 = std::ptr::null(); + let mut tz_len = 0; + let res = unsafe { v6d_get_property_as_timestamp_s(property, &mut v as *mut i64, &mut tz_v, &mut tz_len) }; + if res == STATE_SUCCESS { + return NaiveDateTime::from_timestamp_opt(v, 0).map(|v| Object::DateFormat(DateTimeFormats::DateTime(v))); + } + } + PropertyType::TimestampMS => { + let mut v: i64 = 0; + let mut tz_v: *const u8 = std::ptr::null(); + let mut tz_len = 0; + let res = unsafe { v6d_get_property_as_timestamp_ms(property, &mut v as *mut i64, &mut tz_v, &mut tz_len) }; + if res == STATE_SUCCESS { + return NaiveDateTime::from_timestamp_millis(v).map(|v| Object::DateFormat(DateTimeFormats::DateTime(v))); + } + } + PropertyType::TimestampUS => { + let mut v: i64 = 0; + let mut tz_v: *const u8 = std::ptr::null(); + let mut tz_len = 0; + let res = unsafe { v6d_get_property_as_timestamp_us(property, &mut v as *mut i64, &mut tz_v, &mut tz_len) }; + if res == STATE_SUCCESS { + return NaiveDateTime::from_timestamp_micros(v).map(|v| Object::DateFormat(DateTimeFormats::DateTime(v))); + } + } + PropertyType::TimestampNS => { + let mut v: i64 = 0; + let mut tz_v: *const u8 = std::ptr::null(); + let mut tz_len = 0; + let res = unsafe { v6d_get_property_as_timestamp_ns(property, &mut v as *mut i64, &mut tz_v, &mut tz_len) }; + if res == STATE_SUCCESS { + return NaiveDateTime::from_timestamp_opt(v / 1000000000, (v % 1000000000) as u32).map(|v| Object::DateFormat(DateTimeFormats::DateTime(v))); + } + } + _ => { + error!("NativeProperty::to_object: unsupported property type: {:?}", self.r#type); + return None; + } } None } @@ -445,6 +614,114 @@ impl NativeProperty { return ret.map(|x| Property::ListString(x)); } } + PropertyType::Date32 => { + let mut v: i32 = 0; + let res = unsafe { v6d_get_property_as_date32(property, &mut v as *mut i32) }; + if res == STATE_SUCCESS { + return NaiveDate::from_ymd_opt(1970, 1, 1) + .map_or(None, |d| d.checked_add_days(Days::new(v as u64))) + .map(|v| Property::Date(v.format("%Y-%m-%d").to_string())); + } + } + PropertyType::Date64 => { + let mut v: i64 = 0; + let res = unsafe { v6d_get_property_as_date64(property, &mut v as *mut i64) }; + if res == STATE_SUCCESS { + return NaiveDateTime::from_timestamp_millis(v).map(|v| Property::Date(v.format("%Y-%m-%d %H:%M:%S.%6f").to_string())); + } + } + PropertyType::Time32S => { + let mut v: i32 = 0; + let res = unsafe { v6d_get_property_as_time32_s(property, &mut v as *mut i32) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt(v as u32, 0).map(|v| Property::Date(v.format("%H:%M:%S.%6f").to_string())); + } + } + PropertyType::Time32MS => { + let mut v: i32 = 0; + let res = unsafe { v6d_get_property_as_time32_ms(property, &mut v as *mut i32) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt((v / 1000) as u32, (v % 1000 * 1000000) as u32).map(|v| Property::Date(v.format("%H:%M:%S.%6f").to_string())); + } + } + PropertyType::Time32US => { + let mut v: i32 = 0; + let res = unsafe { v6d_get_property_as_time32_us(property, &mut v as *mut i32) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt((v / 1000000) as u32, (v % 1000000 * 1000) as u32).map(|v| Property::Date(v.format("%H:%M:%S.%6f").to_string())); + } + } + PropertyType::Time32NS => { + let mut v: i32 = 0; + let res = unsafe { v6d_get_property_as_time32_ns(property, &mut v as *mut i32) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt((v / 1000000000) as u32, (v % 1000000000) as u32).map(|v| Property::Date(v.format("%H:%M:%S.%6f").to_string())); + } + } + PropertyType::Time64S => { + let mut v: i64 = 0; + let res = unsafe { v6d_get_property_as_time64_s(property, &mut v as *mut i64) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt(v as u32, 0).map(|v| Property::Date(v.format("%H:%M:%S.%6f").to_string())); + } + } + PropertyType::Time64MS => { + let mut v: i64 = 0; + let res = unsafe { v6d_get_property_as_time64_ms(property, &mut v as *mut i64) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt((v / 1000) as u32, (v % 1000 * 1000000) as u32).map(|v| Property::Date(v.format("%H:%M:%S.%6f").to_string())); + } + } + PropertyType::Time64US => { + let mut v: i64 = 0; + let res = unsafe { v6d_get_property_as_time64_us(property, &mut v as *mut i64) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt((v / 1000000) as u32, (v % 1000000 * 1000) as u32).map(|v| Property::Date(v.format("%H:%M:%S.%6f").to_string())); + } + } + PropertyType::Time64NS => { + let mut v: i64 = 0; + let res = unsafe { v6d_get_property_as_time64_ns(property, &mut v as *mut i64) }; + if res == STATE_SUCCESS { + return NaiveTime::from_num_seconds_from_midnight_opt((v / 1000000000) as u32, (v % 1000000000) as u32).map(|v| Property::Date(v.format("%H:%M:%S.%6f").to_string())); + } + } + PropertyType::TimestampS => { + let mut v: i64 = 0; + let mut tz_v: *const u8 = std::ptr::null(); + let mut tz_len = 0; + let res = unsafe { v6d_get_property_as_timestamp_s(property, &mut v as *mut i64, &mut tz_v, &mut tz_len) }; + if res == STATE_SUCCESS { + return NaiveDateTime::from_timestamp_opt(v, 0).map(|v| Property::Date(v.format("%Y-%m-%d %H:%M:%S.%6f").to_string())); + } + } + PropertyType::TimestampMS => { + let mut v: i64 = 0; + let mut tz_v: *const u8 = std::ptr::null(); + let mut tz_len = 0; + let res = unsafe { v6d_get_property_as_timestamp_ms(property, &mut v as *mut i64, &mut tz_v, &mut tz_len) }; + if res == STATE_SUCCESS { + return NaiveDateTime::from_timestamp_millis(v).map(|v| Property::Date(v.format("%Y-%m-%d %H:%M:%S.%6f").to_string())); + } + } + PropertyType::TimestampUS => { + let mut v: i64 = 0; + let mut tz_v: *const u8 = std::ptr::null(); + let mut tz_len = 0; + let res = unsafe { v6d_get_property_as_timestamp_us(property, &mut v as *mut i64, &mut tz_v, &mut tz_len) }; + if res == STATE_SUCCESS { + return NaiveDateTime::from_timestamp_micros(v).map(|v| Property::Date(v.format("%Y-%m-%d %H:%M:%S.%6f").to_string())); + } + } + PropertyType::TimestampNS => { + let mut v: i64 = 0; + let mut tz_v: *const u8 = std::ptr::null(); + let mut tz_len = 0; + let res = unsafe { v6d_get_property_as_timestamp_ns(property, &mut v as *mut i64, &mut tz_v, &mut tz_len) }; + if res == STATE_SUCCESS { + return NaiveDateTime::from_timestamp_opt(v / 1000000000, (v % 1000000000) as u32).map(|v| Property::Date(v.format("%Y-%m-%d %H:%M:%S.%6f").to_string())); + } + } } None } @@ -513,6 +790,22 @@ impl WriteNativeProperty { let len = vecdata.len() as i64; (PropertyType::Bytes, vecdata, len) } + Object::DateFormat(DateTimeFormats::Date(v)) => { + let u = PropertyUnion { i: v.num_days_from_ce() as i32 }; + (PropertyType::Date32, vec![], unsafe { u.l }) + } + Object::DateFormat(DateTimeFormats::Time(v)) => { + let u = PropertyUnion { i: (v.num_seconds_from_midnight() * 1000) as i32 + (v.nanosecond() / 1000000) as i32 }; + (PropertyType::Time32MS, vec![], unsafe { u.l }) + } + Object::DateFormat(DateTimeFormats::DateTime(v)) => { + let u = PropertyUnion { l: v.timestamp_millis() }; + (PropertyType::TimestampMS, vec![], unsafe { u.l }) + } + Object::DateFormat(DateTimeFormats::DateTimeWithTz(v)) => { + let u = PropertyUnion { l: v.timestamp_millis() }; + (PropertyType::TimestampMS, vec![], unsafe { u.l }) + } _ => { panic!("Unsupported object type: {:?}", property) } @@ -541,7 +834,21 @@ impl Drop for WriteNativeProperty { | PropertyType::Int | PropertyType::Long | PropertyType::Float - | PropertyType::Double => unsafe { + | PropertyType::Double + | PropertyType::Date32 + | PropertyType::Date64 + | PropertyType::Time32S + | PropertyType::Time32MS + | PropertyType::Time32US + | PropertyType::Time32NS + | PropertyType::Time64S + | PropertyType::Time64MS + | PropertyType::Time64US + | PropertyType::Time64NS + | PropertyType::TimestampS + | PropertyType::TimestampMS + | PropertyType::TimestampUS + | PropertyType::TimestampNS => unsafe { drop(Vec::from_raw_parts(self.data as *mut u8, 0, 0)); }, _ => unsafe { @@ -561,6 +868,10 @@ impl PropertyType { RawType::ULLong => PropertyType::Long, RawType::Float => PropertyType::Double, RawType::String => PropertyType::String, + RawType::Date => PropertyType::Date32, + RawType::Time => PropertyType::Time32MS, + RawType::DateTime => PropertyType::TimestampMS, + RawType::DateTimeWithTz => PropertyType::TimestampMS, RawType::Blob(_) => PropertyType::Bytes, _ => { unimplemented!("Unsupported data type {:?}", raw_type) @@ -577,6 +888,20 @@ impl PropertyType { PropertyType::Float => RawType::Float, PropertyType::Double => RawType::Float, PropertyType::String => RawType::String, + PropertyType::Date32 => RawType::Date, + PropertyType::Date64 => RawType::DateTime, + PropertyType::Time32S => RawType::Time, + PropertyType::Time32MS => RawType::Time, + PropertyType::Time32US => RawType::Time, + PropertyType::Time32NS => RawType::Time, + PropertyType::Time64S => RawType::Time, + PropertyType::Time64MS => RawType::Time, + PropertyType::Time64US => RawType::Time, + PropertyType::Time64NS => RawType::Time, + PropertyType::TimestampS => RawType::DateTime, + PropertyType::TimestampMS => RawType::DateTime, + PropertyType::TimestampUS => RawType::DateTime, + PropertyType::TimestampNS => RawType::DateTime, _ => { unimplemented!("Unsupported data type {:?}", *self) } @@ -595,6 +920,9 @@ impl PropertyType { common_pb::DataType::Int64Array => PropertyType::LongList, common_pb::DataType::DoubleArray => PropertyType::DoubleList, common_pb::DataType::StringArray => PropertyType::StringList, + common_pb::DataType::Date32 => PropertyType::Date32, + common_pb::DataType::Time32 => PropertyType::Time32MS, + common_pb::DataType::Timestamp => PropertyType::TimestampMS, _ => { unimplemented!("Unsupported data type {:?}", raw_type) } @@ -612,6 +940,20 @@ impl PropertyType { PropertyType::LongList => common_pb::DataType::Int64Array, PropertyType::DoubleList => common_pb::DataType::DoubleArray, PropertyType::StringList => common_pb::DataType::StringArray, + PropertyType::Date32 => common_pb::DataType::Date32, + PropertyType::Date64 => common_pb::DataType::Timestamp, + PropertyType::Time32S => common_pb::DataType::Time32, + PropertyType::Time32MS => common_pb::DataType::Time32, + PropertyType::Time32US => common_pb::DataType::Time32, + PropertyType::Time32NS => common_pb::DataType::Time32, + PropertyType::Time64S => common_pb::DataType::Time32, + PropertyType::Time64MS => common_pb::DataType::Time32, + PropertyType::Time64US => common_pb::DataType::Time32, + PropertyType::Time64NS => common_pb::DataType::Time32, + PropertyType::TimestampS => common_pb::DataType::Timestamp, + PropertyType::TimestampMS => common_pb::DataType::Timestamp, + PropertyType::TimestampUS => common_pb::DataType::Timestamp, + PropertyType::TimestampNS => common_pb::DataType::Timestamp, _ => { unimplemented!("Unsupported data type {:?}", *self) } @@ -634,6 +976,7 @@ impl PropertyType { DataType::ListFloat => PropertyType::FloatList, DataType::ListDouble => PropertyType::DoubleList, DataType::ListString => PropertyType::StringList, + DataType::Date => PropertyType::TimestampMS, _ => { unimplemented!("Unsupported data type {:?}", data_type) } @@ -656,6 +999,20 @@ impl PropertyType { PropertyType::FloatList => DataType::ListFloat, PropertyType::DoubleList => DataType::ListDouble, PropertyType::StringList => DataType::ListString, + PropertyType::Date32 => DataType::Date, + PropertyType::Date64 => DataType::Date, + PropertyType::Time32S => DataType::Date, + PropertyType::Time32MS => DataType::Date, + PropertyType::Time32US => DataType::Date, + PropertyType::Time32NS => DataType::Date, + PropertyType::Time64S => DataType::Date, + PropertyType::Time64MS => DataType::Date, + PropertyType::Time64US => DataType::Date, + PropertyType::Time64NS => DataType::Date, + PropertyType::TimestampS => DataType::Date, + PropertyType::TimestampMS => DataType::Date, + PropertyType::TimestampUS => DataType::Date, + PropertyType::TimestampNS => DataType::Date, } } } diff --git a/k8s/Makefile b/k8s/Makefile index 53d2c76dd2b8..5282f7a80ca9 100644 --- a/k8s/Makefile +++ b/k8s/Makefile @@ -10,7 +10,7 @@ endif ARCH := $(shell uname -m) VERSION ?= latest -VINEYARD_VERSION ?= v0.18.2 +VINEYARD_VERSION ?= v0.20.1 # This is the version of builder base image in most cases, except for graphscope-dev BUILDER_VERSION ?= $(VINEYARD_VERSION) # This is the version of runtime base image diff --git a/k8s/actions-runner-controller/manylinux/Makefile b/k8s/actions-runner-controller/manylinux/Makefile index a8820c74efe1..97a425ff721f 100644 --- a/k8s/actions-runner-controller/manylinux/Makefile +++ b/k8s/actions-runner-controller/manylinux/Makefile @@ -12,7 +12,7 @@ TARGETPLATFORM ?= $(shell arch) RUNNER_VERSION ?= 2.287.1 DOCKER_VERSION ?= 20.10.12 -VINEYARD_VERSION ?= v0.18.2 +VINEYARD_VERSION ?= v0.20.1 BUILDER_VERSION ?= $(VINEYARD_VERSION) # default list of platforms for which multiarch image is built diff --git a/k8s/internal/Makefile b/k8s/internal/Makefile index c80c70bbafaa..290e55a0fa82 100644 --- a/k8s/internal/Makefile +++ b/k8s/internal/Makefile @@ -42,7 +42,7 @@ GRAPHSCOPE_HOME ?= /usr/local INSTALL_PREFIX ?= /opt/graphscope VERSION ?= latest -VINEYARD_VERSION ?= v0.18.2 +VINEYARD_VERSION ?= v0.20.1 PROFILE ?= release CI ?= false diff --git a/proto/schema_common.proto b/proto/schema_common.proto index 27ac05643e50..0c20ea259b9d 100644 --- a/proto/schema_common.proto +++ b/proto/schema_common.proto @@ -33,6 +33,20 @@ enum DataTypePb { UINT = 16; ULONG = 17; DYNAMIC = 18; + DATE32 = 19; + DATE64 = 20; + TIME32_S = 21; + TIME32_MS = 22; + TIME32_US = 23; + TIME32_NS = 24; + TIME64_S = 25; + TIME64_MS = 26; + TIME64_US = 27; + TIME64_NS = 28; + TIMESTAMP_S = 29; + TIMESTAMP_MS = 30; + TIMESTAMP_US = 31; + TIMESTAMP_NS = 32; } message PropertyValuePb { diff --git a/python/graphscope/framework/utils.py b/python/graphscope/framework/utils.py index 94214241b22b..b66dd66faacf 100644 --- a/python/graphscope/framework/utils.py +++ b/python/graphscope/framework/utils.py @@ -502,6 +502,34 @@ def _unify_str_type(t): return graph_def_pb2.DataTypePb.STRING elif t == "bytes": return graph_def_pb2.DataTypePb.BYTES + elif t == "date32[day]": + return graph_def_pb2.DataTypePb.DATE32 + elif t == "date64[ms]": + return graph_def_pb2.DataTypePb.DATE64 + elif t == "time32[s]": + return graph_def_pb2.DataTypePb.TIME32_S + elif t == "time32[ms]": + return graph_def_pb2.DataTypePb.TIME32_MS + elif t == "time32[us]": + return graph_def_pb2.DataTypePb.TIME32_US + elif t == "time32[ns]": + return graph_def_pb2.DataTypePb.TIME32_NS + elif t == "time64[s]": + return graph_def_pb2.DataTypePb.TIME64_S + elif t == "time64[ms]": + return graph_def_pb2.DataTypePb.TIME64_MS + elif t == "time64[us]": + return graph_def_pb2.DataTypePb.TIME64_US + elif t == "time64[ns]": + return graph_def_pb2.DataTypePb.TIME64_NS + elif t.startswith("timestamp[s]"): + return graph_def_pb2.DataTypePb.TIMESTAMP_S + elif t.startswith("timestamp[ms]"): + return graph_def_pb2.DataTypePb.TIMESTAMP_MS + elif t.startswith("timestamp[us]"): + return graph_def_pb2.DataTypePb.TIMESTAMP_US + elif t.startswith("timestamp[ns]"): + return graph_def_pb2.DataTypePb.TIMESTAMP_NS elif t == "int_list" or t.startswith("fixedlistint"): return graph_def_pb2.DataTypePb.INT_LIST elif t == "long_list" or t.startswith("fixedlistlong"): diff --git a/python/graphscope/tests/minitest/test_min.py b/python/graphscope/tests/minitest/test_min.py index 82b4c0fd04a6..964e3e66d747 100644 --- a/python/graphscope/tests/minitest/test_min.py +++ b/python/graphscope/tests/minitest/test_min.py @@ -16,6 +16,7 @@ # limitations under the License. # +import datetime import logging import os import sys @@ -27,6 +28,8 @@ from graphscope.dataset import load_modern_graph from graphscope.dataset import load_ogbn_mag from graphscope.framework.app import AppAssets +from graphscope.framework.loader import Loader +from graphscope.tests.conftest import property_dir logger = logging.getLogger("graphscope") @@ -349,3 +352,99 @@ def subgraph_roundtrip_and_pk_scan(num_workers, threads_per_worker): } ): subgraph_roundtrip_and_pk_scan(num_workers, threads_per_worker) + + +def test_graph_with_datetime_property(): + def check_node_values(nodes): + values1 = set( + [ + datetime.datetime(2017, 10, 17, 0, 0), + datetime.datetime(2017, 10, 18, 0, 0), + datetime.datetime(2017, 10, 19, 0, 0), + datetime.datetime(2017, 10, 20, 0, 0), + ] + ) + values2 = set( + [ + "1991-06-22T04:00Z", + "1991-06-23T05:00Z", + "1991-06-24T06:00Z", + "1991-06-25T07:00Z", + ] + ) + node_values1, node_values2 = set(), set() + for item in nodes: + if "vval1" in item and "vval2" in item: + node_values1.add(item["vval1"][0]) + node_values2.add(item["vval2"][0]) + assert node_values1 == values1 + assert node_values2 == values2 + + def check_edge_values(edges): + values1 = set( + [ + datetime.datetime(2017, 10, 17, 0, 0), + datetime.datetime(2017, 10, 18, 0, 0), + datetime.datetime(2017, 10, 19, 0, 0), + datetime.datetime(2017, 10, 20, 0, 0), + ] + ) + values2 = set( + [ + "1991-06-22T04:00Z", + "1991-06-23T05:00Z", + "1991-06-24T06:00Z", + "1991-06-25T07:00Z", + ] + ) + edge_values1, edge_values2 = set(), set() + for item in nodes: + if "vval1" in item and "vval2" in item: + edge_values1.add(item["vval1"][0]) + edge_values2.add(item["vval2"][0]) + assert edge_values1 == values1 + assert edge_values2 == values2 + + session = graphscope.session(cluster_type="hosts") + g = session.load_from( + edges={ + "e0": [ + ( + Loader( + f"{property_dir}/e_with_date.csv", + header_row=True, + delimiter=",", + ), + ), + ], + }, + vertices={ + "v0": Loader( + f"{property_dir}/v_with_date.csv", + header_row=True, + delimiter=",", + ), + }, + generate_eid=True, + retain_oid=True, + directed=True, + compact_edges=False, + use_perfect_hash=False, + ) + + interactive = session.gremlin(g) + + # test subgraph + vquery = "g.V().valueMap()" + equery = "g.E().valueMap()" # introduce labels into the result + + nodes = interactive.execute(vquery).all().result() + edges = interactive.execute(equery).all().result() + + logger.info("nodes = %s", nodes) + logger.info("edges = %s", edges) + + check_node_values(nodes) + check_edge_values(edges) + + session.close() diff --git a/scripts/install_deps.sh b/scripts/install_deps.sh index d63f63761649..c780e0f3881e 100755 --- a/scripts/install_deps.sh +++ b/scripts/install_deps.sh @@ -14,8 +14,8 @@ readonly GREEN="\033[0;32m" readonly NC="\033[0m" # No Color readonly GRAPE_BRANCH="master" # libgrape-lite branch -readonly V6D_VERSION="0.16.4" # vineyard version -readonly V6D_BRANCH="v0.18.2" # vineyard branch +readonly V6D_VERSION="0.20.1" # vineyard version +readonly V6D_BRANCH="v0.20.1" # vineyard branch readonly OUTPUT_ENV_FILE="${HOME}/.graphscope_env" IS_IN_WSL=false && [[ ! -z "${IS_WSL}" || ! -z "${WSL_DISTRO_NAME}" ]] && IS_IN_WSL=true