Async rust client for Apache Druid

Fully asynchronous, future-enabled Apache Druid client library for the Rust programming language.

The library provides a statically typed API for Native Queries.

Installation

The library is hosted on crates.io.

```toml
[dependencies]
druid-io = "*"
```

Supported Native Queries

Timeseries
TopN
GroupBy
Scan
Search
TimeBoundary
SegmentMetadata
DataSourceMetadata

Usage

Client

Connect to a Druid cluster through a statically provided list of brokers:

```rust
let druid_client = DruidClient::new(vec!["localhost:8082".to_string()]);
```

Connect to a Druid cluster through ZooKeeper (supports autodiscovery of new brokers and load balancing):

```rust
// TODO
```

Querying

Timeseries

See Timeseries query documentation

```rust
#[derive(Serialize, Deserialize, Debug)]
pub struct TimeAggr {
    count: usize,
    count_fraction: f32,
    user: String,
}

let timeseries = Timeseries {
    data_source: DataSource::table("wikipedia"),
    limit: Some(10),
    descending: false,
    granularity: Granularity::All,
    filter: Some(Filter::selector("user", "Taffe316")),
    aggregations: vec![
        Aggregation::count("count"),
        Aggregation::StringFirst {
            name: "user".into(),
            field_name: "user".into(),
            max_string_bytes: 1024,
        },
    ],
    post_aggregations: vec![PostAggregation::Arithmetic {
        name: "count_fraction".into(),
        function: "/".into(),
        fields: vec![
            PostAggregator::field_access("count_percent", "count"),
            PostAggregator::constant("hundred", 100.into()),
        ],
        ordering: None,
    }],
    intervals: vec!["-146136543-09-08T08:23:32.096Z/146140482-04-24T15:36:27.903Z".into()],
    context: context,
};
let result = tokio_test::block_on(druid_client.timeseries::<TimeAggr>(&timeseries));
```

TopN

See Apache Druid TopN query documentation

```rust
#[derive(Serialize, Deserialize, Debug)]
struct WikiPage {
    page: String,
    user: Option<String>,
    count: usize,
}

let top_n = TopN {
    data_source: DataSource::table("wikipedia"),
    dimension: Dimension::default("page"),
    threshold: 10,
    metric: "count".into(),
    aggregations: vec![
        Aggregation::count("count"),
        Aggregation::StringFirst {
            name: "user".into(),
            field_name: "user".into(),
            max_string_bytes: 1024,
        },
    ],
    intervals: vec!["-146136543-09-08T08:23:32.096Z/146140482-04-24T15:36:27.903Z".into()],
    granularity: Granularity::All,
    context: Default::default(),
};
let druid_client = DruidClient::new(vec!["localhost:8082".to_string()]);
let result = tokio_test::block_on(druid_client.top_n::<WikiPage>(&top_n));
```

GroupBy

See Apache Druid GroupBy query documentation

```rust
let group_by = GroupBy {
    data_source: DataSource::table("wikipedia"),
    dimensions: vec![Dimension::Default {
        dimension: "page".into(),
        output_name: "page".into(),
        output_type: OutputType::STRING,
    }],
    limit_spec: Some(LimitSpec {
        limit: 10,
        columns: vec![OrderByColumnSpec::new(
            "page",
            Ordering::Descending,
            SortingOrder::Alphanumeric,
        )],
    }),
    granularity: Granularity::All,
    filter: Some(Filter::selector("user", "Taffe316")),
    aggregations: vec![
        Aggregation::count("count"),
        Aggregation::StringFirst {
            name: "user".into(),
            field_name: "user".into(),
            max_string_bytes: 1024,
        },
    ],
    post_aggregations: vec![PostAggregation::Arithmetic {
        name: "count_fraction".into(),
        function: "/".into(),
        fields: vec![
            PostAggregator::field_access("count_percent", "count"),
            PostAggregator::constant("hundred", 100.into()),
        ],
        ordering: None,
    }],
    having: Some(HavingSpec::greater_than("count_fraction", 0.01.into())),
    intervals: vec!["-146136543-09-08T08:23:32.096Z/146140482-04-24T15:36:27.903Z".into()],
    subtotal_spec: Default::default(),
    context: Default::default(),
};
// `WikiPage` (defined in the TopN example) matches the `page`, `user` and `count` columns.
let result = tokio_test::block_on(druid_client.group_by::<WikiPage>(&group_by));
```

Scan (with inner join)

See Apache Druid Scan query documentation

Let's try something more complex: inner join

```rust
#[derive(Serialize, Deserialize, Debug)]
#[serde(rename_all = "camelCase")]
struct ScanEvent {
    #[serde(rename(deserialize = "__time"))]
    time: usize,
    city_name: Option<String>,
    comment: Option<String>,
    namespace: Option<String>,
    page: Option<String>,
    region_iso_code: Option<String>,
    user: String,
    #[serde(rename(deserialize = "c.languages"))]
    languages: Option<String>,
}

let scan = Scan {
    data_source: DataSource::join(JoinType::Inner)
        .left(DataSource::table("wikipedia"))
        .right(
            DataSource::query(
                Scan {
                    data_source: DataSource::table("countries"),
                    batch_size: 10,
                    intervals: vec![
                        "-146136543-09-08T08:23:32.096Z/146140482-04-24T15:36:27.903Z"
                            .into(),
                    ],
                    result_format: ResultFormat::List,
                    columns: vec!["Name".into(), "languages".into()],
                    limit: None,
                    filter: None,
                    ordering: Some(Ordering::None),
                    context: std::collections::HashMap::new(),
                }
                .into(),
            ),
            "c.",
        )
        .condition("countryName == \"c.Name\"")
        .build()
        .unwrap(),
    batch_size: 10,
    intervals: vec!["-146136543-09-08T08:23:32.096Z/146140482-04-24T15:36:27.903Z".into()],
    result_format: ResultFormat::List,
    columns: vec![],
    limit: Some(10),
    filter: None,
    ordering: Some(Ordering::None),
    context: Default::default(),
};

let result = tokio_test::block_on(druid_client.scan::<ScanEvent>(&scan));
```