-
Notifications
You must be signed in to change notification settings - Fork 108
Expand file tree
/
Copy pathtutorial6.rs
More file actions
101 lines (94 loc) · 2.85 KB
/
tutorial6.rs
File metadata and controls
101 lines (94 loc) · 2.85 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
use anyhow::Result;
use chrono::Datelike;
use csv::Reader;
use dbsp::typed_batch::IndexedZSetReader;
use dbsp::{
OrdIndexedZSet, OutputHandle, RootCircuit, ZSetHandle, ZWeight,
operator::time_series::{RelOffset, RelRange},
utils::{Tup2, Tup3},
};
use feldera_macros::IsNone;
use rkyv::{Archive, Serialize};
use size_of::SizeOf;
/// One row of the vaccination data set fed into the circuit.
///
/// `main` deserializes these from a CSV file via the `serde::Deserialize` derive; the
/// remaining derives are presumably what DBSP requires of values stored in a Z-set
/// (NOTE(review): confirm against the DBSP `DBData` requirements).
#[derive(
Clone,
Default,
Debug,
Eq,
PartialEq,
Ord,
PartialOrd,
Hash,
SizeOf,
Archive,
Serialize,
rkyv::Deserialize,
serde::Deserialize,
IsNone,
)]
#[archive_attr(derive(Ord, Eq, PartialEq, PartialOrd))]
struct Record {
/// Name of the place the row refers to; `build_circuit` keeps only rows for
/// "England", "Northern Ireland", "Scotland" and "Wales".
location: String,
/// Date as a day count; `build_circuit` converts it with
/// `chrono::NaiveDate::from_epoch_days`.
date: i32,
/// Vaccinations reported for that day; `build_circuit` treats `None` as 0.
daily_vaccinations: Option<u64>,
}
/// Builds the dataflow for this tutorial step and returns its input and output handles.
///
/// The circuit:
/// 1. keeps only records whose `location` is one of the four UK nations,
/// 2. totals `daily_vaccinations` per `(location, year, month)`,
/// 3. computes, per location, a rolling average of those monthly totals over the
///    relative range `RelOffset::Before(2)` to `RelOffset::Before(0)` of a running
///    month index (`year * 12 + month - 1`),
/// 4. joins every monthly total with the rolling average for the same key.
///
/// The output is indexed by `Tup3(location, year, month)` and carries
/// `Tup2(monthly_total, rolling_average)`.
///
/// # Panics
///
/// The closures installed here panic when the circuit is evaluated if a record's
/// `date` cannot be converted by `chrono::NaiveDate::from_epoch_days`, or if the
/// rolling average for a key is `None`.
// The return type spells out the complete handle types, which trips the lint.
#[allow(clippy::type_complexity)]
fn build_circuit(
    circuit: &mut RootCircuit,
) -> Result<(
    ZSetHandle<Record>,
    OutputHandle<OrdIndexedZSet<Tup3<String, i32, u8>, Tup2<i64, i64>>>,
)> {
    let (records, records_handle) = circuit.add_input_zset::<Record>();

    // Restrict the data set to the four UK nations.
    let uk_records = records.filter(|record| {
        matches!(
            record.location.as_str(),
            "England" | "Northern Ireland" | "Scotland" | "Wales"
        )
    });

    // Key every record by (location, year, month); a missing count contributes 0.
    let keyed_by_month = uk_records.map_index(|record| {
        let day = chrono::NaiveDate::from_epoch_days(record.date).unwrap();
        let key = Tup3(record.location.clone(), day.year(), day.month() as u8);
        let doses = record.daily_vaccinations.unwrap_or(0);
        (key, doses)
    });
    let monthly_totals = keyed_by_month.aggregate_linear(|doses| *doses as ZWeight);

    // Re-index by a single running month number so the rolling window can be
    // expressed as a relative range over that number.
    let by_month_index = monthly_totals.map_index(|(Tup3(location, year, month), total)| {
        let month_index = *year as u32 * 12 + (*month as u32 - 1);
        (month_index, Tup2(location.clone(), *total))
    });
    let window = RelRange::new(RelOffset::Before(2), RelOffset::Before(0));
    let moving_averages = by_month_index
        .partitioned_rolling_average(
            |Tup2(location, total)| (location.clone(), *total),
            window,
        )
        .map_index(|(location, Tup2(month_index, average))| {
            // Undo the running month number to recover (year, month).
            let year = (month_index / 12) as i32;
            let month = (month_index % 12 + 1) as u8;
            (Tup3(location.clone(), year, month), average.unwrap())
        });

    // Pair each monthly total with the moving average for the same key.
    let totals_with_average = monthly_totals.join_index(
        &moving_averages,
        |Tup3(location, year, month), total, average| {
            let key = Tup3(location.clone(), *year, *month);
            Some((key, Tup2(*total, *average)))
        },
    );

    Ok((records_handle, totals_with_average.output()))
}
/// Runs the circuit once over the bundled vaccination data and prints the result.
///
/// Reads `examples/tutorial/vaccinations.csv` below the crate's manifest directory,
/// feeds every row into the circuit with weight 1, executes a single transaction,
/// and prints one line per output entry: location, year-month, monthly total,
/// moving average and the signed weight.
///
/// # Errors
///
/// Propagates failures from building the circuit, from opening or deserializing
/// the CSV file, and from running the transaction.
fn main() -> Result<()> {
    let (circuit, (input_handle, output_handle)) = RootCircuit::build(build_circuit)?;

    let csv_path = format!(
        "{}/examples/tutorial/vaccinations.csv",
        env!("CARGO_MANIFEST_DIR")
    );
    let mut csv_reader = Reader::from_path(csv_path)?;
    // Every CSV row becomes one insertion (weight 1) into the input Z-set.
    let mut weighted_rows = csv_reader
        .deserialize()
        .map(|row| row.map(|record| Tup2(record, 1)))
        .collect::<Result<Vec<Tup2<Record, ZWeight>>, _>>()?;
    input_handle.append(&mut weighted_rows);
    circuit.transaction()?;

    let snapshot = output_handle.consolidate();
    for (Tup3(l, y, m), Tup2(cur, avg), w) in snapshot.iter() {
        println!("{l:16} {y}-{m:02} {cur:10} {avg:10}: {w:+}");
    }
    Ok(())
}