forked from feast-dev/feast
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathfeature_set.py
More file actions
96 lines (75 loc) · 2.4 KB
/
Copy pathfeature_set.py
File metadata and controls
96 lines (75 loc) · 2.4 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
# Copyright 2018 The Feast Authors
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from feast.core.DatasetService_pb2 import FeatureSet as FeatureSet_pb
class FeatureSet:
    """
    A group of feature IDs that all share one entity.

    A feature ID is a dot-separated string whose first segment names the
    entity it belongs to; every ID handed to the constructor must carry the
    same entity prefix.
    """

    def __init__(self, entity, features):
        """
        Validate the feature IDs and build the backing protobuf message.

        Args:
            entity: entity name that every feature ID must start with
            features: list of dot-separated feature ID strings

        Raises:
            ValueError: if a feature ID is prefixed with another entity
        """
        # Validate first so no state is set on an inconsistent feature set.
        self._ensure_same_entity(entity, features)
        self._entity = entity
        self._features = features
        self._proto = FeatureSet_pb(entityName=entity, featureIds=features)

    @property
    def features(self):
        """
        Feature IDs held by this feature set.

        Returns: the list of feature ID given at construction
        """
        return self._features

    @property
    def entity(self):
        """
        Returns: entity name shared by all features of this feature set
        """
        return self._entity

    @property
    def proto(self):
        """
        Returns: protobuf message built from the entity and feature IDs
        """
        return self._proto

    def _ensure_same_entity(self, entity, features):
        """
        Check that each feature ID is prefixed with ``entity``.

        Args:
            entity: expected entity name
            features: feature ID strings to check

        Raises:
            ValueError: on the first feature ID whose leading segment
                (the text before the first ".") differs from ``entity``
        """
        for feature_id in features:
            # Only the segment before the first dot identifies the entity.
            prefix, _, _ = feature_id.partition(".")
            if prefix == entity:
                continue
            raise ValueError("feature set has different entity: " + prefix)
class FileType(object):
    """
    Names of the file formats in which a training dataset can be downloaded
    """

    CSV = "CSV"
    """Comma-separated values file"""

    JSON = "NEWLINE_DELIMITED_JSON"
    """JSON file with one record per line (newline delimited)"""

    AVRO = "AVRO"
    """Avro file"""
class DatasetInfo:
    """
    Read-only description of a dataset: its name and the fully qualified
    id of the table that stores it.
    """

    def __init__(self, name, full_table_id):
        """
        Create instance of DatasetInfo with a BigQuery table as its
        backing store.

        Args:
            name: (str) dataset name
            full_table_id: (str) fully qualified table id
        """
        self._name, self._full_table_id = name, full_table_id

    @property
    def name(self):
        """
        Name of the dataset

        Returns: dataset name given at construction
        """
        return self._name

    @property
    def full_table_id(self):
        """
        Fully qualified id of the backing table

        Returns: fully qualified table id given at construction
        """
        return self._full_table_id