77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
class RelationalDBArtifactStoreSession(ArtifactStoreSession):
    """A relational DB implementation of the MLTE artifact store session."""

    def __init__(self, storage: RDBStorage) -> None:
        self.storage = storage
        """A reference to underlying storage."""

    def close(self) -> None:
        """Close the session."""
        self.storage.close()

    # -------------------------------------------------------------------------
    # Structural Elements
    # -------------------------------------------------------------------------

    def create_model(self, model: Model) -> Model:
        """
        Create a new model entry with no versions.

        :param model: The model to create; only its identifier is stored.
        :return: A model carrying the same identifier and an empty version list.
        :raises errors.ErrorAlreadyExists: If a model with that identifier
            is already stored.
        """
        with Session(self.storage.engine) as session:
            try:
                DBReader.get_model(model.identifier, session)
            except errors.ErrorNotFound:
                # Not being found is the expected case: the identifier is free.
                pass
            else:
                raise errors.ErrorAlreadyExists(
                    f"Model with identifier {model.identifier} already exists."
                )

            session.add(DBModel(name=model.identifier, versions=[]))
            session.commit()
            return Model(identifier=model.identifier, versions=[])

    def read_model(self, model_id: str) -> Model:
        """
        Read a model by identifier.

        :param model_id: The identifier of the model.
        :return: The model as returned by ``DBReader.get_model``.
        """
        # NOTE: a missing model is reported by DBReader.get_model (other
        # methods in this class catch errors.ErrorNotFound from it).
        with Session(self.storage.engine) as session:
            model, _ = DBReader.get_model(model_id, session)
            return model

    def list_models(self) -> List[str]:
        """
        List the names of all stored models.

        :return: The ``name`` of every ``DBModel`` row.
        """
        with Session(self.storage.engine) as session:
            return [
                model_obj.name for model_obj in session.scalars(select(DBModel))
            ]

    def delete_model(self, model_id: str) -> Model:
        """
        Delete a model by identifier.

        :param model_id: The identifier of the model.
        :return: The model as it was read just before deletion.
        """
        with Session(self.storage.engine) as session:
            model, model_obj = DBReader.get_model(model_id, session)
            session.delete(model_obj)
            session.commit()
            return model

    def create_version(self, model_id: str, version: Version) -> Version:
        """
        Create a new version under an existing model.

        :param model_id: The identifier of the parent model.
        :param version: The version to create; only its identifier is stored.
        :return: A version carrying the same identifier.
        :raises errors.ErrorAlreadyExists: If the model already has a version
            with that identifier.
        """
        with Session(self.storage.engine) as session:
            try:
                DBReader.get_version(model_id, version.identifier, session)
            except errors.ErrorNotFound:
                # Not being found is the expected case: the identifier is free.
                pass
            else:
                raise errors.ErrorAlreadyExists(
                    f"Version with identifier {version.identifier} for model {model_id} already exists."
                )

            # Look the model up outside the handler above, so that a missing
            # model is reported on its own rather than chained onto the
            # version lookup failure.
            _, model_obj = DBReader.get_model(model_id, session)

            session.add(
                DBVersion(name=version.identifier, model_id=model_obj.id)
            )
            session.commit()
            return Version(identifier=version.identifier)

    def read_version(self, model_id: str, version_id: str) -> Version:
        """
        Read a version by model and version identifier.

        :param model_id: The identifier of the parent model.
        :param version_id: The identifier of the version.
        :return: The version as returned by ``DBReader.get_version``.
        """
        with Session(self.storage.engine) as session:
            version, _ = DBReader.get_version(model_id, version_id, session)
            return version

    def list_versions(self, model_id: str) -> List[str]:
        """
        List the names of all versions that belong to a model.

        :param model_id: The identifier of the parent model.
        :return: The ``name`` of every matching ``DBVersion`` row; empty when
            the query matches nothing.
        """
        # Versions are matched to their model by id, and the model by name.
        statement = (
            select(DBVersion)
            .where(DBVersion.model_id == DBModel.id)
            .where(DBModel.name == model_id)
        )
        with Session(self.storage.engine) as session:
            return [
                version_obj.name for version_obj in session.scalars(statement)
            ]

    def delete_version(self, model_id: str, version_id: str) -> Version:
        """
        Delete a version by model and version identifier.

        :param model_id: The identifier of the parent model.
        :param version_id: The identifier of the version.
        :return: The version as it was read just before deletion.
        """
        with Session(self.storage.engine) as session:
            version, version_obj = DBReader.get_version(
                model_id, version_id, session
            )
            session.delete(version_obj)
            session.commit()
            return version

    # -------------------------------------------------------------------------
    # Artifacts
    # -------------------------------------------------------------------------

    def write_artifact(
        self,
        model_id: str,
        version_id: str,
        artifact: ArtifactModel,
        *,
        force: bool = False,
        parents: bool = False,
    ) -> ArtifactModel:
        """
        Write an artifact under the given model and version.

        :param model_id: The identifier of the parent model.
        :param version_id: The identifier of the parent version.
        :param artifact: The artifact to store.
        :param force: If True, replace an existing artifact with the same
            identifier instead of failing.
        :param parents: If True, create the model and version via
            ``storeutil.create_parents`` before writing; otherwise they are
            looked up and must already exist.
        :return: The artifact that was passed in.
        :raises errors.ErrorAlreadyExists: If the artifact already exists and
            ``force`` is False.
        """
        with Session(self.storage.engine) as session:
            if parents:
                storeutil.create_parents(self, model_id, version_id)

            # A single lookup both verifies that the parents exist and yields
            # the version row the new artifact will be attached to.
            _, version_obj = DBReader.get_version(model_id, version_id, session)

            # Check if the artifact already exists.
            try:
                _, existing_obj = DBReader.get_artifact(
                    model_id,
                    version_id,
                    artifact.header.identifier,
                    session,
                )
            except errors.ErrorNotFound:
                # Not found is fine: forced or not, we will create it.
                existing_obj = None

            if existing_obj is not None:
                if not force:
                    raise errors.ErrorAlreadyExists(
                        f"Artifact '{artifact.header.identifier}' already exists."
                    )
                # We have no edit functionality, nor any versioning system,
                # so delete the previous version.
                # TODO: versioning? Keep previous versions?
                session.delete(existing_obj)

            artifact_type_obj = DBReader.get_artifact_type(
                artifact.header.type, session
            )

            # Create the actual DB object and persist it.
            new_artifact_obj = factory.create_db_artifact(
                artifact, artifact_type_obj, version_obj.id, session
            )
            session.add(new_artifact_obj)
            session.commit()
            return artifact

    def read_artifact(
        self,
        model_id: str,
        version_id: str,
        artifact_id: str,
    ) -> ArtifactModel:
        """
        Read a single artifact.

        :param model_id: The identifier of the parent model.
        :param version_id: The identifier of the parent version.
        :param artifact_id: The identifier of the artifact.
        :return: The artifact as returned by ``DBReader.get_artifact``.
        """
        with Session(self.storage.engine) as session:
            artifact, _ = DBReader.get_artifact(
                model_id, version_id, artifact_id, session
            )
            return artifact

    def _read_all_artifacts(
        self, model_id: str, version_id: str
    ) -> List[ArtifactModel]:
        """
        Load every artifact of every supported type for a model version.

        :param model_id: The identifier of the parent model.
        :param version_id: The identifier of the parent version.
        :return: All artifacts, grouped in the iteration order of
            ``DBReader.SUPPORTED_ARTIFACT_DB_CLASSES``.
        """
        with Session(self.storage.engine) as session:
            all_artifacts: List[ArtifactModel] = []
            for artifact_type in DBReader.SUPPORTED_ARTIFACT_DB_CLASSES:
                all_artifacts.extend(
                    DBReader.get_artifacts_for_type(
                        model_id, version_id, artifact_type, session
                    )
                )
            return all_artifacts

    def read_artifacts(
        self,
        model_id: str,
        version_id: str,
        limit: int = 100,
        offset: int = 0,
    ) -> List[ArtifactModel]:
        """
        Read a page of artifacts for a model version.

        :param model_id: The identifier of the parent model.
        :param version_id: The identifier of the parent version.
        :param limit: The maximum number of artifacts to return.
        :param offset: The number of artifacts to skip from the start.
        :return: The slice ``[offset : offset + limit]`` of all artifacts.
        """
        # TODO: not the best support of offset and limit, still loading everything from DB.
        all_artifacts = self._read_all_artifacts(model_id, version_id)
        return all_artifacts[offset : offset + limit]

    def search_artifacts(
        self,
        model_id: str,
        version_id: str,
        query: Query = Query(),
    ) -> List[ArtifactModel]:
        """
        Return the artifacts of a model version that match a query.

        :param model_id: The identifier of the parent model.
        :param version_id: The identifier of the parent version.
        :param query: The query whose ``filter`` selects artifacts. The
            default instance is created once at definition time and is only
            read here.
        :return: Every artifact for which ``query.filter.match`` is truthy.
        """
        # TODO: not the most efficient way, since it loads all artifacts first, before filtering.
        # Filter over the complete set: going through read_artifacts() would
        # apply its default page limit and silently drop matches beyond it.
        return [
            artifact
            for artifact in self._read_all_artifacts(model_id, version_id)
            if query.filter.match(artifact)
        ]

    def delete_artifact(
        self,
        model_id: str,
        version_id: str,
        artifact_id: str,
    ) -> ArtifactModel:
        """
        Delete a single artifact.

        :param model_id: The identifier of the parent model.
        :param version_id: The identifier of the parent version.
        :param artifact_id: The identifier of the artifact.
        :return: The artifact as it was read just before deletion.
        """
        with Session(self.storage.engine) as session:
            artifact, artifact_obj = DBReader.get_artifact(
                model_id, version_id, artifact_id, session
            )
            session.delete(artifact_obj)
            session.commit()
            return artifact
|