-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathimpl.py
More file actions
493 lines (416 loc) · 18.4 KB
/
impl.py
File metadata and controls
493 lines (416 loc) · 18.4 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
"""
DataSHIELD Interface implementation for Opal.
"""
from argparse import Namespace
from contextlib import suppress
from typing import Any

from obiba_opal.core import OpalClient, UriBuilder, OpalRequest, OpalResponse, HTTPError
from datashield.interface import DSLoginInfo, DSDriver, DSConnection, DSResult, DSError, RSession
class OpalDSError(DSError):
    """DataSHIELD error raised by the Opal implementation.

    Wraps the originating exception so that callers can tell errors reported
    over HTTP (``HTTPError``) apart from errors detected locally.
    """

    def __init__(self, exception: Exception = None):
        """Wrap ``exception``, using its first argument as the error message.

        Args:
            exception: The originating exception. It may be ``None`` or carry
                no arguments; a fallback message is then used so that building
                the error never fails by itself.
        """
        if exception is None:
            message = "Unknown error"
        elif exception.args:
            message = exception.args[0]
        else:
            # No argument to pick a message from: use the string form, then the type name.
            message = str(exception) or type(exception).__name__
        super().__init__(message)
        self.exception = exception

    def get_error(self) -> dict:
        """Return the error details.

        Returns:
            The ``error`` attribute of the wrapped ``HTTPError``, otherwise a
            dictionary holding this error's arguments under ``"arguments"``.
        """
        if isinstance(self.exception, HTTPError):
            return self.exception.error
        return {"arguments": self.args}

    def is_client_error(self) -> bool:
        """Tell whether the error is a client one.

        Anything that is not an ``HTTPError`` counts as a client error, as
        does an ``HTTPError`` whose code is in the 400-499 range.
        """
        if not isinstance(self.exception, HTTPError):
            return True
        return 400 <= self.exception.code < 500

    def is_server_error(self) -> bool:
        """Tell whether the error is an ``HTTPError`` with a code of 500 or more."""
        return isinstance(self.exception, HTTPError) and self.exception.code >= 500
class OpalRSession(RSession):
    """DataSHIELD R session handled through the ``datashield/session`` web services."""

    def __init__(self, client: OpalClient, profile: str = None, restore: str = None, verbose: bool = False):
        """Prepare a session description; nothing is sent until ``start()`` is called.

        Args:
            client: Client used to issue the requests.
            profile: Optional value of the ``profile`` query parameter used at start.
            restore: Optional value of the ``restore`` query parameter used at start.
            verbose: Whether requests are switched to verbose mode.
        """
        self.client = client
        self.profile = profile
        self.restore = restore
        self.verbose = verbose
        self.id = None  # set by start(), cleared by close()

    def get_id(self) -> str:
        """Return the session id, starting the session synchronously when needed."""
        if self.id is None:
            self.start(False)
        return self.id

    def start(self, asynchronous: bool = True) -> None:
        """Request the creation of the R session and remember its id.

        Args:
            asynchronous: When false, the ``wait`` query parameter is set to true.

        Raises:
            OpalDSError: If the response code is not 201 or the response has no ``id``.
        """
        builder = UriBuilder(["datashield", "sessions"]).query("wait", not asynchronous)
        if self.profile is not None:
            builder.query("profile", self.profile)
        if self.restore is not None:
            builder.query("restore", self.restore)
        response = self._post(builder.build()).send()
        if response.code != 201:
            raise OpalDSError(ValueError(f"Failed to start R session: {response.code}"))
        session = response.from_json()
        if "id" not in session:
            raise OpalDSError(ValueError("Failed to start R session: no session id returned"))
        self.id = session["id"]

    def is_started(self) -> bool:
        """Tell whether a session id is known (no request is made)."""
        return self.id is not None

    def is_ready(self) -> bool:
        """Tell whether the session state is ``running``.

        Raises:
            OpalDSError: If the session is not started or its status cannot be retrieved.
        """
        return self._has_state("running")

    def is_pending(self) -> bool:
        """Tell whether the session state is ``pending``.

        Raises:
            OpalDSError: If the session is not started or its status cannot be retrieved.
        """
        return self._has_state("pending")

    def is_failed(self) -> bool:
        """Tell whether the session state is ``failed``.

        Raises:
            OpalDSError: If the session is not started or its status cannot be retrieved.
        """
        return self._has_state("failed")

    def is_terminated(self) -> bool:
        """Tell whether the session state is ``terminated``.

        Raises:
            OpalDSError: If the session is not started or its status cannot be retrieved.
        """
        return self._has_state("terminated")

    def get_events(self) -> list:
        """Return the session events, each one split on ``;`` into a list of fields.

        Raises:
            OpalDSError: If the session is not started or the events cannot be retrieved.
        """
        session = self._fetch_session("retrieve R session events")
        return [evt.split(";") for evt in session.get("events", [])]

    def get_last_message(self) -> str:
        """Return the third field of the most recent event.

        Returns:
            ``"No recent events"`` when there is no event and ``"No message"``
            when the last event has fewer than three fields.
        """
        events = self.get_events()
        if not events:
            return "No recent events"
        last_event = events[-1]
        return last_event[2] if len(last_event) > 2 else "No message"

    def close(self) -> None:
        """Delete the session when one was started, then forget its id."""
        if self.id is not None:
            builder = UriBuilder(["datashield", "session", self.id])
            self._delete(builder.build()).send()
            self.id = None

    def _fetch_session(self, action: str) -> dict:
        """Get the description of the started session.

        Args:
            action: What the caller is attempting; used in the error message.

        Raises:
            OpalDSError: If the session is not started or the response code is not 200.
        """
        if self.id is None:
            raise OpalDSError(ValueError("R session not started"))
        response = self._get(UriBuilder(["datashield", "session", self.id]).build()).send()
        if response.code != 200:
            raise OpalDSError(ValueError(f"Failed to {action}: {response.code}"))
        return response.from_json()

    def _has_state(self, state: str) -> bool:
        """Compare the lower-cased session state with ``state``."""
        session = self._fetch_session("check R session status")
        return session.get("state", "").lower() == state

    def _new_request(self) -> OpalRequest:
        """Create a request accepting JSON, verbose when this session is."""
        request = self.client.new_request()
        if self.verbose:
            request.verbose()
        return request.accept_json()

    def _post(self, ws: str) -> OpalRequest:
        """Build a POST request on the ``ws`` resource."""
        return self._new_request().post().resource(ws)

    def _get(self, ws: str) -> OpalRequest:
        """Build a GET request on the ``ws`` resource."""
        return self._new_request().get().resource(ws)

    def _delete(self, ws: str) -> OpalRequest:
        """Build a DELETE request on the ``ws`` resource."""
        return self._new_request().delete().resource(ws)
class OpalConnection(DSConnection):
    """DataSHIELD connection to an Opal server.

    Owns the client built from the login information and, lazily, the R
    session in which assign and aggregate operations are executed.
    """

    def __init__(self, name: str, loginInfo: OpalClient.LoginInfo, profile: str = "default", restore: str = None):
        """Build the client; no R session is started yet.

        Args:
            name: Name of the connection (reported in command failure messages).
            loginInfo: Login information the client is built from.
            profile: DataSHIELD profile name.
            restore: Optional ``restore`` value handed to the R session at start.
        """
        self.name = name
        self.client = OpalClient.build(loginInfo)
        self.subject = None  # cached by _get_subject()
        self.profile = profile
        self.restore = restore
        self.verbose = False
        self.rsession = None
        self.rsession_started = False

    def check_user(self) -> bool:
        """Check if the user can authenticate by trying to retrieve the current subject profile."""
        try:
            self._get("/system/subject-profile/_current").fail_on_error().send()
            return True
        except Exception:
            # Deliberately broad: any failure means the user could not be verified.
            return False

    #
    # Content listing
    #

    def list_tables(self) -> list:
        """List the tables as ``<datasource name>.<table name>`` strings."""
        response = self._get("/datasources").fail_on_error().send()
        names = []
        for ds in response.from_json():
            names.extend(ds["name"] + "." + table for table in ds.get("table", []))
        return names

    def has_table(self, name: str) -> bool:
        """Tell whether the table exists.

        Args:
            name: Table reference, as ``<datasource>.<table>``.

        Returns:
            True when the table request answers with code 200. A name without
            both parts cannot designate a table, so False is returned.
        """
        parts = self._split_name(name)
        if parts is None:
            return False
        response = self._get(UriBuilder(["datasource", parts[0], "table", parts[1]]).build()).send()
        return response.code == 200

    def list_resources(self) -> list:
        """List the resources of all projects as ``<project name>.<resource name>`` strings."""
        response = self._get("/projects").fail_on_error().send()
        names = []
        for project in response.from_json():
            uri = UriBuilder(["project", project["name"], "resources"]).build()
            resources = self._get(uri).fail_on_error().send().from_json()
            names.extend(project["name"] + "." + resource["name"] for resource in resources)
        return names

    def has_resource(self, name: str) -> bool:
        """Tell whether the resource exists.

        Args:
            name: Resource reference, as ``<project>.<resource>``.

        Returns:
            True when the resource request answers with code 200. A name
            without both parts cannot designate a resource, so False is returned.
        """
        parts = self._split_name(name)
        if parts is None:
            return False
        response = self._get(UriBuilder(["project", parts[0], "resource", parts[1]]).build()).send()
        return response.code == 200

    #
    # R Session (server side)
    #

    def has_session(self) -> bool:
        """Tell whether an R session object has been created for this connection."""
        return self.rsession is not None

    def start_session(self, asynchronous: bool = True) -> RSession:
        """Create and start the R session, or return the one already created.

        Args:
            asynchronous: Passed to the session start. When true, the pending
                state of the session is checked once to know if it is started.
        """
        if self.rsession is not None:
            return self.rsession
        self.rsession = OpalRSession(self.client, profile=self.profile, restore=self.restore, verbose=self.verbose)
        self.rsession.start(asynchronous=asynchronous)
        self.rsession_started = not asynchronous or not self.rsession.is_pending()
        return self.rsession

    def is_session_started(self) -> bool:
        """Tell whether the R session exists and is no longer pending.

        The positive answer is cached; the session state is only requested
        while the session has not been seen started.
        """
        if self.rsession is None:
            return False
        if self.rsession_started:
            return True
        self.rsession_started = not self.rsession.is_pending()
        return self.rsession_started

    def get_session(self) -> RSession:
        """Return the R session.

        Raises:
            OpalDSError: If no session was created.
        """
        if self.rsession is None:
            raise OpalDSError(ValueError("No R session established. Please start a session first."))
        return self.rsession

    #
    # Assign
    #

    def assign_table(
        self,
        symbol: str,
        table: str,
        variables: list = None,
        missings: bool = False,
        identifiers: str = None,
        id_name: str = None,
        asynchronous: bool = True,
    ) -> DSResult:
        """Assign a table to a symbol in the R session.

        Args:
            symbol: Name of the R symbol.
            table: Table reference.
            variables: Optional variable names, sent as a ``name.any(...)`` filter.
            missings: Value of the ``missings`` query parameter.
            identifiers: Optional value of the ``identifiers`` query parameter.
            id_name: Optional value of the ``id`` query parameter.
            asynchronous: Value of the ``async`` query parameter.

        Returns:
            A result identified by the response text when asynchronous,
            otherwise a result without value.

        Raises:
            OpalDSError: If the request fails with an ``HTTPError``.
        """
        builder = (
            UriBuilder(["datashield", "session", self._get_session_id(), "symbol", symbol, "table", table])
            .query("missings", missings)
            .query("async", asynchronous)
        )
        if variables is not None:
            quoted_names = ",".join([f'"{v}"' for v in variables])
            builder.query("variables", f"name.any({quoted_names})")
        if identifiers is not None:
            builder.query("identifiers", identifiers)
        if id_name is not None:
            builder.query("id", id_name)
        try:
            response = self._put(builder.build()).fail_on_error().send()
        except HTTPError as e:
            raise OpalDSError(e) from e
        return OpalResult(self, rid=str(response)) if asynchronous else OpalResult(self, result=None)

    def assign_resource(self, symbol: str, resource: str, asynchronous: bool = True) -> DSResult:
        """Assign a resource to a symbol in the R session.

        Returns:
            A result identified by the response text when asynchronous,
            otherwise a result without value.

        Raises:
            OpalDSError: If the request fails with an ``HTTPError``.
        """
        builder = UriBuilder([
            "datashield",
            "session",
            self._get_session_id(),
            "symbol",
            symbol,
            "resource",
            resource,
        ]).query("async", asynchronous)
        try:
            response = self._put(builder.build()).fail_on_error().send()
        except HTTPError as e:
            raise OpalDSError(e) from e
        return OpalResult(self, rid=str(response)) if asynchronous else OpalResult(self, result=None)

    def assign_expr(self, symbol: str, expr: str, asynchronous: bool = True) -> DSResult:
        """Assign the result of an R expression, sent as R script content, to a symbol.

        Returns:
            A result identified by the response text when asynchronous,
            otherwise a result without value.

        Raises:
            OpalDSError: If the request fails with an ``HTTPError``.
        """
        builder = UriBuilder(["datashield", "session", self._get_session_id(), "symbol", symbol]).query(
            "async", asynchronous
        )
        try:
            response = self._put(builder.build()).content_type_rscript().content(expr).fail_on_error().send()
        except HTTPError as e:
            raise OpalDSError(e) from e
        return OpalResult(self, rid=str(response)) if asynchronous else OpalResult(self, result=None)

    #
    # Aggregate
    #

    def aggregate(self, expr: str, asynchronous: bool = True) -> DSResult:
        """Evaluate an R expression, sent as R script content, in the R session.

        Returns:
            A result identified by the response text when asynchronous,
            otherwise a result wrapping the response itself.

        Raises:
            OpalDSError: If the request fails with an ``HTTPError``.
        """
        builder = UriBuilder(["datashield", "session", self._get_session_id(), "aggregate"]).query(
            "async", asynchronous
        )
        try:
            response = self._post(builder.build()).content_type_rscript().content(expr).fail_on_error().send()
        except HTTPError as e:
            raise OpalDSError(e) from e
        return OpalResult(self, rid=str(response)) if asynchronous else OpalResult(self, result=response)

    #
    # Symbols
    #

    def list_symbols(self) -> list:
        """List the symbols of the R session; a single string answer is wrapped in a list."""
        builder = UriBuilder(["datashield", "session", self._get_session_id(), "symbols"])
        response = self._get(builder.build()).fail_on_error().send()
        symbols = response.from_json()
        if isinstance(symbols, str):
            symbols = [symbols]
        return symbols

    def rm_symbol(self, name: str) -> None:
        """Remove a symbol from the R session."""
        builder = UriBuilder(["datashield", "session", self._get_session_id(), "symbol", name])
        self._delete(builder.build()).send()

    #
    # DataSHIELD config
    #

    def list_profiles(self) -> dict:
        """Describe the DataSHIELD profiles.

        Returns:
            A dictionary with the names of the enabled profiles under
            ``"available"`` and this connection's profile under ``"current"``.
        """
        builder = UriBuilder(["datashield", "profiles"])
        profiles = self._get(builder.build()).send().from_json()
        names = [x["name"] for x in profiles if x["enabled"]]
        return {"available": names, "current": self.profile}

    def list_methods(self, type: str = "aggregate") -> list:
        """List the DataSHIELD methods of the given type for the connection's profile.

        Args:
            type: Methods environment, ``"aggregate"`` by default (``"assign"``
                is the other value used in this class).

        Returns:
            One dictionary per method with its ``name`` and, when the method
            details are provided, ``class`` (``"func"`` or ``"script"``),
            ``value``, ``pkg`` and ``version`` (the last two may be None).
        """
        builder = UriBuilder(["datashield", "env", type, "methods"]).query("profile", self.profile)
        methods = self._get(builder.build()).send().from_json()

        def describe(dto):
            item = {"name": dto["name"]}
            if "DataShield.RFunctionDataShieldMethodDto.method" in dto:
                method = dto["DataShield.RFunctionDataShieldMethodDto.method"]
                item["class"] = "func" if "func" in method else "script"
                item["value"] = method["func"] if "func" in method else method["script"]
                item["pkg"] = method.get("rPackage", None)
                item["version"] = method.get("version", None)
            return item

        return [describe(x) for x in methods]

    def list_packages(self) -> list:
        """List the distinct packages that the aggregate and assign methods come from.

        Methods reported without a package or without a version are ignored:
        their ``pkg``/``version`` entries exist but hold None, which must not
        be turned into a package description.

        Returns:
            A list of ``{"pkg": ..., "version": ...}`` dictionaries, sorted.
        """
        methods = self.list_methods(type="aggregate") + self.list_methods(type="assign")
        packages = {
            (str(method["pkg"]), str(method["version"]))
            for method in methods
            if method.get("pkg") is not None and method.get("version") is not None
        }
        return [{"pkg": pkg, "version": version} for pkg, version in sorted(packages)]

    #
    # Workspaces
    #

    def list_workspaces(self) -> list:
        """List the DataSHIELD workspaces of the current user."""
        builder = (
            UriBuilder(["service", "r", "workspaces"])
            .query("context", "DataSHIELD")
            .query("user", self._get_subject()["principal"])
        )
        response = self._get(builder.build()).send()
        return response.from_json()

    def save_workspace(self, name: str) -> None:
        """Save the R session into a workspace with the given name."""
        builder = UriBuilder(["datashield", "session", self._get_session_id(), "workspaces"]).query("save", name)
        self._post(builder.build()).send()

    def restore_workspace(self, name: str) -> None:
        """Restore the named workspace into the R session."""
        builder = UriBuilder(["datashield", "session", self._get_session_id(), "workspace", name])
        self._put(builder.build()).send()

    def rm_workspace(self, name: str) -> None:
        """Remove the named DataSHIELD workspace of the current user."""
        builder = (
            UriBuilder(["service", "r", "workspaces"])
            .query("context", "DataSHIELD")
            .query("user", self._get_subject()["principal"])
            .query("name", name)
        )
        self._delete(builder.build()).send()

    #
    # Utils
    #

    def is_async(self) -> dict:
        """Tell, per operation, whether asynchronous execution is supported (all are)."""
        return {"aggregate": True, "assign_table": True, "assign_resource": True, "assign_expr": True}

    def keep_alive(self) -> None:
        """Issue a symbols listing request, ignoring any failure (best effort)."""
        with suppress(Exception):
            self.list_symbols()

    def disconnect(self) -> None:
        """
        Close DataSHIELD session, and then Opal session.
        """
        try:
            if self.rsession is not None:
                self.rsession.close()
        finally:
            # The client is closed even when closing the R session fails.
            self.client.close()

    #
    # Private methods
    #

    @staticmethod
    def _split_name(name: str):
        """Split ``<parent>.<child>`` on the first dot.

        Returns:
            The ``(parent, child)`` tuple, or None when either part is missing.
        """
        parent, _, child = name.partition(".")
        if not parent or not child:
            return None
        return parent, child

    def _get_subject(self):
        """Return the current subject profile, requested once and then cached."""
        if self.subject is None:
            builder = UriBuilder(["system", "subject-profile", "_current"])
            response = self._get(builder.build()).fail_on_error().send()
            self.subject = response.from_json()
        return self.subject

    def _get_session_id(self) -> str:
        """Return the R session id, starting the session synchronously when needed."""
        self.start_session(asynchronous=False)
        return self.rsession.get_id()

    def _new_request(self) -> OpalRequest:
        """Create a request accepting JSON, verbose when this connection is."""
        request = self.client.new_request()
        if self.verbose:
            request.verbose()
        return request.accept_json()

    def _get(self, ws) -> OpalRequest:
        """Build a GET request on the ``ws`` resource."""
        return self._new_request().get().resource(ws)

    def _post(self, ws) -> OpalRequest:
        """Build a POST request on the ``ws`` resource."""
        return self._new_request().post().resource(ws)

    def _put(self, ws) -> OpalRequest:
        """Build a PUT request on the ``ws`` resource."""
        return self._new_request().put().resource(ws)

    def _delete(self, ws) -> OpalRequest:
        """Build a DELETE request on the ``ws`` resource."""
        return self._new_request().delete().resource(ws)
class OpalDriver(DSDriver):
    """DataSHIELD driver creating connections to Opal."""

    @classmethod
    def new_connection(cls, args: DSLoginInfo, restore: str = None) -> DSConnection:
        """Create a connection and verify that the user can authenticate.

        Args:
            args: Login information: url, user and password or token, connection
                name and profile.
            restore: Optional ``restore`` value handed to the connection.

        Returns:
            The authenticated connection.

        Raises:
            OpalDSError: If the user could not be authenticated.
        """
        namedArgs = Namespace(opal=args.url, user=args.user, password=args.password, token=args.token)
        loginInfo = OpalClient.LoginInfo.parse(namedArgs)
        conn = OpalConnection(args.name, loginInfo, args.profile, restore)
        if conn.check_user():
            return conn
        # The connection is discarded: release its client before reporting the
        # failure, without letting a cleanup error hide the authentication one.
        with suppress(Exception):
            conn.disconnect()
        creds = f"user {args.user}" if args.user else "token"
        raise OpalDSError(ValueError(f"Failed to authenticate on {args.url} with {creds}"))
class OpalResult(DSResult):
    """Result of a DataSHIELD operation.

    Holds either the identifier of a command submitted asynchronously
    (``rid``) or the outcome of a synchronous call (``result``).
    """

    def __init__(self, conn: OpalConnection, rid: str = None, result: Any = None):
        """
        Args:
            conn: Connection the operation was submitted on.
            rid: Identifier of the R command, None for a synchronous operation.
            result: Outcome of a synchronous operation, if any.
        """
        self.conn = conn
        self.rid = rid
        self.result = result
        self.cmd = None  # final command state, once known

    def is_completed(self) -> bool:
        """Tell whether the operation is over.

        A synchronous result is always completed. Otherwise the command is
        requested without waiting, and is over when its status is
        ``COMPLETED`` or ``FAILED``; that final state is then stored.
        """
        if self.rid is None:
            return True
        # check if R command is completed
        builder = UriBuilder(["datashield", "session", self.conn._get_session_id(), "command", self.rid]).query(
            "wait", False
        )
        cmd = self.conn._get(builder.build()).send().from_json()
        completed = "status" in cmd and cmd["status"] in ("COMPLETED", "FAILED")
        if completed:
            # store final state
            self.cmd = cmd
        return completed

    def fetch(self) -> Any:
        """Return the value of the operation.

        Returns:
            For a synchronous result, the decoded response when one is held,
            else None. For a command, the decoded command result when the
            command is flagged ``withResult``, else None.

        Raises:
            OpalDSError: If the command status is ``FAILED``.
        """
        if self.rid is None:
            return self.result.from_json() if isinstance(self.result, OpalResponse) else None

        session_id = self.conn._get_session_id()
        if not self.cmd:
            # get the final state of the R command by its id, waiting for it
            builder = UriBuilder(["datashield", "session", session_id, "command", self.rid]).query("wait", True)
            self.cmd = self.conn._get(builder.build()).send().from_json()
        if self.cmd.get("status") == "FAILED":
            msg = self.cmd.get("error", "<no message>")
            raise OpalDSError(ValueError(f"Command {self.rid} failed on {self.conn.name}: {msg}"))
        # The result is requested whatever the command kind, as before; only
        # commands flagged with a result have their response decoded.
        builder = UriBuilder(["datashield", "session", session_id, "command", self.rid, "result"])
        response = self.conn._get(builder.build()).send()
        return response.from_json() if self.cmd.get("withResult", False) else None