|
16 | 16 |
|
17 | 17 | from prov.identifier import Identifier
|
18 | 18 | from prov.model import PROV, PROV_LABEL, PROV_TYPE, PROV_VALUE, ProvDocument, ProvEntity
|
19 |
| -from tools.load_ga_export import load_ga_history_export, GalaxyJob |
| 19 | +from tools.load_ga_export import load_ga_history_export, GalaxyJob, GalaxyDataset |
20 | 20 | from ast import literal_eval
|
21 | 21 | import os
|
22 | 22 |
|
@@ -109,14 +109,30 @@ def __init__(
|
109 | 109 | # move to separate function
|
110 | 110 | metadata_export = load_ga_history_export(ga_export)
|
111 | 111 | self.generate_prov_doc()
|
112 |
| - self.jobs = [] |
| 112 | + |
| 113 | + self.datasets = {} |
113 | 114 | # print(metadata_export["jobs_attrs"][0]["params"])
|
114 |
| - for job in metadata_export["jobs_attrs"]: |
| 115 | + for i,dataset in enumerate(metadata_export["datasets_attrs"]): |
| 116 | + datasets_attrs = GalaxyDataset() |
| 117 | + datasets_attrs.parse_ga_dataset_attrs(dataset) |
| 118 | + print(i) |
| 119 | + print(datasets_attrs.attributes['encoded_id']) |
| 120 | + self.datasets[datasets_attrs.attributes['encoded_id']] = datasets_attrs.attributes |
| 121 | + # self.declare_process(ds_attrs.attributes) |
| 122 | + |
| 123 | + self.jobs = {} |
| 124 | + for i,job in enumerate(metadata_export["jobs_attrs"]): |
115 | 125 | job_attrs = GalaxyJob()
|
116 | 126 | job_attrs.parse_ga_jobs_attrs(job)
|
117 |
| - self.jobs.append(job_attrs.attributes) |
| 127 | + print(i) |
| 128 | + print(job_attrs.attributes.keys()) |
| 129 | + # for k,v in job_attrs.attributes['parameters'].items(): |
| 130 | + # print(k, " : ",v) |
| 131 | + self.jobs[job_attrs.attributes['encoded_id']] = job_attrs.attributes |
118 | 132 | self.declare_process(job_attrs.attributes)
|
119 | 133 |
|
| 134 | + # print(self.jobs[0]['inputs']) |
| 135 | + |
120 | 136 | def __str__(self) -> str:
|
121 | 137 | """Represent this Provenance profile as a string."""
|
122 | 138 | return "ProvenanceProfile <{}>".format(
|
@@ -223,7 +239,8 @@ def declare_process(
|
223 | 239 | # cmd = ga_export_jobs_attrs["command_line"]
|
224 | 240 | process_name = ga_export_jobs_attrs["tool_id"]
|
225 | 241 | # tool_version = ga_export_jobs_attrs["tool_version"]
|
226 |
| - prov_label = "Run of ga_export/jobs_attrs.txt#" + process_name |
| 242 | + # TODO: insert workflow id |
| 243 | + prov_label = "Run of workflow_id_placeholder" + process_name |
227 | 244 | start_time = ga_export_jobs_attrs["create_time"]
|
228 | 245 | end_time = ga_export_jobs_attrs["update_time"]
|
229 | 246 |
|
|
0 commit comments