[ ]:
import pandas as pd
import tempfile
import atexit
from pathlib import Path
import urgap
tmp_dir_obj = tempfile.TemporaryDirectory()
tmp_dir = Path(tmp_dir_obj.name)
atexit.register(tmp_dir_obj.cleanup)
print(f"Temp directory: {tmp_dir}")
[ ]:
notebook_dir = Path.cwd()
test_data_dir = notebook_dir.parent.parent / "tests" / "data"
[ ]:
ufiles = urgap.UFileList(
[
urgap.UFile(
uri=f"file://{test_data_dir}?uftype={urgap.uftypes.any.CSV}"
f"#unified_csvs/BSA1_xtandem_alanine_unified.csv",
),
],
)
print(ufiles)
[ ]:
urun_dict = urgap.URunDict(
{
"parameters": {
"FilterTabularToCSV:1.0.0": {
"-q": "500 < `exp_mz` < 1000",
},
"CompressToTar:1.0.0": {},
},
"unode_parameters": {
"storage_base_uri": f"file://{tmp_dir}",
},
},
)
print(urun_dict)
[ ]:
filter_node = urgap.init_unode("FilterTabularToCSV:1.0.0")
[ ]:
filter_results = filter_node.run(urun_dict=urun_dict, ufiles=ufiles)
print(filter_results)
[ ]:
df = pd.read_csv(filter_results[0].path)
print(df)
[ ]:
compress_node = urgap.init_unode("CompressToTar:1.0.0")
[ ]:
compress_results = compress_node.run(urun_dict=urun_dict, ufiles=filter_results)
print(compress_results)
[ ]: