[ ]:
import pandas as pd
import tempfile
import atexit
from pathlib import Path

import urgap


tmp_dir_obj = tempfile.TemporaryDirectory()
tmp_dir = Path(tmp_dir_obj.name)

atexit.register(tmp_dir_obj.cleanup)

print(f"Temp directory: {tmp_dir}")
[ ]:
notebook_dir = Path.cwd()
test_data_dir = notebook_dir.parent.parent / "tests" / "data"
[ ]:
ufiles = urgap.UFileList(
    [
        urgap.UFile(
            uri=f"file://{test_data_dir}?uftype={urgap.uftypes.any.CSV}"
            f"#unified_csvs/BSA1_xtandem_alanine_unified.csv",
        ),
    ],
)
print(ufiles)
[ ]:
urun_dict = urgap.URunDict(
    {
        "parameters": {
            "FilterTabularToCSV:1.0.0": {
                "-q": "500 < `exp_mz` < 1000",
            },
            "CompressToTar:1.0.0": {},
        },
        "unode_parameters": {
            "storage_base_uri": f"file://{tmp_dir}",
        },
    },
)
print(urun_dict)
[ ]:
filter_node = urgap.init_unode("FilterTabularToCSV:1.0.0")
[ ]:
filter_results = filter_node.run(urun_dict=urun_dict, ufiles=ufiles)
print(filter_results)
[ ]:
df = pd.read_csv(filter_results[0].path)
print(df)
[ ]:
compress_node = urgap.init_unode("CompressToTar:1.0.0")
[ ]:
compress_results = compress_node.run(urun_dict=urun_dict, ufiles=filter_results)
print(compress_results)
[ ]: