Source code for pimlico.cli.browser.tool

# This file is part of Pimlico
# Copyright (C) 2020 Mark Granroth-Wilding
# Licensed under the GNU LGPL v3.0 - https://www.gnu.org/licenses/lgpl-3.0.en.html

"""
Tool for browsing datasets, reading from the data output by pipeline modules.
"""
from __future__ import print_function
import sys


def browse_cmd(pipeline, opts):
    """
    Command for main Pimlico CLI: browse the data output by a pipeline module.

    Looks up the reader setup for the requested output of the requested
    module, checks that the data is ready to be read, creates a reader and
    hands it to the datatype's own browser.

    :param pipeline: loaded pipeline; indexed by module name to get the
        module whose output is to be browsed
    :param opts: parsed command-line options. ``module_name`` and
        ``output_name`` are read here (``output_name`` may be ``None`` to
        select the default output); the whole object is also passed on to
        the datatype's ``run_browser()``
    :raises SystemExit: with exit status 1 if the data is not ready to be
        read, or if the datatype's ``run_browser()`` raises
        ``NotImplementedError``
    """
    module_name = opts.module_name
    output_name = opts.output_name

    if output_name is None:
        output_descr = "default output"
    else:
        output_descr = "output '%s'" % output_name
    print("Loading %s of module '%s'" % (output_descr, module_name))

    reader_setup = pipeline[module_name].get_output_reader_setup(output_name)
    datatype = reader_setup.datatype
    print("Datatype: %s" % datatype.datatype_name)

    if not reader_setup.ready_to_read():
        print("Data not ready: cannot browse it", file=sys.stderr)
        sys.exit(1)

    # Get a reader for the corpus
    reader = reader_setup(pipeline, module_name)

    try:
        datatype.run_browser(reader, opts)
    except NotImplementedError:
        # NotImplementedError from run_browser() is reported as the datatype
        # having no browser, as a clean CLI error rather than a traceback
        print("Datatype of this dataset ({}) does not provide a browser to view its data".format(
            datatype.datatype_name), file=sys.stderr)
        sys.exit(1)