Source code for ALLCools.plot.genome_track._pygenometrack

"""
Modified from pygenometracks
LICENSE: https://github.com/deeptools/pyGenomeTracks/blob/master/LICENSE
"""

import logging
import os
import pathlib
import time
import warnings
from collections import OrderedDict
from configparser import ConfigParser

import matplotlib
import matplotlib.cm
import matplotlib.colors
import matplotlib.gridspec
import matplotlib.pyplot as plt
import matplotlib.textpath
import mpl_toolkits.axisartist as axisartist
import numpy as np
from pygenometracks.tracks.GenomeTrack import GenomeTrack
from pygenometracks.utilities import InputError
from pygenometracks.utilities import file_to_intervaltree, change_chrom_names

matplotlib.use('Agg')

warnings.filterwarnings("ignore", message="numpy.dtype size changed")
warnings.filterwarnings("ignore", message="numpy.ndarray size changed")
warnings.simplefilter(action='ignore', category=FutureWarning)
warnings.simplefilter(action='ignore', category=DeprecationWarning)
warnings.simplefilter(action='ignore', category=ImportWarning)

# import warnings
# warnings.filterwarnings('error')

[docs]FORMAT = "[%(levelname)s:%(filename)s:%(lineno)s - %(funcName)20s()] %(message)s"
logging.basicConfig(format=FORMAT)
[docs]log = logging.getLogger(__name__)
# logging.basicConfig()
# log = logging.getLogger("tracksClass")
log.setLevel(logging.DEBUG)

[docs]DEFAULT_TRACK_HEIGHT = 0.5  # in centimeters
[docs]DEFAULT_FIGURE_WIDTH = 40  # in centimeters
# proportion of width dedicated to (figure, legends)
[docs]DEFAULT_WIDTH_RATIOS = (0.01, 0.90, 0.1)
[docs]DEFAULT_MARGINS = {'left': 0.04, 'right': 0.92, 'bottom': 0.03, 'top': 0.97}


[docs]class MultiDict(OrderedDict):
    """
    Class to allow identically named
    sections in configuration file
    by appending the section number
    for example:
    1. section name
    """
[docs]    _unique = 0

[docs]    def __setitem__(self, key, val):
        if isinstance(val, OrderedDict):
            self._unique += 1
            key = f"{str(self._unique)}. [{key}]"
        OrderedDict.__setitem__(self, key, val)


[docs]class PlotTracks(object):
    def __init__(self,
                 config,
                 fig_width=DEFAULT_FIGURE_WIDTH,
                 fig_height=None,
                 fontsize=None,
                 dpi=None,
                 track_label_width=None,
                 plot_regions=None,
                 plot_width=None):
        self.fig_width = fig_width
        self.fig_height = fig_height
        self.dpi = dpi
        self.vlines_intval_tree = None
        self.vlines_properties = None
        self.track_list = []
        start = self.print_elapsed(None)
        self.available_tracks = self.get_available_tracks()
        self.parse_tracks(config, plot_regions=plot_regions)
        if fontsize:
            fontsize = fontsize
        else:
            fontsize = float(fig_width) * 0.3
        # the track label width is the fraction of
        # the figure width that is used
        # for the track 'title' or label.
        if track_label_width is None:
            self.width_ratios = DEFAULT_WIDTH_RATIOS
        else:
            self.width_ratios = (0.01,
                                 1 - track_label_width,
                                 track_label_width)

        # Process the width:
        if plot_width is not None:
            self.fig_width = plot_width / (
                    DEFAULT_MARGINS['right'] - DEFAULT_MARGINS['left']) * (
                                     1 + 2 / 3 * 0.01) / (
                                     self.width_ratios[1] / sum(self.width_ratios))

        font = {'size': fontsize}
        matplotlib.rc('font', **font)
        # initialize each track
        self.track_obj_list = []
        for idx, properties in enumerate(self.track_list):
            log.info(f"initialize {properties['section_name']}")
            # the track_class is obtained from the available tracks
            track_class = self.available_tracks[properties['file_type']]
            properties['region'] = plot_regions
            self.track_obj_list.append(track_class(properties))

        log.info("time initializing track(s):")
        self.print_elapsed(start)

    @staticmethod
[docs]    def get_available_tracks():
        avail_tracks = {}
        work = [GenomeTrack]
        while work:
            parent = work.pop()
            for child in parent.__subclasses__():
                if child not in avail_tracks:
                    track_type = child.TRACK_TYPE
                    avail_tracks[track_type] = child
                    work.append(child)

        # plus tracks defined in ALLCools
        from .HiCMatrixCoolTrack import HiCMatrixCoolTrack
        avail_tracks['cooler'] = HiCMatrixCoolTrack

        # swap the GtfTrack in pygenometracks with this class in ALLCools
        from .GtfTrack import GtfTrack
        avail_tracks['gtf'] = GtfTrack
        return avail_tracks

[docs]    def get_tracks_height(self, start_region=None, end_region=None):
        """
        The main purpose of the following loop is
        to get the height of each of the tracks
        because for the Hi-C the height is variable with respect
        to the range being plotted, the function is called
        when each plot is going to be printed.

        Args:
            start_region: start of the region to plot.
                          Only used in case the plot is a Hi-C matrix
            end_region: end of the region to plot.
                        Only used in case the plot is a Hi-C matrix

        Returns:

        """
        track_height = []
        for i, track_dict in enumerate(self.track_list):
            if i == 0 and track_dict['overlay_previous'] != 'no':
                log.warning("First track can not have the `overlay_previous` option.\n")
                self.track_list[i]['overlay_previous'] = 'no'
            # if overlay_previous is set to a value other than no
            # then, skip this track height
            if track_dict['overlay_previous'] != 'no':
                continue
            elif 'height' in track_dict:
                height = track_dict['height']
            elif track_dict['file_type'] == 'x_axis':
                height = track_dict['fontsize'] / 8
            elif 'depth' in track_dict and \
                    track_dict['file_type'] in ('hic_matrix', 'cooler'):
                # compute the height of a Hi-C track
                # based on the depth such that the
                # resulting plot appears proportional
                #
                #      /|\
                #     / | \
                #    /  |d \   d is the depth that we want to be proportional
                #   /   |   \  when plotted in the figure
                # ------------------
                #   region len
                #
                # d (in cm) =  depth (in bp) * 0.5 *
                #              width (in cm) / region len (in bp)

                # to compute the actual width of the figure the margins
                # and the region
                # set for the legends have to be considered
                # DEFAULT_MARGINS['right'] - DEFAULT_MARGINS['left']
                # is the proportion of plotting area
                # This plotting area is divided in three part as specified in
                # self.width_ratios (normalized to 1)
                # And as wspace is specified 0.01,
                # 0.01 of the mean of the 3 regions is not occupied.
                # 1 / (1 + 2 / 3 * 0.01) is used to plot.

                hic_width = \
                    self.fig_width * \
                    (DEFAULT_MARGINS['right'] - DEFAULT_MARGINS['left']) / \
                    (1 + 2 / 3 * 0.01) * \
                    self.width_ratios[1] / sum(self.width_ratios)
                # the scale factor is to obtain each bin as a square
                # (a 45 degree rotated matrix)
                scale_factor = 0.5
                depth = min(track_dict['depth'],
                            int((end_region - start_region) * 1.25))

                height = scale_factor * depth * hic_width / (end_region - start_region)
            else:
                height = DEFAULT_TRACK_HEIGHT
                self.track_list[i]['height'] = height

            track_height.append(height)
        return track_height

[docs]    def plot(self, chrom, start, end, file_name=None, title=None,
             h_align_titles='left', decreasing_x_axis=False):
        track_height = self.get_tracks_height(start_region=start,
                                              end_region=end)

        if self.fig_height:
            fig_height = self.fig_height
        else:
            fig_height = sum(track_height) / \
                         (DEFAULT_MARGINS['top'] - DEFAULT_MARGINS['bottom'])

        log.debug(f"Figure size in cm is {self.fig_width} x {fig_height}."
                  f" Dpi is set to {self.dpi}\n")
        fig = plt.figure(figsize=self.cm2inch(self.fig_width, fig_height))

        fig.subplots_adjust(wspace=0, hspace=0.0,
                            left=DEFAULT_MARGINS['left'],
                            right=DEFAULT_MARGINS['right'],
                            bottom=DEFAULT_MARGINS['bottom'],
                            top=DEFAULT_MARGINS['top'])

        if title:
            fig.suptitle(title)

        grids = matplotlib.gridspec.GridSpec(len(track_height), 3,
                                             height_ratios=track_height,
                                             width_ratios=self.width_ratios,
                                             wspace=0.01)
        axis_list = []
        # skipped_tracks is the count of tracks that have the
        # 'overlay_previous' parameter and should be skipped
        skipped_tracks = 0
        plot_axis = None
        y_axis = None
        label_axis = None
        width_dpi = None
        ylim = None
        for idx, track in enumerate(self.track_obj_list):
            log.info(f"plotting {track.properties['section_name']}")

            if track.properties['overlay_previous'] in ['yes', 'share-y']:
                overlay = True
                skipped_tracks += 1
            else:
                overlay = False

            if track.properties['overlay_previous'] == 'share-y':
                ylim = plot_axis.get_ylim()
            else:
                idx -= skipped_tracks
                plot_axis = axisartist.Subplot(fig, grids[idx, 1])
                fig.add_subplot(plot_axis)
                # turns off the lines around the tracks
                plot_axis.axis[:].set_visible(False)
                # to make the background transparent
                plot_axis.patch.set_visible(False)
                if not overlay:
                    y_axis = plt.subplot(grids[idx, 0])
                    y_axis.set_axis_off()

                    label_axis = plt.subplot(grids[idx, 2])
                    label_axis.set_axis_off()
                    # I get the width of the label_axis to be able to wrap the
                    # labels when right or center aligned.
                    width_inch = label_axis.get_window_extent().width
                    width_dpi = width_inch * self.dpi / fig.dpi

            if decreasing_x_axis:
                plot_axis.set_xlim(end, start)
            else:
                plot_axis.set_xlim(start, end)
            track.plot(plot_axis, chrom, start, end)
            track.plot_y_axis(y_axis, plot_axis)
            track.plot_label(label_axis, width_dpi=width_dpi,
                             h_align=h_align_titles)

            if track.properties['overlay_previous'] == 'share-y':
                plot_axis.set_ylim(ylim)

            if not overlay:
                axis_list.append(plot_axis)

        if self.vlines_intval_tree:
            self.plot_vlines(axis_list, chrom, start, end)

        if file_name is not None:
            fig.savefig(file_name, dpi=self.dpi, transparent=False)
        return fig

[docs]    def plot_vlines(self, axis_list, chrom_region, start_region, end_region):
        """
        Plots dotted lines from the top of the first plot to the bottom
        of the last plot at the specified positions.

        :param axis_list: list of plotted axis
        :param chrom_region chromosome name
        :param start_region start position
        :param end_region end position

        :return: None
        """
        vlines_list = []
        if 'line_width' in self.vlines_properties:
            line_width = self.vlines_properties['line_width']
        else:
            line_width = 0.5

        if chrom_region not in list(self.vlines_intval_tree):
            chrom_region_before = chrom_region
            chrom_region = change_chrom_names(chrom_region)
            if chrom_region not in list(self.vlines_intval_tree):
                log.warning("*Warning*\nNo interval was found when "
                            f"overlapping with both {chrom_region_before}:{start_region}-{end_region}"
                            f" and {chrom_region}:{start_region}-{end_region} inside the "
                            "file with vertical lines. "
                            "No vertical lines will be "
                            "plotted!!\n")
                return
        chrom_region = GenomeTrack.check_chrom_str_bytes(self.vlines_intval_tree, chrom_region)

        for region in sorted(self.vlines_intval_tree[chrom_region][start_region - 10000:end_region + 10000]):
            vlines_list.append(region.begin)

        for ax in axis_list:
            ymin, ymax = ax.get_ylim()

            ax.vlines(vlines_list, ymin, ymax, linestyle='dashed', zorder=10,
                      linewidth=line_width,
                      color=(0, 0, 0, 0.7), alpha=0.5)

        return

[docs]    def parse_tracks(self, tracks_file, plot_regions=None):
        """
        Parses a configuration file

        :param tracks_file: file path containing the track configuration
        :param plot_regions: a list of tuple [(chrom1, start1, end1), (chrom2, start2, end2)]
                             on which the data should be loaded
                             here the vlines
        :return: array of dictionaries and vlines_file.
                 One dictionary per track
        """
        try:
            if isinstance(tracks_file, str) and not pathlib.Path(tracks_file).exists():
                # assume the tracks_file are the config string
                import io
                handle = io.StringIO(tracks_file)
            else:
                handle = open(tracks_file, 'r')
        except OSError:
            # if the config string too long, path exists raise error.
            import io
            handle = io.StringIO(tracks_file)

        parser = ConfigParser(dict_type=MultiDict, strict=False)
        parser.read_file(handle)
        handle.close()

        tracks_file_path = os.path.dirname(tracks_file)

        track_list = []
        for section_name in parser.sections():
            # track_options is what will become the self.properties
            track_options = dict({"section_name": section_name})
            all_keywords = [i[0] for i in parser.items(section_name)]
            # First we check if there is a skip set to true:
            if 'skip' in all_keywords and \
                    parser.getboolean(section_name, 'skip'):
                # In this case we just do not explore the section
                continue
            # Then the vlines are treated differently:
            if ('type', 'vlines') in parser.items(section_name):
                # The only thing to check is the file
                # There is no other parameters to use.
                if 'file' not in all_keywords:
                    raise InputError(f"The section {section_name} is supposed to be a vline"
                                     " but there is no file.")
                track_options['file'] = parser.get(section_name, 'file')
                if 'line_width' in all_keywords:
                    try:
                        track_options['line_width'] = float(parser.get(section_name, 'line_width'))
                    except ValueError:
                        raise InputError(f"In section {section_name}, line_width "
                                         f"was set to {parser.get(section_name, 'line_width')}"
                                         " whereas we should have a float "
                                         "value.")
                extra_keywords = [k for k in all_keywords
                                  if k not in ['file', 'type', 'line_width']]
                if len(extra_keywords) > 0:
                    log.warning("These parameters were specified but will not"
                                f" be used {' '.join(extra_keywords)}.\n")
                self.vlines_properties = \
                    self.check_file_exists(track_options, tracks_file_path)
                continue
            # For the other cases, we will append properties dictionnaries
            # to the track_list
            # If the sections are spacer or x-axis we fill the file_type:
            # (They are special sections where the title defines the track type)
            if section_name.endswith('[spacer]'):
                track_options['file_type'] = 'spacer'
                track_options['track_class'] = SpacerTrack
            elif section_name.endswith('[x-axis]'):
                track_options['file_type'] = 'x_axis'
                track_options['track_class'] = XAxisTrack
            # For the others we need to have a 'file_type'
            # Either the file_type is part of the keywords
            elif 'file_type' in all_keywords:
                track_options['file_type'] = parser.get(section_name,
                                                        'file_type')
                if track_options['file_type'] not in self.available_tracks:
                    raise InputError(f"Section {section_name}: the file_type "
                                     f"{track_options['file_type']} does not"
                                     " exists.\npossible file_type are:"
                                     f"{self.available_tracks.keys()}.")
                track_options['track_class'] = \
                    self.available_tracks[track_options['file_type']]
            # Or we guess it from the file:
            elif 'file' in all_keywords:
                track_options['file'] = parser.get(section_name,
                                                   'file')
                track_options['file_type'] = \
                    self.guess_filetype(track_options,
                                        self.available_tracks)
                track_options['track_class'] = \
                    self.available_tracks[track_options['file_type']]
            else:
                raise InputError(f"Section {section_name}: there is no file_type nor file "
                                 "specified and it is not a [spacer] nor a "
                                 "[x-axis] section. This is not a valid "
                                 "section.")
            # Now we should have a 'track_class' set.
            # We can get for it all the necessary and possible keywords
            track_class = track_options['track_class']
            NECESSARY_PROPERTIES = track_class.NECESSARY_PROPERTIES
            for necessary_name in NECESSARY_PROPERTIES:
                if necessary_name not in all_keywords:
                    raise InputError(f"The section {section_name} is "
                                     "describing a object of"
                                     f" type {track_class} but the necessary "
                                     f"property {necessary_name}"
                                     " is not part of the config file.")
            unused_keys = []
            # Now we can proceed with the keywords:
            for name, value in parser.items(section_name):
                # To be removed in the next 1.0 version
                if ' ' in name:
                    old_name = name
                    name = '_'.join(name.split(' '))
                    log.warning(f"Deprecated Warning: The section {section_name} "
                                f"uses parameter {old_name} but there is no more "
                                "parameter with space in name. "
                                f"Will be substituted by {name}.\n")
                else:
                    old_name = name
                # end
                SYNONYMOUS_PROPERTIES = track_class.SYNONYMOUS_PROPERTIES
                # If the name is part of the synonymous we substitute by
                # the synonymous value
                if name in SYNONYMOUS_PROPERTIES and \
                        value in SYNONYMOUS_PROPERTIES[name]:
                    track_options[name] = SYNONYMOUS_PROPERTIES[name][value]
                elif name in track_class.STRING_PROPERTIES:
                    track_options[name] = value
                elif name in track_class.BOOLEAN_PROPERTIES:
                    try:
                        # I need to use old_name here else I get a KeyError:
                        track_options[name] = parser.getboolean(section_name,
                                                                old_name)
                        # In the next 1.0 should be:
                        # track_options[name] = parser.getboolean(section_name,
                        #                                         name)
                    except ValueError:
                        raise InputError(f"In section {section_name}, "
                                         f"{old_name} was set to {value}"
                                         " whereas we should have a boolean "
                                         "value. Please, use true or false.")
                        # In the next 1.0 should be:
                        #                f"{name} was set to {value}"
                    if value.lower() not in ['true', 'false']:
                        log.warning("Deprecation Warning: "
                                    f"In section {section_name}, {name} was "
                                    f"set to {value}"
                                    " whereas in the future only"
                                    " true and false value will be"
                                    " accepted.\n")
                elif name in track_class.FLOAT_PROPERTIES:
                    try:
                        track_options[name] = float(value)
                    except ValueError:
                        raise InputError(f"In section {section_name}, {name} "
                                         f"was set to {value}"
                                         " whereas we should have a float "
                                         "value.")
                    min_value, max_value = track_class.FLOAT_PROPERTIES[name]
                    if track_options[name] < min_value or \
                            track_options[name] > max_value:
                        raise InputError(f"In section {section_name}, {name} "
                                         f"was set to {value}"
                                         " whereas it should be between "
                                         f"{min_value} and {max_value}.")
                elif name in track_class.INTEGER_PROPERTIES:
                    try:
                        track_options[name] = int(value)
                    except ValueError:
                        raise InputError(f"In section {section_name}, {name} "
                                         f"was set to {value}"
                                         " whereas we should have an integer "
                                         "value.")
                    min_value, max_value = track_class.INTEGER_PROPERTIES[name]
                    if track_options[name] < min_value or \
                            track_options[name] > max_value:
                        raise InputError(f"In section {section_name}, {name} "
                                         f"was set to {value}"
                                         " whereas it should be between "
                                         f"{min_value} and {max_value}.")
                else:
                    unused_keys.append(name)
            # If there are unused keys they are printed in a warning.
            if len(unused_keys) > 0:
                log.warning(f"In section {section_name}, these parameters are "
                            f"unused:{unused_keys}.\n")
            # The track_options will be checked for the file paths:
            track_options = self.check_file_exists(track_options,
                                                   tracks_file_path,
                                                   track_options['file_type'] == 'hic_matrix')
            # The 'overlay_previous' is initialized:
            if 'overlay_previous' not in track_options:
                track_options['overlay_previous'] = 'no'
            if track_options['overlay_previous'] not in ['no', 'yes', 'share-y']:
                raise InputError(f"In section {section_name}, overlay_previous "
                                 f"was set to {track_options['overlay_previous']}."
                                 " Possible options are no, yes, share-y")
            # If there is no title:
            if 'title' not in track_options:
                track_options['title'] = ''
                if track_options['overlay_previous'] == 'no' and \
                        track_options['track_class'] not in [SpacerTrack,
                                                             XAxisTrack]:
                    log.warning("title not set for section "
                                f"{track_options['section_name']}\n")
            # The track_options are added to the track_list
            track_list.append(track_options)
        # Now that they were all checked
        self.track_list = track_list
        if self.vlines_properties:
            self.vlines_intval_tree, __, __ = \
                file_to_intervaltree(self.vlines_properties['file'],
                                     plot_regions)

[docs]    def close_files(self):
        """
        Close all opened files
        """
        for track in self.track_obj_list:
            track.__del__()

    @staticmethod
[docs]    def check_file_exists(track_dict, tracks_path, is_hic=False):
        """
        Checks if a file or list of files exists. If the file does not exist
        tries to check if the file may be relative to the track_file path,
        in such case the path is updated.
        :param track_dict: dictionary of track values. Should contain
                            a 'file' key containing the path of the file
                            or files to be checked separated by space
                            For example: file1 file2 file3
        :param tracks_path: path of the tracks file
        :param is_hic:
        :return: None
        """
        for key in track_dict.keys():
            if key.endswith("file"):
                file_field_name = key
                # # THIS COULD BE REMOVED IN A NEXT 1.0 VERSION
                if file_field_name == 'boundaries_file':
                    log.warning("Deprecation Warning: "
                                "The boundaries_file is not used anymore."
                                " It will be ignored."
                                " Please use another track with the"
                                " `overlay_previous` option.\n")
                # # END
                file_names = [x for x in track_dict[file_field_name].split(" ") if x != '']
                full_path_file_names = []
                for file_name in file_names:
                    if is_hic and not file_name.endswith('.h5'):
                        file_name_to_check = file_name.split("::")[0]
                    else:
                        file_name_to_check = file_name

                    try:
                        open(file_name_to_check, 'r').close()
                        full_path_file_names.append(file_name)
                    except IOError:
                        try:
                            # try to find the file in the same path as the
                            # track file
                            name_with_tracks_path = tracks_path + "/" + file_name
                            name_with_tracks_path_to_check = tracks_path + "/" + file_name_to_check
                            open(name_with_tracks_path_to_check, 'r').close()
                            full_path_file_names.append(name_with_tracks_path)
                        except IOError:
                            raise InputError(f"File in section [{track_dict['section_name']}] "
                                             f"not found:\n{file_name}\n\n")

                track_dict[file_field_name] = " ".join(full_path_file_names)
        return track_dict

    @staticmethod
[docs]    def guess_filetype(track_dict, available_tracks):
        """
        :param track_dict: dictionary of track values with the 'file' key
                    containing a string path of the file or files.
                    Only the ending of the last file is used
                    in case when there are more files
        :param available_tracks: list of available tracks

        :return: string file type detected
        """
        file_ = track_dict['file'].strip()
        file_type = None
        for track_type, track_class in available_tracks.items():
            for ending in track_class.SUPPORTED_ENDINGS:
                if file_.endswith(ending):
                    if file_type == track_class.TRACK_TYPE:
                        raise InputError("file_type already defined in other"
                                         " GenomeTrack")
                    else:
                        file_type = track_class.TRACK_TYPE

        if file_type is None:
            raise InputError(f"Section {track_dict['section_name']}: can not "
                             "identify file type. Please"
                             " specify the file_type for '{file}'")

        return file_type

    @staticmethod
[docs]    def cm2inch(*tupl):
        inch = 2.54
        if isinstance(tupl[0], tuple):
            return tuple(i / inch for i in tupl[0])
        else:
            return tuple(i / inch for i in tupl)

    @staticmethod
[docs]    def print_elapsed(start):
        if start:
            log.info(time.time() - start)
        return time.time()


[docs]class SpacerTrack(GenomeTrack):
[docs]    SUPPORTED_ENDINGS = []
[docs]    TRACK_TYPE = 'spacer'
[docs]    DEFAULTS_PROPERTIES = {}
[docs]    NECESSARY_PROPERTIES = []
[docs]    SYNONYMOUS_PROPERTIES = {}
[docs]    POSSIBLE_PROPERTIES = {}
[docs]    BOOLEAN_PROPERTIES = []
[docs]    STRING_PROPERTIES = ['overlay_previous',
                         'title', 'file_type']
[docs]    FLOAT_PROPERTIES = {'height': [0, np.inf]}
[docs]    INTEGER_PROPERTIES = {}

[docs]    def plot(self, ax, chrom_region, start_region, end_region):
        pass

[docs]    def plot_y_axis(self, ax, plot_ax):
        pass


[docs]class XAxisTrack(GenomeTrack):
[docs]    SUPPORTED_ENDINGS = []
[docs]    TRACK_TYPE = 'x_axis'
[docs]    NECESSARY_PROPERTIES = []
[docs]    DEFAULTS_PROPERTIES = {'where': 'bottom',
                           'fontsize': 15}
[docs]    SYNONYMOUS_PROPERTIES = {}
[docs]    POSSIBLE_PROPERTIES = {'where': ['top', 'bottom']}
[docs]    BOOLEAN_PROPERTIES = []
[docs]    STRING_PROPERTIES = ['overlay_previous',
                         'title', 'where', 'file_type']
[docs]    FLOAT_PROPERTIES = {'fontsize': [0, np.inf],
                        'height': [0, np.inf]}
[docs]    INTEGER_PROPERTIES = {}

    def __init__(self, *args, **kwargs):
        super(XAxisTrack, self).__init__(*args, **kwargs)

[docs]    def plot(self, ax, chrom_region, region_start, region_end):
        type(region_start)
        type(region_end)

        start, end = ax.get_xlim()
        if self.properties['where'] == 'top':
            ax.axis["x"] = ax.new_floating_axis(0, 0.2)
            ax.axis["x"].set_axis_direction("top")
            label_y_pos = 0.99
            vert_align = 'top'
        else:
            ax.axis["x"] = ax.new_floating_axis(0, 0.9)
            label_y_pos = 0.01
            vert_align = 'bottom'

        # First adjust the size of the label
        ax.axis["x"].major_ticklabels.set(size=self.properties['fontsize'])

        # Get the ticks values
        ticks = ax.get_xticks()
        if ticks[-1] - ticks[1] <= 1e3:
            labels = [f"{x:,.0f}"
                      for x in ticks]
            labels[-2] += " b"

        elif ticks[-1] - ticks[1] <= 4e5:
            labels = [f"{x / 1000.0:,.0f}"
                      for x in ticks]
            labels[-2] += " Kb"

        else:
            labels = [f"{x / 1000000.0:,.1f} "
                      for x in ticks]
            labels[-2] += " Mbp"

        # Fix ticks values
        ax.set_xticks(ticks)

        # Fix the limits which can be overwritten by set_xticks:
        ax.set_xlim(start, end)

        # Put the label
        ax.set_xticklabels(labels)

        # Add the chromosome name
        ax.text(0.5, label_y_pos, chrom_region, horizontalalignment='center',
                fontsize=self.properties['fontsize'],
                verticalalignment=vert_align, transform=ax.transAxes)

[docs]    def plot_y_axis(self, ax, plot_ax):
        pass


[docs]def prepare_config(file_configs, add_spacer=True, spacer_height=0.5):
    """
    Prepare pyGenomeTracks config string.

    Parameters
    ----------
    file_configs
        A list of file paths, or a list of file config dicts, containing file path and other config.
        See pyGenomeTracks documentation for possible parameters.
    add_spacer
        Whether add spacer between tracks
    spacer_height
        spacer height in cm

    Returns
    -------
    a single config string that can be read by PlotTracks
    """
    config_str = f"""
# pyGenomeTrack documentation: https://pygenometracks.readthedocs.io/en/latest/content/all_tracks.html
[x-axis]
[spacer]
height = {spacer_height}
"""

    available_tracks = PlotTracks.get_available_tracks()
    for file_config in file_configs:
        if isinstance(file_config, (str, pathlib.Path)):
            # only file path provided
            file_config = {'file': file_config}

        if isinstance(file_config, dict):
            track_added = False
            if 'file' not in file_config:
                raise KeyError(f'file config dict do not contain "file" key. The provided config was \n{file_config}')
            file_path = file_config['file']
            file_path = pathlib.Path(file_path)
            if 'title' not in file_config:
                label = ".".join(file_path.name.split(".")[0:-1])
                file_config['title'] = label

            if file_path.name.endswith('cool'):
                # assume cool file
                file_config['file_type'] = 'cooler'

            this_add_spacer = add_spacer
            overlay = file_config.get('overlay_previous')
            if overlay in {'yes', 'share-y'}:
                this_add_spacer = False

            if 'file_type' in file_config:
                track_type = file_config['file_type']
                track_class = available_tracks[track_type]
                print(f"Adding {track_type} file: {file_path.name}")
                config_str += _prepare_track_config(file_config=file_config,
                                                    track_type=track_type,
                                                    track_class=track_class,
                                                    add_spacer=this_add_spacer,
                                                    spacer_height=spacer_height)
                track_added = True
            else:
                for track_type, track_class in available_tracks.items():
                    for ending in track_class.SUPPORTED_ENDINGS:
                        if file_path.name.endswith(ending):
                            print(f"Adding {track_type} file: {file_path.name}\n")
                            config_str += _prepare_track_config(file_config=file_config,
                                                                track_type=track_type,
                                                                track_class=track_class,
                                                                add_spacer=this_add_spacer,
                                                                spacer_height=spacer_height)
                            track_added = True

            if track_added is False:
                print(f"WARNING: file format not recognized for: {file_path.name}\n")
                print('Provide "file_type" key in the file config, or use supported endings:')
                for track_type, track_class in available_tracks.items():
                    print(f'{track_type}: {",".join(track_class.SUPPORTED_ENDINGS)}')
        else:
            raise TypeError(f'file_configs must be a list of file config dict, or file paths, '
                            f'got type {type(file_config)} with \n{file_config}')
    return config_str


[docs]def _prepare_track_config(file_config, track_type, track_class, add_spacer=True, spacer_height=0.5):
    config_str = ''
    if add_spacer:
        config_str += f"\n[spacer]\n" \
                      f"height = {spacer_height}\n"

    for required_config in track_class.NECESSARY_PROPERTIES:
        if required_config not in file_config:
            raise KeyError(f'file config dict of track_type {track_type} '
                           f'missing required config {required_config}. \n{file_config}')
    final_config = track_class.DEFAULTS_PROPERTIES.copy()
    final_config.update(file_config)

    kv_pairs = []
    for k, v in final_config.items():
        if v is None:
            kv_pair = f'{k} = none'  # config ini recognize None as string
        else:
            kv_pair = f'{k} = {v}'
        if k not in file_config:
            # comment out default value:
            kv_pair = '#' + kv_pair
        kv_pairs.append(kv_pair)

    file_config_str = '\n'.join(kv_pairs)
    config_str += f"\n[{final_config['title']}]\n{file_config_str}"
    config_str += f'\n# See doc: https://pygenometracks.readthedocs.io/en/latest/content/tracks/{track_type}.html\n'


    return config_str