"""
Modified from pygenometracks
LICENSE: https://github.com/deeptools/pyGenomeTracks/blob/master/LICENSE
"""
import logging
import os
import pathlib
import time
import warnings
from collections import OrderedDict
from configparser import ConfigParser
import matplotlib
import matplotlib.cm
import matplotlib.colors
import matplotlib.gridspec
import matplotlib.pyplot as plt
import matplotlib.textpath
import mpl_toolkits.axisartist as axisartist
import numpy as np
from pygenometracks.tracks.GenomeTrack import GenomeTrack
from pygenometracks.utilities import InputError
from pygenometracks.utilities import file_to_intervaltree, change_chrom_names
matplotlib.use('Agg')
warnings.filterwarnings("ignore", message="numpy.dtype size changed")
warnings.filterwarnings("ignore", message="numpy.ndarray size changed")
warnings.simplefilter(action='ignore', category=FutureWarning)
warnings.simplefilter(action='ignore', category=DeprecationWarning)
warnings.simplefilter(action='ignore', category=ImportWarning)
# import warnings
# warnings.filterwarnings('error')
logging.basicConfig(format=FORMAT)
[docs]log = logging.getLogger(__name__)
# logging.basicConfig()
# log = logging.getLogger("tracksClass")
log.setLevel(logging.DEBUG)
[docs]DEFAULT_TRACK_HEIGHT = 0.5 # in centimeters
# proportion of width dedicated to (figure, legends)
[docs]DEFAULT_WIDTH_RATIOS = (0.01, 0.90, 0.1)
[docs]DEFAULT_MARGINS = {'left': 0.04, 'right': 0.92, 'bottom': 0.03, 'top': 0.97}
[docs]class MultiDict(OrderedDict):
"""
Class to allow identically named
sections in configuration file
by appending the section number
for example:
1. section name
"""
[docs] def __setitem__(self, key, val):
if isinstance(val, OrderedDict):
self._unique += 1
key = f"{str(self._unique)}. [{key}]"
OrderedDict.__setitem__(self, key, val)
[docs]class PlotTracks(object):
def __init__(self,
config,
fig_width=DEFAULT_FIGURE_WIDTH,
fig_height=None,
fontsize=None,
dpi=None,
track_label_width=None,
plot_regions=None,
plot_width=None):
self.fig_width = fig_width
self.fig_height = fig_height
self.dpi = dpi
self.vlines_intval_tree = None
self.vlines_properties = None
self.track_list = []
start = self.print_elapsed(None)
self.available_tracks = self.get_available_tracks()
self.parse_tracks(config, plot_regions=plot_regions)
if fontsize:
fontsize = fontsize
else:
fontsize = float(fig_width) * 0.3
# the track label width is the fraction of
# the figure width that is used
# for the track 'title' or label.
if track_label_width is None:
self.width_ratios = DEFAULT_WIDTH_RATIOS
else:
self.width_ratios = (0.01,
1 - track_label_width,
track_label_width)
# Process the width:
if plot_width is not None:
self.fig_width = plot_width / (
DEFAULT_MARGINS['right'] - DEFAULT_MARGINS['left']) * (
1 + 2 / 3 * 0.01) / (
self.width_ratios[1] / sum(self.width_ratios))
font = {'size': fontsize}
matplotlib.rc('font', **font)
# initialize each track
self.track_obj_list = []
for idx, properties in enumerate(self.track_list):
log.info(f"initialize {properties['section_name']}")
# the track_class is obtained from the available tracks
track_class = self.available_tracks[properties['file_type']]
properties['region'] = plot_regions
self.track_obj_list.append(track_class(properties))
log.info("time initializing track(s):")
self.print_elapsed(start)
@staticmethod
[docs] def get_available_tracks():
avail_tracks = {}
work = [GenomeTrack]
while work:
parent = work.pop()
for child in parent.__subclasses__():
if child not in avail_tracks:
track_type = child.TRACK_TYPE
avail_tracks[track_type] = child
work.append(child)
# plus tracks defined in ALLCools
from .HiCMatrixCoolTrack import HiCMatrixCoolTrack
avail_tracks['cooler'] = HiCMatrixCoolTrack
# swap the GtfTrack in pygenometracks with this class in ALLCools
from .GtfTrack import GtfTrack
avail_tracks['gtf'] = GtfTrack
return avail_tracks
[docs] def get_tracks_height(self, start_region=None, end_region=None):
"""
The main purpose of the following loop is
to get the height of each of the tracks
because for the Hi-C the height is variable with respect
to the range being plotted, the function is called
when each plot is going to be printed.
Args:
start_region: start of the region to plot.
Only used in case the plot is a Hi-C matrix
end_region: end of the region to plot.
Only used in case the plot is a Hi-C matrix
Returns:
"""
track_height = []
for i, track_dict in enumerate(self.track_list):
if i == 0 and track_dict['overlay_previous'] != 'no':
log.warning("First track can not have the `overlay_previous` option.\n")
self.track_list[i]['overlay_previous'] = 'no'
# if overlay_previous is set to a value other than no
# then, skip this track height
if track_dict['overlay_previous'] != 'no':
continue
elif 'height' in track_dict:
height = track_dict['height']
elif track_dict['file_type'] == 'x_axis':
height = track_dict['fontsize'] / 8
elif 'depth' in track_dict and \
track_dict['file_type'] in ('hic_matrix', 'cooler'):
# compute the height of a Hi-C track
# based on the depth such that the
# resulting plot appears proportional
#
# /|\
# / | \
# / |d \ d is the depth that we want to be proportional
# / | \ when plotted in the figure
# ------------------
# region len
#
# d (in cm) = depth (in bp) * 0.5 *
# width (in cm) / region len (in bp)
# to compute the actual width of the figure the margins
# and the region
# set for the legends have to be considered
# DEFAULT_MARGINS['right'] - DEFAULT_MARGINS['left']
# is the proportion of plotting area
# This plotting area is divided in three part as specified in
# self.width_ratios (normalized to 1)
# And as wspace is specified 0.01,
# 0.01 of the mean of the 3 regions is not occupied.
# 1 / (1 + 2 / 3 * 0.01) is used to plot.
hic_width = \
self.fig_width * \
(DEFAULT_MARGINS['right'] - DEFAULT_MARGINS['left']) / \
(1 + 2 / 3 * 0.01) * \
self.width_ratios[1] / sum(self.width_ratios)
# the scale factor is to obtain each bin as a square
# (a 45 degree rotated matrix)
scale_factor = 0.5
depth = min(track_dict['depth'],
int((end_region - start_region) * 1.25))
height = scale_factor * depth * hic_width / (end_region - start_region)
else:
height = DEFAULT_TRACK_HEIGHT
self.track_list[i]['height'] = height
track_height.append(height)
return track_height
[docs] def plot(self, chrom, start, end, file_name=None, title=None,
h_align_titles='left', decreasing_x_axis=False):
track_height = self.get_tracks_height(start_region=start,
end_region=end)
if self.fig_height:
fig_height = self.fig_height
else:
fig_height = sum(track_height) / \
(DEFAULT_MARGINS['top'] - DEFAULT_MARGINS['bottom'])
log.debug(f"Figure size in cm is {self.fig_width} x {fig_height}."
f" Dpi is set to {self.dpi}\n")
fig = plt.figure(figsize=self.cm2inch(self.fig_width, fig_height))
fig.subplots_adjust(wspace=0, hspace=0.0,
left=DEFAULT_MARGINS['left'],
right=DEFAULT_MARGINS['right'],
bottom=DEFAULT_MARGINS['bottom'],
top=DEFAULT_MARGINS['top'])
if title:
fig.suptitle(title)
grids = matplotlib.gridspec.GridSpec(len(track_height), 3,
height_ratios=track_height,
width_ratios=self.width_ratios,
wspace=0.01)
axis_list = []
# skipped_tracks is the count of tracks that have the
# 'overlay_previous' parameter and should be skipped
skipped_tracks = 0
plot_axis = None
y_axis = None
label_axis = None
width_dpi = None
ylim = None
for idx, track in enumerate(self.track_obj_list):
log.info(f"plotting {track.properties['section_name']}")
if track.properties['overlay_previous'] in ['yes', 'share-y']:
overlay = True
skipped_tracks += 1
else:
overlay = False
if track.properties['overlay_previous'] == 'share-y':
ylim = plot_axis.get_ylim()
else:
idx -= skipped_tracks
plot_axis = axisartist.Subplot(fig, grids[idx, 1])
fig.add_subplot(plot_axis)
# turns off the lines around the tracks
plot_axis.axis[:].set_visible(False)
# to make the background transparent
plot_axis.patch.set_visible(False)
if not overlay:
y_axis = plt.subplot(grids[idx, 0])
y_axis.set_axis_off()
label_axis = plt.subplot(grids[idx, 2])
label_axis.set_axis_off()
# I get the width of the label_axis to be able to wrap the
# labels when right or center aligned.
width_inch = label_axis.get_window_extent().width
width_dpi = width_inch * self.dpi / fig.dpi
if decreasing_x_axis:
plot_axis.set_xlim(end, start)
else:
plot_axis.set_xlim(start, end)
track.plot(plot_axis, chrom, start, end)
track.plot_y_axis(y_axis, plot_axis)
track.plot_label(label_axis, width_dpi=width_dpi,
h_align=h_align_titles)
if track.properties['overlay_previous'] == 'share-y':
plot_axis.set_ylim(ylim)
if not overlay:
axis_list.append(plot_axis)
if self.vlines_intval_tree:
self.plot_vlines(axis_list, chrom, start, end)
if file_name is not None:
fig.savefig(file_name, dpi=self.dpi, transparent=False)
return fig
[docs] def plot_vlines(self, axis_list, chrom_region, start_region, end_region):
"""
Plots dotted lines from the top of the first plot to the bottom
of the last plot at the specified positions.
:param axis_list: list of plotted axis
:param chrom_region chromosome name
:param start_region start position
:param end_region end position
:return: None
"""
vlines_list = []
if 'line_width' in self.vlines_properties:
line_width = self.vlines_properties['line_width']
else:
line_width = 0.5
if chrom_region not in list(self.vlines_intval_tree):
chrom_region_before = chrom_region
chrom_region = change_chrom_names(chrom_region)
if chrom_region not in list(self.vlines_intval_tree):
log.warning("*Warning*\nNo interval was found when "
f"overlapping with both {chrom_region_before}:{start_region}-{end_region}"
f" and {chrom_region}:{start_region}-{end_region} inside the "
"file with vertical lines. "
"No vertical lines will be "
"plotted!!\n")
return
chrom_region = GenomeTrack.check_chrom_str_bytes(self.vlines_intval_tree, chrom_region)
for region in sorted(self.vlines_intval_tree[chrom_region][start_region - 10000:end_region + 10000]):
vlines_list.append(region.begin)
for ax in axis_list:
ymin, ymax = ax.get_ylim()
ax.vlines(vlines_list, ymin, ymax, linestyle='dashed', zorder=10,
linewidth=line_width,
color=(0, 0, 0, 0.7), alpha=0.5)
return
[docs] def parse_tracks(self, tracks_file, plot_regions=None):
"""
Parses a configuration file
:param tracks_file: file path containing the track configuration
:param plot_regions: a list of tuple [(chrom1, start1, end1), (chrom2, start2, end2)]
on which the data should be loaded
here the vlines
:return: array of dictionaries and vlines_file.
One dictionary per track
"""
try:
if isinstance(tracks_file, str) and not pathlib.Path(tracks_file).exists():
# assume the tracks_file are the config string
import io
handle = io.StringIO(tracks_file)
else:
handle = open(tracks_file, 'r')
except OSError:
# if the config string too long, path exists raise error.
import io
handle = io.StringIO(tracks_file)
parser = ConfigParser(dict_type=MultiDict, strict=False)
parser.read_file(handle)
handle.close()
tracks_file_path = os.path.dirname(tracks_file)
track_list = []
for section_name in parser.sections():
# track_options is what will become the self.properties
track_options = dict({"section_name": section_name})
all_keywords = [i[0] for i in parser.items(section_name)]
# First we check if there is a skip set to true:
if 'skip' in all_keywords and \
parser.getboolean(section_name, 'skip'):
# In this case we just do not explore the section
continue
# Then the vlines are treated differently:
if ('type', 'vlines') in parser.items(section_name):
# The only thing to check is the file
# There is no other parameters to use.
if 'file' not in all_keywords:
raise InputError(f"The section {section_name} is supposed to be a vline"
" but there is no file.")
track_options['file'] = parser.get(section_name, 'file')
if 'line_width' in all_keywords:
try:
track_options['line_width'] = float(parser.get(section_name, 'line_width'))
except ValueError:
raise InputError(f"In section {section_name}, line_width "
f"was set to {parser.get(section_name, 'line_width')}"
" whereas we should have a float "
"value.")
extra_keywords = [k for k in all_keywords
if k not in ['file', 'type', 'line_width']]
if len(extra_keywords) > 0:
log.warning("These parameters were specified but will not"
f" be used {' '.join(extra_keywords)}.\n")
self.vlines_properties = \
self.check_file_exists(track_options, tracks_file_path)
continue
# For the other cases, we will append properties dictionnaries
# to the track_list
# If the sections are spacer or x-axis we fill the file_type:
# (They are special sections where the title defines the track type)
if section_name.endswith('[spacer]'):
track_options['file_type'] = 'spacer'
track_options['track_class'] = SpacerTrack
elif section_name.endswith('[x-axis]'):
track_options['file_type'] = 'x_axis'
track_options['track_class'] = XAxisTrack
# For the others we need to have a 'file_type'
# Either the file_type is part of the keywords
elif 'file_type' in all_keywords:
track_options['file_type'] = parser.get(section_name,
'file_type')
if track_options['file_type'] not in self.available_tracks:
raise InputError(f"Section {section_name}: the file_type "
f"{track_options['file_type']} does not"
" exists.\npossible file_type are:"
f"{self.available_tracks.keys()}.")
track_options['track_class'] = \
self.available_tracks[track_options['file_type']]
# Or we guess it from the file:
elif 'file' in all_keywords:
track_options['file'] = parser.get(section_name,
'file')
track_options['file_type'] = \
self.guess_filetype(track_options,
self.available_tracks)
track_options['track_class'] = \
self.available_tracks[track_options['file_type']]
else:
raise InputError(f"Section {section_name}: there is no file_type nor file "
"specified and it is not a [spacer] nor a "
"[x-axis] section. This is not a valid "
"section.")
# Now we should have a 'track_class' set.
# We can get for it all the necessary and possible keywords
track_class = track_options['track_class']
NECESSARY_PROPERTIES = track_class.NECESSARY_PROPERTIES
for necessary_name in NECESSARY_PROPERTIES:
if necessary_name not in all_keywords:
raise InputError(f"The section {section_name} is "
"describing a object of"
f" type {track_class} but the necessary "
f"property {necessary_name}"
" is not part of the config file.")
unused_keys = []
# Now we can proceed with the keywords:
for name, value in parser.items(section_name):
# To be removed in the next 1.0 version
if ' ' in name:
old_name = name
name = '_'.join(name.split(' '))
log.warning(f"Deprecated Warning: The section {section_name} "
f"uses parameter {old_name} but there is no more "
"parameter with space in name. "
f"Will be substituted by {name}.\n")
else:
old_name = name
# end
SYNONYMOUS_PROPERTIES = track_class.SYNONYMOUS_PROPERTIES
# If the name is part of the synonymous we substitute by
# the synonymous value
if name in SYNONYMOUS_PROPERTIES and \
value in SYNONYMOUS_PROPERTIES[name]:
track_options[name] = SYNONYMOUS_PROPERTIES[name][value]
elif name in track_class.STRING_PROPERTIES:
track_options[name] = value
elif name in track_class.BOOLEAN_PROPERTIES:
try:
# I need to use old_name here else I get a KeyError:
track_options[name] = parser.getboolean(section_name,
old_name)
# In the next 1.0 should be:
# track_options[name] = parser.getboolean(section_name,
# name)
except ValueError:
raise InputError(f"In section {section_name}, "
f"{old_name} was set to {value}"
" whereas we should have a boolean "
"value. Please, use true or false.")
# In the next 1.0 should be:
# f"{name} was set to {value}"
if value.lower() not in ['true', 'false']:
log.warning("Deprecation Warning: "
f"In section {section_name}, {name} was "
f"set to {value}"
" whereas in the future only"
" true and false value will be"
" accepted.\n")
elif name in track_class.FLOAT_PROPERTIES:
try:
track_options[name] = float(value)
except ValueError:
raise InputError(f"In section {section_name}, {name} "
f"was set to {value}"
" whereas we should have a float "
"value.")
min_value, max_value = track_class.FLOAT_PROPERTIES[name]
if track_options[name] < min_value or \
track_options[name] > max_value:
raise InputError(f"In section {section_name}, {name} "
f"was set to {value}"
" whereas it should be between "
f"{min_value} and {max_value}.")
elif name in track_class.INTEGER_PROPERTIES:
try:
track_options[name] = int(value)
except ValueError:
raise InputError(f"In section {section_name}, {name} "
f"was set to {value}"
" whereas we should have an integer "
"value.")
min_value, max_value = track_class.INTEGER_PROPERTIES[name]
if track_options[name] < min_value or \
track_options[name] > max_value:
raise InputError(f"In section {section_name}, {name} "
f"was set to {value}"
" whereas it should be between "
f"{min_value} and {max_value}.")
else:
unused_keys.append(name)
# If there are unused keys they are printed in a warning.
if len(unused_keys) > 0:
log.warning(f"In section {section_name}, these parameters are "
f"unused:{unused_keys}.\n")
# The track_options will be checked for the file paths:
track_options = self.check_file_exists(track_options,
tracks_file_path,
track_options['file_type'] == 'hic_matrix')
# The 'overlay_previous' is initialized:
if 'overlay_previous' not in track_options:
track_options['overlay_previous'] = 'no'
if track_options['overlay_previous'] not in ['no', 'yes', 'share-y']:
raise InputError(f"In section {section_name}, overlay_previous "
f"was set to {track_options['overlay_previous']}."
" Possible options are no, yes, share-y")
# If there is no title:
if 'title' not in track_options:
track_options['title'] = ''
if track_options['overlay_previous'] == 'no' and \
track_options['track_class'] not in [SpacerTrack,
XAxisTrack]:
log.warning("title not set for section "
f"{track_options['section_name']}\n")
# The track_options are added to the track_list
track_list.append(track_options)
# Now that they were all checked
self.track_list = track_list
if self.vlines_properties:
self.vlines_intval_tree, __, __ = \
file_to_intervaltree(self.vlines_properties['file'],
plot_regions)
[docs] def close_files(self):
"""
Close all opened files
"""
for track in self.track_obj_list:
track.__del__()
@staticmethod
[docs] def check_file_exists(track_dict, tracks_path, is_hic=False):
"""
Checks if a file or list of files exists. If the file does not exist
tries to check if the file may be relative to the track_file path,
in such case the path is updated.
:param track_dict: dictionary of track values. Should contain
a 'file' key containing the path of the file
or files to be checked separated by space
For example: file1 file2 file3
:param tracks_path: path of the tracks file
:param is_hic:
:return: None
"""
for key in track_dict.keys():
if key.endswith("file"):
file_field_name = key
# # THIS COULD BE REMOVED IN A NEXT 1.0 VERSION
if file_field_name == 'boundaries_file':
log.warning("Deprecation Warning: "
"The boundaries_file is not used anymore."
" It will be ignored."
" Please use another track with the"
" `overlay_previous` option.\n")
# # END
file_names = [x for x in track_dict[file_field_name].split(" ") if x != '']
full_path_file_names = []
for file_name in file_names:
if is_hic and not file_name.endswith('.h5'):
file_name_to_check = file_name.split("::")[0]
else:
file_name_to_check = file_name
try:
open(file_name_to_check, 'r').close()
full_path_file_names.append(file_name)
except IOError:
try:
# try to find the file in the same path as the
# track file
name_with_tracks_path = tracks_path + "/" + file_name
name_with_tracks_path_to_check = tracks_path + "/" + file_name_to_check
open(name_with_tracks_path_to_check, 'r').close()
full_path_file_names.append(name_with_tracks_path)
except IOError:
raise InputError(f"File in section [{track_dict['section_name']}] "
f"not found:\n{file_name}\n\n")
track_dict[file_field_name] = " ".join(full_path_file_names)
return track_dict
@staticmethod
[docs] def guess_filetype(track_dict, available_tracks):
"""
:param track_dict: dictionary of track values with the 'file' key
containing a string path of the file or files.
Only the ending of the last file is used
in case when there are more files
:param available_tracks: list of available tracks
:return: string file type detected
"""
file_ = track_dict['file'].strip()
file_type = None
for track_type, track_class in available_tracks.items():
for ending in track_class.SUPPORTED_ENDINGS:
if file_.endswith(ending):
if file_type == track_class.TRACK_TYPE:
raise InputError("file_type already defined in other"
" GenomeTrack")
else:
file_type = track_class.TRACK_TYPE
if file_type is None:
raise InputError(f"Section {track_dict['section_name']}: can not "
"identify file type. Please"
" specify the file_type for '{file}'")
return file_type
@staticmethod
[docs] def cm2inch(*tupl):
inch = 2.54
if isinstance(tupl[0], tuple):
return tuple(i / inch for i in tupl[0])
else:
return tuple(i / inch for i in tupl)
@staticmethod
[docs] def print_elapsed(start):
if start:
log.info(time.time() - start)
return time.time()
[docs]class SpacerTrack(GenomeTrack):
[docs] DEFAULTS_PROPERTIES = {}
[docs] NECESSARY_PROPERTIES = []
[docs] SYNONYMOUS_PROPERTIES = {}
[docs] POSSIBLE_PROPERTIES = {}
[docs] BOOLEAN_PROPERTIES = []
[docs] STRING_PROPERTIES = ['overlay_previous',
'title', 'file_type']
[docs] FLOAT_PROPERTIES = {'height': [0, np.inf]}
[docs] INTEGER_PROPERTIES = {}
[docs] def plot(self, ax, chrom_region, start_region, end_region):
pass
[docs] def plot_y_axis(self, ax, plot_ax):
pass
[docs]class XAxisTrack(GenomeTrack):
[docs] NECESSARY_PROPERTIES = []
[docs] DEFAULTS_PROPERTIES = {'where': 'bottom',
'fontsize': 15}
[docs] SYNONYMOUS_PROPERTIES = {}
[docs] POSSIBLE_PROPERTIES = {'where': ['top', 'bottom']}
[docs] BOOLEAN_PROPERTIES = []
[docs] STRING_PROPERTIES = ['overlay_previous',
'title', 'where', 'file_type']
[docs] FLOAT_PROPERTIES = {'fontsize': [0, np.inf],
'height': [0, np.inf]}
[docs] INTEGER_PROPERTIES = {}
def __init__(self, *args, **kwargs):
super(XAxisTrack, self).__init__(*args, **kwargs)
[docs] def plot(self, ax, chrom_region, region_start, region_end):
type(region_start)
type(region_end)
start, end = ax.get_xlim()
if self.properties['where'] == 'top':
ax.axis["x"] = ax.new_floating_axis(0, 0.2)
ax.axis["x"].set_axis_direction("top")
label_y_pos = 0.99
vert_align = 'top'
else:
ax.axis["x"] = ax.new_floating_axis(0, 0.9)
label_y_pos = 0.01
vert_align = 'bottom'
# First adjust the size of the label
ax.axis["x"].major_ticklabels.set(size=self.properties['fontsize'])
# Get the ticks values
ticks = ax.get_xticks()
if ticks[-1] - ticks[1] <= 1e3:
labels = [f"{x:,.0f}"
for x in ticks]
labels[-2] += " b"
elif ticks[-1] - ticks[1] <= 4e5:
labels = [f"{x / 1000.0:,.0f}"
for x in ticks]
labels[-2] += " Kb"
else:
labels = [f"{x / 1000000.0:,.1f} "
for x in ticks]
labels[-2] += " Mbp"
# Fix ticks values
ax.set_xticks(ticks)
# Fix the limits which can be overwritten by set_xticks:
ax.set_xlim(start, end)
# Put the label
ax.set_xticklabels(labels)
# Add the chromosome name
ax.text(0.5, label_y_pos, chrom_region, horizontalalignment='center',
fontsize=self.properties['fontsize'],
verticalalignment=vert_align, transform=ax.transAxes)
[docs] def plot_y_axis(self, ax, plot_ax):
pass
[docs]def prepare_config(file_configs, add_spacer=True, spacer_height=0.5):
"""
Prepare pyGenomeTracks config string.
Parameters
----------
file_configs
A list of file paths, or a list of file config dicts, containing file path and other config.
See pyGenomeTracks documentation for possible parameters.
add_spacer
Whether add spacer between tracks
spacer_height
spacer height in cm
Returns
-------
a single config string that can be read by PlotTracks
"""
config_str = f"""
# pyGenomeTrack documentation: https://pygenometracks.readthedocs.io/en/latest/content/all_tracks.html
[x-axis]
[spacer]
height = {spacer_height}
"""
available_tracks = PlotTracks.get_available_tracks()
for file_config in file_configs:
if isinstance(file_config, (str, pathlib.Path)):
# only file path provided
file_config = {'file': file_config}
if isinstance(file_config, dict):
track_added = False
if 'file' not in file_config:
raise KeyError(f'file config dict do not contain "file" key. The provided config was \n{file_config}')
file_path = file_config['file']
file_path = pathlib.Path(file_path)
if 'title' not in file_config:
label = ".".join(file_path.name.split(".")[0:-1])
file_config['title'] = label
if file_path.name.endswith('cool'):
# assume cool file
file_config['file_type'] = 'cooler'
this_add_spacer = add_spacer
overlay = file_config.get('overlay_previous')
if overlay in {'yes', 'share-y'}:
this_add_spacer = False
if 'file_type' in file_config:
track_type = file_config['file_type']
track_class = available_tracks[track_type]
print(f"Adding {track_type} file: {file_path.name}")
config_str += _prepare_track_config(file_config=file_config,
track_type=track_type,
track_class=track_class,
add_spacer=this_add_spacer,
spacer_height=spacer_height)
track_added = True
else:
for track_type, track_class in available_tracks.items():
for ending in track_class.SUPPORTED_ENDINGS:
if file_path.name.endswith(ending):
print(f"Adding {track_type} file: {file_path.name}\n")
config_str += _prepare_track_config(file_config=file_config,
track_type=track_type,
track_class=track_class,
add_spacer=this_add_spacer,
spacer_height=spacer_height)
track_added = True
if track_added is False:
print(f"WARNING: file format not recognized for: {file_path.name}\n")
print('Provide "file_type" key in the file config, or use supported endings:')
for track_type, track_class in available_tracks.items():
print(f'{track_type}: {",".join(track_class.SUPPORTED_ENDINGS)}')
else:
raise TypeError(f'file_configs must be a list of file config dict, or file paths, '
f'got type {type(file_config)} with \n{file_config}')
return config_str
[docs]def _prepare_track_config(file_config, track_type, track_class, add_spacer=True, spacer_height=0.5):
config_str = ''
if add_spacer:
config_str += f"\n[spacer]\n" \
f"height = {spacer_height}\n"
for required_config in track_class.NECESSARY_PROPERTIES:
if required_config not in file_config:
raise KeyError(f'file config dict of track_type {track_type} '
f'missing required config {required_config}. \n{file_config}')
final_config = track_class.DEFAULTS_PROPERTIES.copy()
final_config.update(file_config)
kv_pairs = []
for k, v in final_config.items():
if v is None:
kv_pair = f'{k} = none' # config ini recognize None as string
else:
kv_pair = f'{k} = {v}'
if k not in file_config:
# comment out default value:
kv_pair = '#' + kv_pair
kv_pairs.append(kv_pair)
file_config_str = '\n'.join(kv_pairs)
config_str += f"\n[{final_config['title']}]\n{file_config_str}"
config_str += f'\n# See doc: https://pygenometracks.readthedocs.io/en/latest/content/tracks/{track_type}.html\n'
return config_str