diff --git a/Makefile b/Makefile index b674fc53..500c0d2e 100644 --- a/Makefile +++ b/Makefile @@ -105,7 +105,7 @@ test_para: $(OUTPUT2) clean: @make bats_cmd CMD=clean - @git checkout docs/manual/source/conf.py pygtftk/version.py; rm -rf pygtftk.egg-info build airway_love.txt* ENCFF630HEX_Total_RNAseq_K562_count_mini.txt STDIN.e* STDIN.o* dist cmd_list.txt example_list.txt tmp_list.txt simple.chromInfo prgm_list.txt test_list.txt *.bats *.completed *mini_real* heatmap_* tx_classes* *~ \#* hh profile_* toto tott; cd docs/manual/; make clean; cd ../..; find . -type f -name '*~' -exec rm -f '{}' \; + @git checkout docs/manual/source/conf.py pygtftk/version.py; rm -rf pygtftk.egg-info build airway_love.txt* ENCFF630HEX_Total_RNAseq_K562_count_mini.txt STDIN.e* closest_1.tsv STDIN.o* dist cmd_list.txt example_list.txt tmp_list.txt simple.chromInfo prgm_list.txt test_list.txt *.bats *.completed *mini_real* heatmap_* tx_classes* *~ \#* hh profile_* toto tott; cd docs/manual/; make clean; cd ../..; find . -type f -name '*~' -exec rm -f '{}' \; check_cmd_has_example: @for i in $$(gtftk -l); do if grep -q "^$$i" docs/manual/source/presentation.rst; then echo "" >/dev/null; else echo $$i; fi; done @@ -116,15 +116,10 @@ check_example_has_cmd: @for i in $$(cat example_list.txt); do if $$(cat cmd_list.txt | grep -q "^$$i") ; then echo "" >/dev/null; else echo $$i; fi; done @#rm -f cmd_list.txt example_list.txt tmp_list.txt -prepare_pip: - @touch pypi_release_in_progress - @rm -rf build/ dist/ pygtftk.egg-info/ - @python setup.py sdist - @python setup.py bdist_wheel - @rm -f pypi_release_in_progress - -send_to_pypi: - @twine upload --repository-url https://test.pypi.org/legacy/ dist/* --verbose - nb_test: @gtftk -p| perl -ne 'BEGIN{$$/="{"}{/\@test\s+"(\w+)_\d+"/; print $$1,"\n"}'| sort | uniq -c | sort -nr +release: + @touch release_in_progress + +unrelease: + @rm -f release_in_progress diff --git a/README.md b/README.md index 3bae091e..2d243d89 100644 --- a/README.md +++ b/README.md @@ -1,11 +1,10 @@ -[![Packagist](https://img.shields.io/packagist/l/doctrine/orm.svg)](https://github.com/dputhier/gtftk) [![contributions welcome](https://img.shields.io/badge/contributions-welcome-brightgreen.svg?style=flat)](https://github.com/dputhier/gtftk/issues) [![HitCount](http://hits.dwyl.io/puthier/gtftk.svg)](http://hits.dwyl.io/puthier/gtftk) -![GitHub release](https://img.shields.io/github/release/qubyte/rubidium.svg) +[![Packagist](https://img.shields.io/packagist/l/doctrine/orm.svg)](https://github.com/dputhier/pygtftk) [![contributions welcome](https://img.shields.io/badge/contributions-welcome-brightgreen.svg?style=flat)](https://github.com/dputhier/pygtftk/issues) [![HitCount](http://hits.dwyl.com/dputhier/pygtftk.svg)](http://hits.dwyl.com/dputhier/pygtftk) # Python GTF toolkit (pygtftk) -The **Python GTF toolkit (pygtftk) package** is intented to ease handling of GTF (Gene Transfer Format) files. The pygtftk package is compatible with Python 2.7 and relies on **libgtftk**, a library of functions **written in C**. +The **Python GTF toolkit (pygtftk) package** is intented to ease handling of GTF (Gene Transfer Format) files. The pygtftk package is compatible with Python 2.7 and Python >=3.5 and relies on **libgtftk**, a library of functions **written in C**. The package comes with a set of **UNIX commands** that can be accessed through the **gtftk program**. The gtftk program proposes several atomic tools to filter, convert, or extract data from GTF files. The gtftk set of Unix commands can be easily extended using a basic plugin architecture. All these aspects are covered in the help sections. @@ -13,20 +12,19 @@ While the gtftk Unix program comes with hundreds of unitary and functional tests ## System requirements -Depending on the **size of the GTF file**, pygtftk may require lot of memory to perform selected tasks. A computer with 16Go is recommended in order to be able to pipe several commands when working with human annotations from ensembl release (e.g. 91). +Depending on the **size of the GTF file**, pygtftk and gtftk may require lot of memory to perform selected tasks. A computer with 16Go is recommended in order to be able to pipe several commands when working with human annotations from ensembl release (e.g. 91). At the moment, the gtftk program has been tested on: - Linux (Ubuntu 12.04 and 18.04) - OSX (Yosemite, El Capitan). -- WSL/Bash on Ubuntu on Windows. ## Installation through conda package building -Installation through **conda** should be the **prefered install solution**. Although the GTF interface of pygtftk should work properly after a pip install (see next section), the UNIX commands (gtftk program) require several external dependencies with some version constrains. +Installation through **conda** should be the **prefered install solution**. The pygtftk package and gtftk command line tool require external dependencies with some version constrains (e.g. bedtools that, we observed, displays some back compatibility issue). -At the moment, there is no built conda package available. You can however create an environment with all prerequisites using the commands below. +A conda package will be available in the near future. In the meantime, you can however create an environment with all prerequisites using the commands below. If conda is not available on your system, first install miniconda from the official [web site](http://conda.pydata.org/miniconda.html). git clone git@github.com:dputhier/pygtftk.git pygtftk @@ -34,30 +32,27 @@ If conda is not available on your system, first install miniconda from the offic conda env create -n pygtftk_py3k -f conda/env.yaml python=3.6 source activate pygtftk_py3k make install + # It is important to call gtftk -h + # to find and dump plugin parsers + # before going further + gtftk -h -Note for developpers: You can install the develop branch using the same approach. - - git clone git@github.com:dputhier/pygtftk.git pygtftk - cd pygtftk - git checkout develop - conda env create -n pygtftk_py3k_dev -f conda/env.yaml python=3.6 - source activate pygtftk_py3k_dev - make install - ## Installation through pip ### Prerequesites -Again, this is not the prefered way for installation. Please choose conda whenever possible. The gtftk Unix command line program requires at least bedtools (command line). +Again, this is not the prefered way for installation. Please choose conda whenever possible. The gtftk Unix command line program has been tested with bedtools 2.27.1 (be aware that we have encountered some back compatibility issues with bedtools). ### Running pip Installation through pip can be done as follow. pip install -r requirements.txt - pip install pygtftk - + # It is important to call gtftk -h + # to find and dump plugin parsers + # before going further + gtftk -h ## Running functional tests diff --git a/bin/__init__.py b/bin/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/changelog.md b/changelog.md index 8d7309dc..fbd585a1 100644 --- a/changelog.md +++ b/changelog.md @@ -1,21 +1,34 @@ -## Changelog +# Changelog -### v0.9.2 (not-yet-release) +## v0.9.4 (not-yet-release) -#### Bug Fixes +### Bug Fixes -#### API Changes +### API Changes +### New Features -#### New Features -- pygtftk is now compatible with both python 2 and 3. +## v0.9.3 + +### Bug Fixes + +- User-defined colors are now applied when calling profile command (bug in 0.9.2). +- Fixed test issues when using md5sum under Linux. +- Lots of typo fixed (their must be lot remaining unfortunatly...). + +### API Changes + + +### New Features + +- pygtftk is now compatible with both python 2.7 and >=3.5. - libstdcxx is no more required in env.yaml. - 'Makefile clean' also reset version.py and conf.py to repository version. - Improved parser loading. - 5p_3p_coord has been renamed get_5p_3p_coords. -- Lots of typo fixed (their must be lot remaining unfortunatly...). - Added a pip requirement.txt file for developers. - Added a specific conda environment file for py2k. -- The default conda environment targets Python3.6. +- The default conda environment targets Python 3.6. - Improve garbage collector behavior upon exit. +- Added --system-info argument to gtftk. diff --git a/conda/env.yaml b/conda/env.yaml index d9810825..81c1cee4 100644 --- a/conda/env.yaml +++ b/conda/env.yaml @@ -17,8 +17,6 @@ dependencies: - pandas >=0.23.3 - scipy >=1.1.0 - pybedtools >=0.7.8 - - pybigwig >=0.3.10 - - pysam >=0.9.1.4 - pyyaml >=3.12 - gcc >=4.8.5 - requests >=2.13.0 @@ -30,4 +28,6 @@ dependencies: - plotnine >=0.4.0 - pip: - future + - pyBigWig >=0.3.12 + - future diff --git a/conda/env_py2k.yaml b/conda/env_py2k.yaml index 182d7927..b62ecc32 100644 --- a/conda/env_py2k.yaml +++ b/conda/env_py2k.yaml @@ -18,7 +18,6 @@ dependencies: - scipy >=1.1.0 - pybedtools >=0.7.8 - pybigwig >=0.3.10 - - pysam >=0.9.1.4 - pyyaml >=3.12 - gcc >=4.8.5 - requests >=2.13.0 @@ -26,8 +25,9 @@ dependencies: - pyparsing >=2.2.0 - biopython >=1.69 - zlib >=1.2.11 - - matplotlib >=2.0.2 + - matplotlib >=2.0.2,<3 - plotnine >=0.4.0 - pip: - future - - sphinxcontrib-programoutput \ No newline at end of file + - pyBigWig >=0.3.12 + - future \ No newline at end of file diff --git a/conda/meta.yaml b/conda/meta.yaml index 2ebfc3b9..a9b15544 100644 --- a/conda/meta.yaml +++ b/conda/meta.yaml @@ -21,7 +21,6 @@ requirements: - scipy >=1.1.0 - pybedtools >=0.7.8 - pybigwig >=0.3.10 - - pysam >=0.9.1.4 - pyyaml >=3.12 - gcc >=4.8.5 - requests >=2.13.0 @@ -33,6 +32,8 @@ requirements: - plotnine >=0.4.0 - pip: - future + - pyBigWig >=0.3.12 + - future run: - GitPython >=2.1.8 @@ -46,7 +47,6 @@ requirements: - scipy >=1.1.0 - pybedtools >=0.7.8 - pybigwig >=0.3.10 - - pysam >=0.9.1.4 - pyyaml >=3.12 - gcc >=4.8.5 - requests >=2.13.0 @@ -58,6 +58,8 @@ requirements: - plotnine >=0.4.0 - pip: - future + - pyBigWig >=0.3.12 + - future test: commands: diff --git a/conda/meta_py2k.yaml b/conda/meta_py2k.yaml index 5caed5b5..d72e24bf 100644 --- a/conda/meta_py2k.yaml +++ b/conda/meta_py2k.yaml @@ -20,8 +20,6 @@ requirements: - pandas >=0.23.3 - scipy >=1.1.0 - pybedtools >=0.7.8 - - pybigwig >=0.3.10 - - pysam >=0.9.1.4 - pyyaml >=3.12 - gcc >=4.8.5 - requests >=2.13.0 @@ -29,10 +27,12 @@ requirements: - pyparsing >=2.2.0 - biopython >=1.69 - zlib >=1.2.11 - - matplotlib >=2.0.2 + - matplotlib >=2.0.2,<3 - plotnine >=0.4.0 - pip: - future + - pybigwig >=0.3.12 + - future run: - GitPython >=2.1.8 @@ -45,8 +45,6 @@ requirements: - pandas >=0.23.3 - scipy >=1.1.0 - pybedtools >=0.7.8 - - pybigwig >=0.3.10 - - pysam >=0.9.1.4 - pyyaml >=3.12 - gcc >=4.8.5 - requests >=2.13.0 @@ -54,10 +52,12 @@ requirements: - pyparsing >=2.2.0 - biopython >=1.69 - zlib >=1.2.11 - - matplotlib >=2.0.2 + - matplotlib >=2.0.2,<3 - plotnine >=0.4.0 - pip: - future + - pybigwig >=0.3.12 + - future test: commands: diff --git a/docs/manual/build/html/.buildinfo b/docs/manual/build/html/.buildinfo index dd634509..54d8aaf3 100644 --- a/docs/manual/build/html/.buildinfo +++ b/docs/manual/build/html/.buildinfo @@ -1,4 +1,4 @@ # Sphinx build info version 1 # This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. -config: 5bba3f85f3e759061303af1056946e93 +config: 3eeb7851cd4315f822ba357e4cc51edd tags: 645f666f9bcd5a90fca523b33c5a78b7 diff --git a/docs/manual/build/html/_static/documentation_options.js b/docs/manual/build/html/_static/documentation_options.js index 5535fbf7..482f48fb 100644 --- a/docs/manual/build/html/_static/documentation_options.js +++ b/docs/manual/build/html/_static/documentation_options.js @@ -1,6 +1,6 @@ var DOCUMENTATION_OPTIONS = { URL_ROOT: document.getElementById("documentation_options").getAttribute('data-url_root'), - VERSION: '0.9.2', + VERSION: '0.9.3', LANGUAGE: 'en', COLLAPSE_INDEX: false, FILE_SUFFIX: '.html', diff --git a/docs/manual/build/html/about.html b/docs/manual/build/html/about.html index a9cb2d2d..7b0462ae 100644 --- a/docs/manual/build/html/about.html +++ b/docs/manual/build/html/about.html @@ -6,7 +6,7 @@ - About pygtftk — gtftk 0.9.2 documentation + About pygtftk — gtftk 0.9.3 documentation @@ -35,7 +35,7 @@

Navigation

  • previous |
  • - + @@ -199,7 +199,7 @@

    Navigation

  • previous |
  • - + @@ -3265,7 +3265,7 @@

    Navigation

  • previous |
  • - + @@ -157,7 +157,7 @@

    Navigation

  • previous |
  • - + @@ -232,7 +232,7 @@

    Navigation

  • previous |
  • - + @@ -485,7 +485,7 @@

    Navigation

  • modules |
  • - + @@ -119,7 +119,7 @@

    Navigation

  • next |
  • - + @@ -99,7 +99,7 @@

    Navigation

  • previous |
  • - + @@ -52,7 +52,7 @@

    Main parser arguments of gtftk

    The -h argument can be used to get a synopsis for implemented commands.

    $ gtftk -h
    -  Usage: gtftk [-h] [-b] [-p] [-v] [-l]  ...
    +  Usage: gtftk [-h] [-b] [-p] [-s] [-v] [-l]  ...
     
       A toolbox to handle GTF files.
     
    @@ -66,7 +66,7 @@ 

    Getting help with -hGetting help with -hapropos
    $ gtftk apropos -k promoter
    - |-- 12:56-INFO-apropos : >> Keyword 'promoter' was found in the following command:
    -	- coverage.
    + |-- 11:06-INFO-apropos : >> Keyword 'promoter' was found in the following command:
     	- divergent.
    +	- coverage.
     

    Arguments:

    @@ -313,36 +314,36 @@

    get_example
    $ gtftk get_example -d simple -f '*'
    - |-- 12:56-INFO-get_example : Copying: add_attr_to_pos.tab
    - |-- 12:56-INFO-get_example : Copying: simple.1.bt2
    - |-- 12:56-INFO-get_example : Copying: simple.2.bt2
    - |-- 12:56-INFO-get_example : Copying: simple.2.bw
    - |-- 12:56-INFO-get_example : Copying: simple.3.bt2
    - |-- 12:56-INFO-get_example : Copying: simple.3.bw
    - |-- 12:56-INFO-get_example : Copying: simple.4.bt2
    - |-- 12:56-INFO-get_example : Copying: simple.bam
    - |-- 12:56-INFO-get_example : Copying: simple.bam.bai
    - |-- 12:56-INFO-get_example : Copying: simple.bw
    - |-- 12:56-INFO-get_example : Copying: simple.chromInfo
    - |-- 12:56-INFO-get_example : Copying: simple.fa
    - |-- 12:56-INFO-get_example : Copying: simple.fa.fai
    - |-- 12:56-INFO-get_example : Copying: simple.geneList
    - |-- 12:56-INFO-get_example : Copying: simple.genes
    - |-- 12:56-INFO-get_example : Copying: simple.gtf
    - |-- 12:56-INFO-get_example : Copying: simple.join
    - |-- 12:56-INFO-get_example : Copying: simple.join_mat
    - |-- 12:56-INFO-get_example : Copying: simple.join_mat_2
    - |-- 12:56-INFO-get_example : Copying: simple.join_mat_3
    - |-- 12:56-INFO-get_example : Copying: simple.join_with_dup
    - |-- 12:56-INFO-get_example : Copying: simple.loc_bed
    - |-- 12:56-INFO-get_example : Copying: simple.map
    - |-- 12:56-INFO-get_example : Copying: simple.rev.1.bt2
    - |-- 12:56-INFO-get_example : Copying: simple.rev.2.bt2
    - |-- 12:56-INFO-get_example : Copying: simple_col.csv
    - |-- 12:56-INFO-get_example : Copying: simple_peaks.bed
    - |-- 12:56-INFO-get_example : Copying: simple_peaks.bed3
    - |-- 12:56-INFO-get_example : Copying: simple_peaks.bed6
    - |-- 12:56-INFO-get_example : Copying: simple_reads.fq
    + |-- 11:07-INFO-get_example : Copying: add_attr_to_pos.tab
    + |-- 11:07-INFO-get_example : Copying: simple.1.bt2
    + |-- 11:07-INFO-get_example : Copying: simple.2.bt2
    + |-- 11:07-INFO-get_example : Copying: simple.2.bw
    + |-- 11:07-INFO-get_example : Copying: simple.3.bt2
    + |-- 11:07-INFO-get_example : Copying: simple.3.bw
    + |-- 11:07-INFO-get_example : Copying: simple.4.bt2
    + |-- 11:07-INFO-get_example : Copying: simple.bam
    + |-- 11:07-INFO-get_example : Copying: simple.bam.bai
    + |-- 11:07-INFO-get_example : Copying: simple.bw
    + |-- 11:07-INFO-get_example : Copying: simple.chromInfo
    + |-- 11:07-INFO-get_example : Copying: simple.fa
    + |-- 11:07-INFO-get_example : Copying: simple.fa.fai
    + |-- 11:07-INFO-get_example : Copying: simple.geneList
    + |-- 11:07-INFO-get_example : Copying: simple.genes
    + |-- 11:07-INFO-get_example : Copying: simple.gtf
    + |-- 11:07-INFO-get_example : Copying: simple.join
    + |-- 11:07-INFO-get_example : Copying: simple.join_mat
    + |-- 11:07-INFO-get_example : Copying: simple.join_mat_2
    + |-- 11:07-INFO-get_example : Copying: simple.join_mat_3
    + |-- 11:07-INFO-get_example : Copying: simple.join_with_dup
    + |-- 11:07-INFO-get_example : Copying: simple.loc_bed
    + |-- 11:07-INFO-get_example : Copying: simple.map
    + |-- 11:07-INFO-get_example : Copying: simple.rev.1.bt2
    + |-- 11:07-INFO-get_example : Copying: simple.rev.2.bt2
    + |-- 11:07-INFO-get_example : Copying: simple_col.csv
    + |-- 11:07-INFO-get_example : Copying: simple_peaks.bed
    + |-- 11:07-INFO-get_example : Copying: simple_peaks.bed3
    + |-- 11:07-INFO-get_example : Copying: simple_peaks.bed6
    + |-- 11:07-INFO-get_example : Copying: simple_reads.fq
     

    Arguments:

    @@ -1182,22 +1183,22 @@

    merge_attr
    $ gtftk get_example |  gtftk merge_attr -k transcript_id,gene_id -d transcript_id -s "|" -f "*" | gtftk tabulate -k feature,transcript_id -x | head -n 6
     Traceback (most recent call last):
       File "/Users/puthier/miniconda3/envs/pygtftk_py3k/bin/gtftk", line 4, in <module>
    -    __import__('pkg_resources').run_script('pygtftk==0.9.1.dev0+7f5a', 'gtftk')
    +    __import__('pkg_resources').run_script('pygtftk==0.9.3', 'gtftk')
       File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pkg_resources/__init__.py", line 661, in run_script
         self.require(requires)[0].run_script(script_name, ns)
       File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pkg_resources/__init__.py", line 1441, in run_script
         exec(code, namespace, namespace)
    -  File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pygtftk-0.9.1.dev0+7f5a-py3.6-macosx-10.9-x86_64.egg/EGG-INFO/scripts/gtftk", line 83, in <module>
    +  File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pygtftk-0.9.3-py3.6-macosx-10.9-x86_64.egg/EGG-INFO/scripts/gtftk", line 83, in <module>
         args = main()
    -  File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pygtftk-0.9.1.dev0+7f5a-py3.6-macosx-10.9-x86_64.egg/EGG-INFO/scripts/gtftk", line 68, in main
    +  File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pygtftk-0.9.3-py3.6-macosx-10.9-x86_64.egg/EGG-INFO/scripts/gtftk", line 68, in main
         CmdManager.run(args)
    -  File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pygtftk-0.9.1.dev0+7f5a-py3.6-macosx-10.9-x86_64.egg/pygtftk/cmd_manager.py", line 939, in run
    +  File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pygtftk-0.9.3-py3.6-macosx-10.9-x86_64.egg/pygtftk/cmd_manager.py", line 977, in run
         fun(**args)
    -  File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pygtftk-0.9.1.dev0+7f5a-py3.6-macosx-10.9-x86_64.egg/pygtftk/plugins/merge_attr.py", line 92, in merge_attr
    +  File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pygtftk-0.9.3-py3.6-macosx-10.9-x86_64.egg/pygtftk/plugins/merge_attr.py", line 92, in merge_attr
         separator).write(outputfile,
    -  File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pygtftk-0.9.1.dev0+7f5a-py3.6-macosx-10.9-x86_64.egg/pygtftk/gtf_interface.py", line 536, in merge_attr
    +  File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pygtftk-0.9.3-py3.6-macosx-10.9-x86_64.egg/pygtftk/gtf_interface.py", line 538, in merge_attr
         self = self.add_attr_column(tmp_file, new_key)
    -  File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pygtftk-0.9.1.dev0+7f5a-py3.6-macosx-10.9-x86_64.egg/pygtftk/gtf_interface.py", line 3363, in add_attr_column
    +  File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pygtftk-0.9.3-py3.6-macosx-10.9-x86_64.egg/pygtftk/gtf_interface.py", line 3369, in add_attr_column
         tmp = input_file.readlines()
       File "/Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/tempfile.py", line 485, in func_wrapper
         return func(*args, **kwargs)
    @@ -1239,7 +1240,7 @@ 

    discretize_key
    $ gtftk get_example |  gtftk join_attr -j simple.join_mat -k gene_id -m | gtftk discretize_key -k S1 -d S1_d -n 2 | gtftk select_by_key -k feature -v gene
    - |-- 12:58-INFO-discretize_key : Categories: ['(0.231_0.616]', '(0.616_0.999]']
    + |-- 11:08-INFO-discretize_key : Categories: ['(0.231_0.616]', '(0.616_0.999]']
     chr1	gtftk	gene	125	138	.	+	.	gene_id "G0001";
     chr1	gtftk	gene	180	189	.	+	.	gene_id "G0002";
     chr1	gtftk	gene	50	61	.	-	.	gene_id "G0003"; S1 "0.2322"; S2 "0.4"; S1_d "(0.231_0.616]";
    @@ -1253,7 +1254,7 @@ 

    discretize_key @@ -1696,12 +1697,12 @@

    random_tx
    $ gtftk get_example -d mini_real -f '*'
    - |-- 13:01-INFO-get_example : Copying: #H3K4me3_cond_1.bed#
    - |-- 13:01-INFO-get_example : Copying: airway_love.txt.gz
    - |-- 13:01-INFO-get_example : Copying: ENCFF112BHN_H3K4me3_K562_sub.bed
    - |-- 13:01-INFO-get_example : Copying: ENCFF119BYM_H3K36me3_K562_sub.bed
    - |-- 13:01-INFO-get_example : Copying: ENCFF431HAA_H3K36me3_K562_sub.bw
    - |-- 13:01-INFO-get_example : Copying: ENCFF742FDS_H3K4me3_K562_sub.bw
    - |-- 13:01-INFO-get_example : Copying: ENCFF947DVY_H3K79me2_K562_sub.bw
    - |-- 13:01-INFO-get_example : Copying: H3K4me3_cond_1.bed
    - |-- 13:01-INFO-get_example : Copying: H3K4me3_cond_2.bed
    - |-- 13:01-INFO-get_example : Copying: H3K4me3_cond_3.bed
    - |-- 13:01-INFO-get_example : Copying: hg38.genome
    - |-- 13:01-INFO-get_example : Copying: hg38.genome.back
    - |-- 13:01-INFO-get_example : Copying: mini_real.gtf.gz
    - |-- 13:01-INFO-get_example : Copying: mini_real_control_1.txt
    - |-- 13:01-INFO-get_example : Copying: mini_real_counts_ENCFF630HEX.txt
    - |-- 13:01-INFO-get_example : Copying: mini_real_gn_list_hg38.txt
    - |-- 13:01-INFO-get_example : Copying: mini_real_noov_rnd_tx.gtf.gz
    - |-- 13:01-INFO-get_example : Copying: tx_classes.txt
    + |-- 11:41-INFO-get_example : Copying: #H3K4me3_cond_1.bed#
    + |-- 11:41-INFO-get_example : Copying: airway_love.txt.gz
    + |-- 11:41-INFO-get_example : Copying: ENCFF112BHN_H3K4me3_K562_sub.bed
    + |-- 11:41-INFO-get_example : Copying: ENCFF119BYM_H3K36me3_K562_sub.bed
    + |-- 11:41-INFO-get_example : Copying: ENCFF431HAA_H3K36me3_K562_sub.bw
    + |-- 11:41-INFO-get_example : Copying: ENCFF742FDS_H3K4me3_K562_sub.bw
    + |-- 11:41-INFO-get_example : Copying: ENCFF947DVY_H3K79me2_K562_sub.bw
    + |-- 11:41-INFO-get_example : Copying: H3K4me3_cond_1.bed
    + |-- 11:41-INFO-get_example : Copying: H3K4me3_cond_2.bed
    + |-- 11:41-INFO-get_example : Copying: H3K4me3_cond_3.bed
    + |-- 11:41-INFO-get_example : Copying: hg38.genome
    + |-- 11:41-INFO-get_example : Copying: hg38.genome.back
    + |-- 11:41-INFO-get_example : Copying: mini_real.gtf.gz
    + |-- 11:41-INFO-get_example : Copying: mini_real_control_1.txt
    + |-- 11:41-INFO-get_example : Copying: mini_real_counts_ENCFF630HEX.txt
    + |-- 11:41-INFO-get_example : Copying: mini_real_gn_list_hg38.txt
    + |-- 11:41-INFO-get_example : Copying: mini_real_noov_rnd_tx.gtf.gz
    + |-- 11:41-INFO-get_example : Copying: tx_classes.txt
     

    Although we could work on the full dataset, we will focus on transcripts whose promoter region do not overlaps with any transcript from another gene.

    @@ -3101,24 +3102,24 @@

    mk_matrix
    $ gtftk get_example -f '*' -d mini_real
    - |-- 13:01-INFO-get_example : Copying: #H3K4me3_cond_1.bed#
    - |-- 13:01-INFO-get_example : Copying: airway_love.txt.gz
    - |-- 13:01-INFO-get_example : Copying: ENCFF112BHN_H3K4me3_K562_sub.bed
    - |-- 13:01-INFO-get_example : Copying: ENCFF119BYM_H3K36me3_K562_sub.bed
    - |-- 13:01-INFO-get_example : Copying: ENCFF431HAA_H3K36me3_K562_sub.bw
    - |-- 13:01-INFO-get_example : Copying: ENCFF742FDS_H3K4me3_K562_sub.bw
    - |-- 13:01-INFO-get_example : Copying: ENCFF947DVY_H3K79me2_K562_sub.bw
    - |-- 13:01-INFO-get_example : Copying: H3K4me3_cond_1.bed
    - |-- 13:01-INFO-get_example : Copying: H3K4me3_cond_2.bed
    - |-- 13:01-INFO-get_example : Copying: H3K4me3_cond_3.bed
    - |-- 13:01-INFO-get_example : Copying: hg38.genome
    - |-- 13:01-INFO-get_example : Copying: hg38.genome.back
    - |-- 13:01-INFO-get_example : Copying: mini_real.gtf.gz
    - |-- 13:01-INFO-get_example : Copying: mini_real_control_1.txt
    - |-- 13:01-INFO-get_example : Copying: mini_real_counts_ENCFF630HEX.txt
    - |-- 13:01-INFO-get_example : Copying: mini_real_gn_list_hg38.txt
    - |-- 13:01-INFO-get_example : Copying: mini_real_noov_rnd_tx.gtf.gz
    - |-- 13:01-INFO-get_example : Copying: tx_classes.txt
    + |-- 11:41-INFO-get_example : Copying: #H3K4me3_cond_1.bed#
    + |-- 11:41-INFO-get_example : Copying: airway_love.txt.gz
    + |-- 11:41-INFO-get_example : Copying: ENCFF112BHN_H3K4me3_K562_sub.bed
    + |-- 11:41-INFO-get_example : Copying: ENCFF119BYM_H3K36me3_K562_sub.bed
    + |-- 11:41-INFO-get_example : Copying: ENCFF431HAA_H3K36me3_K562_sub.bw
    + |-- 11:41-INFO-get_example : Copying: ENCFF742FDS_H3K4me3_K562_sub.bw
    + |-- 11:41-INFO-get_example : Copying: ENCFF947DVY_H3K79me2_K562_sub.bw
    + |-- 11:41-INFO-get_example : Copying: H3K4me3_cond_1.bed
    + |-- 11:41-INFO-get_example : Copying: H3K4me3_cond_2.bed
    + |-- 11:41-INFO-get_example : Copying: H3K4me3_cond_3.bed
    + |-- 11:41-INFO-get_example : Copying: hg38.genome
    + |-- 11:41-INFO-get_example : Copying: hg38.genome.back
    + |-- 11:41-INFO-get_example : Copying: mini_real.gtf.gz
    + |-- 11:41-INFO-get_example : Copying: mini_real_control_1.txt
    + |-- 11:41-INFO-get_example : Copying: mini_real_counts_ENCFF630HEX.txt
    + |-- 11:41-INFO-get_example : Copying: mini_real_gn_list_hg38.txt
    + |-- 11:41-INFO-get_example : Copying: mini_real_noov_rnd_tx.gtf.gz
    + |-- 11:41-INFO-get_example : Copying: tx_classes.txt
     

    $ gtftk mk_matrix -k 5 -i mini_real_noov_rnd_tx.gtf.gz -d 5000 -u 5000 -w 200 -c hg38.genome  -l  H3K4me3,H3K79me,H3K36me3 ENCFF742FDS_H3K4me3_K562_sub.bw ENCFF947DVY_H3K79me2_K562_sub.bw ENCFF431HAA_H3K36me3_K562_sub.bw -o mini_real_promoter
    @@ -3130,38 +3131,42 @@ 

    mk_matrix
    $ gtftk mk_matrix -k 5 -i mini_real_noov_rnd_tx.gtf.gz -t transcript  -d 5000 -u 5000 -w 200 -c hg38.genome  -l  H3K4me3,H3K79me,H3K36me3 ENCFF742FDS_H3K4me3_K562_sub.bw ENCFF947DVY_H3K79me2_K562_sub.bw ENCFF431HAA_H3K36me3_K562_sub.bw -o mini_real_tx
    - |-- 13:02-WARNING-mk_matrix : Encountered regions shorter than bin number.
    - |-- 13:02-WARNING-mk_matrix : ENST00000612829 has length : 85
    - |-- 13:02-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    - |-- 13:02-WARNING-mk_matrix : Filter them out please.
    - |-- 13:02-WARNING-mk_matrix : Encountered regions shorter than bin number.
    - |-- 13:02-WARNING-mk_matrix : ENST00000385018 has length : 82
    - |-- 13:02-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    - |-- 13:02-WARNING-mk_matrix : Filter them out please.
    - |-- 13:02-WARNING-mk_matrix : Encountered regions shorter than bin number.
    - |-- 13:02-WARNING-mk_matrix : ENST00000583764 has length : 85
    - |-- 13:02-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    - |-- 13:02-WARNING-mk_matrix : Filter them out please.
    + |-- 11:42-WARNING-mk_matrix : Encountered regions shorter than bin number.
    + |-- 11:42-WARNING-mk_matrix : ENST00000612829 has length : 85
    + |-- 11:42-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    + |-- 11:42-WARNING-mk_matrix : Filter them out please.
    + |-- 11:42-WARNING-mk_matrix : Encountered regions shorter than bin number.
    + |-- 11:42-WARNING-mk_matrix : ENST00000385018 has length : 82
    + |-- 11:42-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    + |-- 11:42-WARNING-mk_matrix : Filter them out please.
    + |-- 11:42-WARNING-mk_matrix : Encountered regions shorter than bin number.
    + |-- 11:42-WARNING-mk_matrix : ENST00000583764 has length : 85
    + |-- 11:42-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    + |-- 11:42-WARNING-mk_matrix : Filter them out please.
    + |-- 11:42-WARNING-mk_matrix : Encountered regions shorter than bin number.
    + |-- 11:42-WARNING-mk_matrix : ENST00000637495 has length : 68
    + |-- 11:42-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    + |-- 11:42-WARNING-mk_matrix : Filter them out please.
     

    Along the whole transcript but increasing the number of windows dedicated to upstream and downstream regions.

    $ gtftk mk_matrix -k 5 --bin-around-frac 0.5 -i mini_real_noov_rnd_tx.gtf.gz -t transcript  -d 5000 -u 5000 -w 200 -c hg38.genome  -l  H3K4me3,H3K79me,H3K36me3 ENCFF742FDS_H3K4me3_K562_sub.bw ENCFF947DVY_H3K79me2_K562_sub.bw ENCFF431HAA_H3K36me3_K562_sub.bw -o mini_real_tx_2
    - |-- 13:03-WARNING-mk_matrix : Encountered regions shorter than bin number.
    - |-- 13:03-WARNING-mk_matrix : ENST00000612829 has length : 85
    - |-- 13:03-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    - |-- 13:03-WARNING-mk_matrix : Filter them out please.
    - |-- 13:03-WARNING-mk_matrix : Encountered regions shorter than bin number.
    - |-- 13:03-WARNING-mk_matrix : ENST00000385018 has length : 82
    - |-- 13:03-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    - |-- 13:03-WARNING-mk_matrix : Filter them out please.
    - |-- 13:03-WARNING-mk_matrix : Encountered regions shorter than bin number.
    - |-- 13:03-WARNING-mk_matrix : ENST00000583764 has length : 85
    - |-- 13:03-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    - |-- 13:03-WARNING-mk_matrix : Filter them out please.
    - |-- 13:03-WARNING-mk_matrix : Encountered regions shorter than bin number.
    - |-- 13:03-WARNING-mk_matrix : ENST00000637495 has length : 68
    - |-- 13:03-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    - |-- 13:03-WARNING-mk_matrix : Filter them out please.
    + |-- 11:43-WARNING-mk_matrix : Encountered regions shorter than bin number.
    + |-- 11:43-WARNING-mk_matrix : ENST00000612829 has length : 85
    + |-- 11:43-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    + |-- 11:43-WARNING-mk_matrix : Filter them out please.
    + |-- 11:43-WARNING-mk_matrix : Encountered regions shorter than bin number.
    + |-- 11:43-WARNING-mk_matrix : ENST00000385018 has length : 82
    + |-- 11:43-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    + |-- 11:43-WARNING-mk_matrix : Filter them out please.
    + |-- 11:43-WARNING-mk_matrix : Encountered regions shorter than bin number.
    + |-- 11:43-WARNING-mk_matrix : ENST00000583764 has length : 85
    + |-- 11:43-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    + |-- 11:43-WARNING-mk_matrix : Filter them out please.
    + |-- 11:43-WARNING-mk_matrix : Encountered regions shorter than bin number.
    + |-- 11:43-WARNING-mk_matrix : ENST00000637495 has length : 68
    + |-- 11:43-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    + |-- 11:43-WARNING-mk_matrix : Filter them out please.
     

    Along a user defined set of regions (in bed6 format). Here we will used the transcript coordinates in bed format as an example.

    @@ -3169,22 +3174,22 @@

    mk_matrix
    $ gtftk mk_matrix -k 5 --bin-around-frac 0.5 -i mini_real_rnd_tx.bed -t user_regions  -d 5000 -u 5000 -w 200 -c hg38.genome  -l  H3K4me3,H3K79me,H3K36me3 ENCFF742FDS_H3K4me3_K562_sub.bw ENCFF947DVY_H3K79me2_K562_sub.bw ENCFF431HAA_H3K36me3_K562_sub.bw -o mini_real_user_def
    - |-- 13:04-WARNING-mk_matrix : Encountered regions shorter than bin number.
    - |-- 13:04-WARNING-mk_matrix : ENSG00000187514|ENST00000612829 has length : 85
    - |-- 13:04-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    - |-- 13:04-WARNING-mk_matrix : Filter them out please.
    - |-- 13:04-WARNING-mk_matrix : Encountered regions shorter than bin number.
    - |-- 13:04-WARNING-mk_matrix : ENSG00000207751|ENST00000385018 has length : 82
    - |-- 13:04-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    - |-- 13:04-WARNING-mk_matrix : Filter them out please.
    - |-- 13:04-WARNING-mk_matrix : Encountered regions shorter than bin number.
    - |-- 13:04-WARNING-mk_matrix : ENSG00000110717|ENST00000583764 has length : 85
    - |-- 13:04-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    - |-- 13:04-WARNING-mk_matrix : Filter them out please.
    - |-- 13:04-WARNING-mk_matrix : Encountered regions shorter than bin number.
    - |-- 13:04-WARNING-mk_matrix : ENSG00000148120|ENST00000637495 has length : 68
    - |-- 13:04-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    - |-- 13:04-WARNING-mk_matrix : Filter them out please.
    + |-- 11:45-WARNING-mk_matrix : Encountered regions shorter than bin number.
    + |-- 11:45-WARNING-mk_matrix : ENSG00000187514|ENST00000612829 has length : 85
    + |-- 11:45-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    + |-- 11:45-WARNING-mk_matrix : Filter them out please.
    + |-- 11:44-WARNING-mk_matrix : Encountered regions shorter than bin number.
    + |-- 11:44-WARNING-mk_matrix : ENSG00000207751|ENST00000385018 has length : 82
    + |-- 11:44-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    + |-- 11:44-WARNING-mk_matrix : Filter them out please.
    + |-- 11:45-WARNING-mk_matrix : Encountered regions shorter than bin number.
    + |-- 11:45-WARNING-mk_matrix : ENSG00000110717|ENST00000583764 has length : 85
    + |-- 11:45-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    + |-- 11:45-WARNING-mk_matrix : Filter them out please.
    + |-- 11:45-WARNING-mk_matrix : Encountered regions shorter than bin number.
    + |-- 11:45-WARNING-mk_matrix : ENSG00000148120|ENST00000637495 has length : 68
    + |-- 11:45-WARNING-mk_matrix : They will be set to NA or --pseudo-count depending on --zero-to-na.
    + |-- 11:45-WARNING-mk_matrix : Filter them out please.
     

    And finally using a set of single nucleotides coordinates that will be extend (-u/-d) and assessed for coverage. Here we will take the coordinates of TSS as example.

    @@ -3203,132 +3208,132 @@

    profile
    $ gtftk profile -D -i mini_real_promoter.zip -o profile_prom -pf png -if example_01.png
    - |-- 13:05-WARNING-profile : --group-by not set. Choosing 'bwig'.
    + |-- 11:46-WARNING-profile : --group-by not set. Choosing 'bwig'.
     
    example_01.png

    The same diagram is obtained if a bed file pointing to TSS was provided to mk_matrix and used in single_nuc mode.

    $ gtftk profile -i mini_real_single_nuc.zip -o profile_prom -pf png -if example_01a.png
    - |-- 13:05-WARNING-profile : --group-by not set. Choosing 'bwig'.
    + |-- 11:46-WARNING-profile : --group-by not set. Choosing 'bwig'.
     
    example_01a.png

    Changing colors and applying color order can be done using the following syntax:

    $ gtftk profile -D -i mini_real_promoter.zip -c 'red,blue,violet' -d H3K79me,H3K4me3,H3K36me3 -o profile_prom -pf png -if example_01b.png
    - |-- 13:06-WARNING-profile : --group-by not set. Choosing 'bwig'.
    + |-- 11:46-WARNING-profile : --group-by not set. Choosing 'bwig'.
     
    example_01b.png

    A subset of bigwig assessed for coverage can be selected for plotting. This is achieved using the –subset-bwig argument:

    $ gtftk profile -f bwig -g tx_classes -D -i mini_real_tx.zip  -fo  -o profile_tx -pf png -if example_01c.png  -fo -c 'red' -V 2  -w  -tl -e -lw 0.5 -u H3K4me3
    - |-- 13:06-DEBUG-profile : Using pandas version 0.23.4
    - |-- 13:06-DEBUG-profile : Pandas location /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pandas/__init__.py
    - |-- 13:06-DEBUG-profile : Using numpy version 1.13.3
    - |-- 13:06-DEBUG-profile : Pandas numpy /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/numpy/__init__.py
    - |-- 13:06-DEBUG-profile : Using plotnine version 0.4.0
    - |-- 13:06-DEBUG-profile : Pandas plotnine /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/plotnine/__init__.py
    - |-- 13:06-DEBUG-profile : Uncompressing : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_1xvoz2cs
    - |-- 13:06-DEBUG-profile : Reading : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_1xvoz2cs/mini_real_tx
    - |-- 13:06-INFO-profile : Getting configuration info from input file.
    - |-- 13:06-DEBUG-profile : Color order :['All transcripts']
    - |-- 13:06-DEBUG-profile : Profile color :['red']
    - |-- 13:06-INFO-profile : Searching coverage columns.
    - |-- 13:06-INFO-profile : Melting.
    - |-- 13:06-INFO-profile : Ceiling
    - |-- 13:06-INFO-profile : Zero value detected. Adding a pseudocount (+1) before log transformation.
    - |-- 13:06-INFO-profile : Converting to log2.
    - |-- 13:06-INFO-profile : Computing column ordering.
    - |-- 13:06-INFO-profile : Preparing diagram
    - |-- 13:06-INFO-profile : Theming and ordering. Please be patient...
    - |-- 13:06-INFO-profile : Preparing x axis
    - |-- 13:06-INFO-profile : facet_col 1
    - |-- 13:06-INFO-profile : Highlighting upstream regions
    - |-- 13:06-INFO-profile : Page width set to 4
    - |-- 13:06-INFO-profile : Page height set to 2.0
    - |-- 13:06-INFO-profile : Saving diagram to file : example_01c.png
    - |-- 13:06-INFO-profile : Be patient. This may be long for large datasets.
    + |-- 11:46-DEBUG-profile : Using pandas version 0.23.4
    + |-- 11:46-DEBUG-profile : Pandas location /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pandas/__init__.py
    + |-- 11:46-DEBUG-profile : Using numpy version 1.13.3
    + |-- 11:46-DEBUG-profile : Pandas numpy /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/numpy/__init__.py
    + |-- 11:46-DEBUG-profile : Using plotnine version 0.4.0
    + |-- 11:46-DEBUG-profile : Pandas plotnine /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/plotnine/__init__.py
    + |-- 11:46-DEBUG-profile : Uncompressing : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_jbh1ifex
    + |-- 11:46-DEBUG-profile : Reading : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_jbh1ifex/mini_real_tx
    + |-- 11:46-INFO-profile : Getting configuration info from input file.
    + |-- 11:46-DEBUG-profile : Color order :['All transcripts']
    + |-- 11:46-DEBUG-profile : Profile color :['red']
    + |-- 11:46-INFO-profile : Searching coverage columns.
    + |-- 11:46-INFO-profile : Melting.
    + |-- 11:46-INFO-profile : Ceiling
    + |-- 11:46-INFO-profile : Zero value detected. Adding a pseudocount (+1) before log transformation.
    + |-- 11:46-INFO-profile : Converting to log2.
    + |-- 11:46-INFO-profile : Computing column ordering.
    + |-- 11:46-INFO-profile : Preparing diagram
    + |-- 11:46-INFO-profile : Theming and ordering. Please be patient...
    + |-- 11:46-INFO-profile : Preparing x axis
    + |-- 11:46-INFO-profile : facet_col 1
    + |-- 11:46-INFO-profile : Highlighting upstream regions
    + |-- 11:46-INFO-profile : Page width set to 4
    + |-- 11:46-INFO-profile : Page height set to 2.0
    + |-- 11:46-INFO-profile : Saving diagram to file : example_01c.png
    + |-- 11:46-INFO-profile : Be patient. This may be long for large datasets.
     
    example_01c.png

    Transcript coverage is obtained using the mini_real_tx.zip matrix. This provides a simple overlayed profile of all epigenetic marks along the transcript body extended in 5’ and 3’ regions:

    $ gtftk profile -D -i mini_real_tx.zip -o profile_tx -pf png -if example_02.png
    - |-- 13:06-WARNING-profile : --group-by not set. Choosing 'bwig'.
    + |-- 11:46-WARNING-profile : --group-by not set. Choosing 'bwig'.
     
    example_02.png

    Almost the same but increasing the bins dedicated to upstream and dowstream regions (see —bin-around-frac argument of *mk_matrix).

    $ gtftk profile -D -i mini_real_tx_2.zip -o profile_tx -pf png -if example_03.png
    - |-- 13:06-WARNING-profile : --group-by not set. Choosing 'bwig'.
    + |-- 11:46-WARNING-profile : --group-by not set. Choosing 'bwig'.
     
    example_03.png

    Note that the same is obtained when using user-defined regions (i.e when providing a bed as input corresponding to transcript coordinates).

    $ gtftk profile -D -i mini_real_user_def.zip -o profile_udef_4  -pf png -if example_04.png
    - |-- 13:06-WARNING-profile : --group-by not set. Choosing 'bwig'.
    + |-- 11:47-WARNING-profile : --group-by not set. Choosing 'bwig'.
     
    example_04.png

    The same dataset used for plotting but adding a normalization step (ranging). When using ranging normalization, values are expressed as a percentage of the range between max and min value.

    $ gtftk profile -D -nm ranging -i mini_real_user_def.zip -o profile_udef_5  -pf png -if example_04b.png
    - |-- 13:06-WARNING-profile : --group-by not set. Choosing 'bwig'.
    + |-- 11:47-WARNING-profile : --group-by not set. Choosing 'bwig'.
     
    example_04b.png

    Two examples using statistic ‘max’ and 2 differents values of ‘–upper-limit’.

    $ gtftk profile -D -i mini_real_promoter.zip -o profile_prom -pf png -if example_04_max_a.png  -V 2 -lw 1 -at 5 -s max -ul 1
    - |-- 13:06-DEBUG-profile : Using pandas version 0.23.4
    - |-- 13:06-DEBUG-profile : Pandas location /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pandas/__init__.py
    - |-- 13:06-DEBUG-profile : Using numpy version 1.13.3
    - |-- 13:06-DEBUG-profile : Pandas numpy /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/numpy/__init__.py
    - |-- 13:06-DEBUG-profile : Using plotnine version 0.4.0
    - |-- 13:06-DEBUG-profile : Pandas plotnine /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/plotnine/__init__.py
    - |-- 13:06-DEBUG-profile : Uncompressing : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_qdroqb06
    - |-- 13:06-DEBUG-profile : Reading : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_qdroqb06/mini_real_promoter
    - |-- 13:06-INFO-profile : Getting configuration info from input file.
    - |-- 13:06-WARNING-profile : --group-by not set. Choosing 'bwig'.
    - |-- 13:06-DEBUG-profile : Color order :['H3K79me', 'H3K36me3', 'H3K4me3']
    - |-- 13:06-DEBUG-profile : Profile color :['#000000', '#00bb00', '#cccccc']
    - |-- 13:06-INFO-profile : Searching coverage columns.
    - |-- 13:06-INFO-profile : Melting.
    - |-- 13:06-INFO-profile : Computing column ordering.
    - |-- 13:06-INFO-profile : Preparing diagram
    - |-- 13:06-INFO-profile : Theming and ordering. Please be patient...
    - |-- 13:06-INFO-profile : Preparing x axis
    - |-- 13:06-INFO-profile : facet_col 1
    - |-- 13:06-INFO-profile : Page width set to 3
    - |-- 13:06-INFO-profile : Page height set to 2
    - |-- 13:06-INFO-profile : Saving diagram to file : example_04_max_a.png
    - |-- 13:06-INFO-profile : Be patient. This may be long for large datasets.
    + |-- 11:47-DEBUG-profile : Using pandas version 0.23.4
    + |-- 11:47-DEBUG-profile : Pandas location /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pandas/__init__.py
    + |-- 11:47-DEBUG-profile : Using numpy version 1.13.3
    + |-- 11:47-DEBUG-profile : Pandas numpy /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/numpy/__init__.py
    + |-- 11:47-DEBUG-profile : Using plotnine version 0.4.0
    + |-- 11:47-DEBUG-profile : Pandas plotnine /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/plotnine/__init__.py
    + |-- 11:47-DEBUG-profile : Uncompressing : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_is7wskbl
    + |-- 11:47-DEBUG-profile : Reading : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_is7wskbl/mini_real_promoter
    + |-- 11:47-INFO-profile : Getting configuration info from input file.
    + |-- 11:47-WARNING-profile : --group-by not set. Choosing 'bwig'.
    + |-- 11:47-DEBUG-profile : Color order :['H3K79me', 'H3K4me3', 'H3K36me3']
    + |-- 11:47-DEBUG-profile : Profile color :['#000000', '#00bb00', '#cccccc']
    + |-- 11:47-INFO-profile : Searching coverage columns.
    + |-- 11:47-INFO-profile : Melting.
    + |-- 11:47-INFO-profile : Computing column ordering.
    + |-- 11:47-INFO-profile : Preparing diagram
    + |-- 11:47-INFO-profile : Theming and ordering. Please be patient...
    + |-- 11:47-INFO-profile : Preparing x axis
    + |-- 11:47-INFO-profile : facet_col 1
    + |-- 11:47-INFO-profile : Page width set to 3
    + |-- 11:47-INFO-profile : Page height set to 2
    + |-- 11:47-INFO-profile : Saving diagram to file : example_04_max_a.png
    + |-- 11:47-INFO-profile : Be patient. This may be long for large datasets.
     
    example_04_max_a.png
    $ gtftk profile -D -i mini_real_promoter.zip -o profile_prom -pf png -if example_04_max_b.png  -V 2 -lw 1 -at 5 -s max -ul 0.99
    - |-- 13:06-DEBUG-profile : Using pandas version 0.23.4
    - |-- 13:06-DEBUG-profile : Pandas location /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pandas/__init__.py
    - |-- 13:06-DEBUG-profile : Using numpy version 1.13.3
    - |-- 13:06-DEBUG-profile : Pandas numpy /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/numpy/__init__.py
    - |-- 13:06-DEBUG-profile : Using plotnine version 0.4.0
    - |-- 13:06-DEBUG-profile : Pandas plotnine /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/plotnine/__init__.py
    - |-- 13:06-DEBUG-profile : Uncompressing : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_8pslynl6
    - |-- 13:06-DEBUG-profile : Reading : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_8pslynl6/mini_real_promoter
    - |-- 13:06-INFO-profile : Getting configuration info from input file.
    - |-- 13:06-WARNING-profile : --group-by not set. Choosing 'bwig'.
    - |-- 13:06-DEBUG-profile : Color order :['H3K4me3', 'H3K36me3', 'H3K79me']
    - |-- 13:06-DEBUG-profile : Profile color :['#000000', '#00bb00', '#cccccc']
    - |-- 13:06-INFO-profile : Searching coverage columns.
    - |-- 13:06-INFO-profile : Melting.
    - |-- 13:06-INFO-profile : Ceiling
    - |-- 13:06-INFO-profile : Computing column ordering.
    - |-- 13:06-INFO-profile : Preparing diagram
    - |-- 13:06-INFO-profile : Theming and ordering. Please be patient...
    - |-- 13:06-INFO-profile : Preparing x axis
    - |-- 13:06-INFO-profile : facet_col 1
    - |-- 13:06-INFO-profile : Page width set to 3
    - |-- 13:06-INFO-profile : Page height set to 2
    - |-- 13:06-INFO-profile : Saving diagram to file : example_04_max_b.png
    - |-- 13:06-INFO-profile : Be patient. This may be long for large datasets.
    + |-- 11:47-DEBUG-profile : Using pandas version 0.23.4
    + |-- 11:47-DEBUG-profile : Pandas location /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pandas/__init__.py
    + |-- 11:47-DEBUG-profile : Using numpy version 1.13.3
    + |-- 11:47-DEBUG-profile : Pandas numpy /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/numpy/__init__.py
    + |-- 11:47-DEBUG-profile : Using plotnine version 0.4.0
    + |-- 11:47-DEBUG-profile : Pandas plotnine /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/plotnine/__init__.py
    + |-- 11:47-DEBUG-profile : Uncompressing : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_ogporq3f
    + |-- 11:47-DEBUG-profile : Reading : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_ogporq3f/mini_real_promoter
    + |-- 11:47-INFO-profile : Getting configuration info from input file.
    + |-- 11:47-WARNING-profile : --group-by not set. Choosing 'bwig'.
    + |-- 11:47-DEBUG-profile : Color order :['H3K36me3', 'H3K4me3', 'H3K79me']
    + |-- 11:47-DEBUG-profile : Profile color :['#000000', '#00bb00', '#cccccc']
    + |-- 11:47-INFO-profile : Searching coverage columns.
    + |-- 11:47-INFO-profile : Melting.
    + |-- 11:47-INFO-profile : Ceiling
    + |-- 11:47-INFO-profile : Computing column ordering.
    + |-- 11:47-INFO-profile : Preparing diagram
    + |-- 11:47-INFO-profile : Theming and ordering. Please be patient...
    + |-- 11:47-INFO-profile : Preparing x axis
    + |-- 11:47-INFO-profile : facet_col 1
    + |-- 11:47-INFO-profile : Page width set to 3
    + |-- 11:47-INFO-profile : Page height set to 2
    + |-- 11:47-INFO-profile : Saving diagram to file : example_04_max_b.png
    + |-- 11:47-INFO-profile : Be patient. This may be long for large datasets.
     
    example_04_max_b.png @@ -3336,94 +3341,94 @@

    profile
    $ gtftk profile -D -i mini_real_promoter.zip -f tx_classes -g bwig -fo -t tx_classes.txt -o profile_prom  -pf png -if example_05.png -e -V 2 -fc 2
    - |-- 13:06-DEBUG-profile : Using pandas version 0.23.4
    - |-- 13:06-DEBUG-profile : Pandas location /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pandas/__init__.py
    - |-- 13:06-DEBUG-profile : Using numpy version 1.13.3
    - |-- 13:06-DEBUG-profile : Pandas numpy /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/numpy/__init__.py
    - |-- 13:06-DEBUG-profile : Using plotnine version 0.4.0
    - |-- 13:06-DEBUG-profile : Pandas plotnine /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/plotnine/__init__.py
    - |-- 13:06-DEBUG-profile : Uncompressing : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_uymw1n8g
    - |-- 13:06-DEBUG-profile : Reading : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_uymw1n8g/mini_real_promoter
    - |-- 13:06-INFO-profile : Getting configuration info from input file.
    - |-- 13:06-INFO-profile : Reading transcript file.
    - |-- 13:06-INFO-profile : Deleting duplicates in transcript-file.
    - |-- 13:06-INFO-profile : Checking how many genes where found in the transcript list.
    - |-- 13:06-INFO-profile : Keeping 804 transcript out of 833.
    - |-- 13:06-DEBUG-profile : Color order :['H3K79me', 'H3K36me3', 'H3K4me3']
    - |-- 13:06-DEBUG-profile : Profile color :['#000000', '#00bb00', '#cccccc']
    - |-- 13:06-INFO-profile : Searching coverage columns.
    - |-- 13:06-INFO-profile : Melting.
    - |-- 13:06-INFO-profile : Ceiling
    - |-- 13:06-INFO-profile : Computing column ordering.
    - |-- 13:06-INFO-profile : Preparing diagram
    - |-- 13:06-INFO-profile : Theming and ordering. Please be patient...
    - |-- 13:06-INFO-profile : Preparing x axis
    - |-- 13:06-INFO-profile : facet_col 2
    - |-- 13:06-INFO-profile : Page width set to 6
    - |-- 13:06-INFO-profile : Page height set to 5.0
    - |-- 13:06-INFO-profile : Saving diagram to file : example_05.png
    - |-- 13:06-INFO-profile : Be patient. This may be long for large datasets.
    + |-- 11:47-DEBUG-profile : Using pandas version 0.23.4
    + |-- 11:47-DEBUG-profile : Pandas location /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pandas/__init__.py
    + |-- 11:47-DEBUG-profile : Using numpy version 1.13.3
    + |-- 11:47-DEBUG-profile : Pandas numpy /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/numpy/__init__.py
    + |-- 11:47-DEBUG-profile : Using plotnine version 0.4.0
    + |-- 11:47-DEBUG-profile : Pandas plotnine /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/plotnine/__init__.py
    + |-- 11:47-DEBUG-profile : Uncompressing : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_bk158xze
    + |-- 11:47-DEBUG-profile : Reading : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_bk158xze/mini_real_promoter
    + |-- 11:47-INFO-profile : Getting configuration info from input file.
    + |-- 11:47-INFO-profile : Reading transcript file.
    + |-- 11:47-INFO-profile : Deleting duplicates in transcript-file.
    + |-- 11:47-INFO-profile : Checking how many genes where found in the transcript list.
    + |-- 11:47-INFO-profile : Keeping 804 transcript out of 833.
    + |-- 11:47-DEBUG-profile : Color order :['H3K79me', 'H3K4me3', 'H3K36me3']
    + |-- 11:47-DEBUG-profile : Profile color :['#000000', '#00bb00', '#cccccc']
    + |-- 11:47-INFO-profile : Searching coverage columns.
    + |-- 11:47-INFO-profile : Melting.
    + |-- 11:47-INFO-profile : Ceiling
    + |-- 11:47-INFO-profile : Computing column ordering.
    + |-- 11:47-INFO-profile : Preparing diagram
    + |-- 11:47-INFO-profile : Theming and ordering. Please be patient...
    + |-- 11:47-INFO-profile : Preparing x axis
    + |-- 11:47-INFO-profile : facet_col 2
    + |-- 11:47-INFO-profile : Page width set to 6
    + |-- 11:47-INFO-profile : Page height set to 5.0
    + |-- 11:47-INFO-profile : Saving diagram to file : example_05.png
    + |-- 11:47-INFO-profile : Be patient. This may be long for large datasets.
     
    example_05.png

    Alternatively, the groups can be set to chromosomes or transcript classes:

    $ gtftk profile -D -i mini_real_promoter.zip -g tx_classes -f bwig -fo -t tx_classes.txt -o profile_prom  -pf png -if example_06.png -V 2 -nm ranging
    - |-- 13:06-DEBUG-profile : Using pandas version 0.23.4
    - |-- 13:06-DEBUG-profile : Pandas location /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pandas/__init__.py
    - |-- 13:06-DEBUG-profile : Using numpy version 1.13.3
    - |-- 13:06-DEBUG-profile : Pandas numpy /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/numpy/__init__.py
    - |-- 13:06-DEBUG-profile : Using plotnine version 0.4.0
    - |-- 13:06-DEBUG-profile : Pandas plotnine /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/plotnine/__init__.py
    - |-- 13:06-DEBUG-profile : Uncompressing : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_c7b7_tvf
    - |-- 13:06-DEBUG-profile : Reading : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_c7b7_tvf/mini_real_promoter
    - |-- 13:06-INFO-profile : Getting configuration info from input file.
    - |-- 13:06-INFO-profile : Reading transcript file.
    - |-- 13:06-INFO-profile : Deleting duplicates in transcript-file.
    - |-- 13:06-INFO-profile : Checking how many genes where found in the transcript list.
    - |-- 13:06-INFO-profile : Keeping 804 transcript out of 833.
    - |-- 13:06-DEBUG-profile : Color order :['protein_coding', 'antisense', 'lincRNA']
    - |-- 13:06-DEBUG-profile : Profile color :['#000000', '#00bb00', '#cccccc']
    - |-- 13:06-INFO-profile : Searching coverage columns.
    - |-- 13:06-INFO-profile : Melting.
    - |-- 13:06-INFO-profile : Ceiling
    - |-- 13:06-INFO-profile : Normalizing (ranging)
    - |-- 13:06-INFO-profile : Computing column ordering.
    - |-- 13:06-INFO-profile : Preparing diagram
    - |-- 13:06-INFO-profile : Theming and ordering. Please be patient...
    - |-- 13:06-INFO-profile : Preparing x axis
    - |-- 13:06-INFO-profile : facet_col 3
    - |-- 13:06-INFO-profile : Page width set to 9
    - |-- 13:06-INFO-profile : Page height set to 2.0
    - |-- 13:06-INFO-profile : Saving diagram to file : example_06.png
    - |-- 13:06-INFO-profile : Be patient. This may be long for large datasets.
    + |-- 11:47-DEBUG-profile : Using pandas version 0.23.4
    + |-- 11:47-DEBUG-profile : Pandas location /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pandas/__init__.py
    + |-- 11:47-DEBUG-profile : Using numpy version 1.13.3
    + |-- 11:47-DEBUG-profile : Pandas numpy /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/numpy/__init__.py
    + |-- 11:47-DEBUG-profile : Using plotnine version 0.4.0
    + |-- 11:47-DEBUG-profile : Pandas plotnine /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/plotnine/__init__.py
    + |-- 11:47-DEBUG-profile : Uncompressing : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_61rt9cn9
    + |-- 11:47-DEBUG-profile : Reading : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_61rt9cn9/mini_real_promoter
    + |-- 11:47-INFO-profile : Getting configuration info from input file.
    + |-- 11:47-INFO-profile : Reading transcript file.
    + |-- 11:47-INFO-profile : Deleting duplicates in transcript-file.
    + |-- 11:47-INFO-profile : Checking how many genes where found in the transcript list.
    + |-- 11:47-INFO-profile : Keeping 804 transcript out of 833.
    + |-- 11:47-DEBUG-profile : Color order :['protein_coding', 'antisense', 'lincRNA']
    + |-- 11:47-DEBUG-profile : Profile color :['#000000', '#00bb00', '#cccccc']
    + |-- 11:47-INFO-profile : Searching coverage columns.
    + |-- 11:47-INFO-profile : Melting.
    + |-- 11:47-INFO-profile : Ceiling
    + |-- 11:47-INFO-profile : Normalizing (ranging)
    + |-- 11:47-INFO-profile : Computing column ordering.
    + |-- 11:47-INFO-profile : Preparing diagram
    + |-- 11:47-INFO-profile : Theming and ordering. Please be patient...
    + |-- 11:47-INFO-profile : Preparing x axis
    + |-- 11:47-INFO-profile : facet_col 3
    + |-- 11:47-INFO-profile : Page width set to 9
    + |-- 11:47-INFO-profile : Page height set to 2.0
    + |-- 11:47-INFO-profile : Saving diagram to file : example_06.png
    + |-- 11:47-INFO-profile : Be patient. This may be long for large datasets.
     
    example_06.png
    $ gtftk profile -D -i mini_real_promoter.zip -g chrom -f bwig -fo -t tx_classes.txt -o profile_prom  -pf png -if example_06b.png -V 2 -nm ranging
    - |-- 13:06-DEBUG-profile : Using pandas version 0.23.4
    - |-- 13:06-DEBUG-profile : Pandas location /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pandas/__init__.py
    - |-- 13:06-DEBUG-profile : Using numpy version 1.13.3
    - |-- 13:06-DEBUG-profile : Pandas numpy /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/numpy/__init__.py
    - |-- 13:06-DEBUG-profile : Using plotnine version 0.4.0
    - |-- 13:06-DEBUG-profile : Pandas plotnine /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/plotnine/__init__.py
    - |-- 13:06-DEBUG-profile : Uncompressing : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_r558a_vx
    - |-- 13:06-DEBUG-profile : Reading : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_r558a_vx/mini_real_promoter
    - |-- 13:06-INFO-profile : Getting configuration info from input file.
    - |-- 13:06-DEBUG-profile : Color order :['chr10', 'chr19', 'chr21', 'chr1', 'chrX', 'chr12', 'chr7', 'chr15', 'chr4', 'chr16', 'chr3', 'chr5', 'chr2', 'chr8', 'chr20', 'chr11', 'chr13', 'chr9', 'chr6', 'chr18', 'chr14', 'chr17', 'chr22']
    - |-- 13:06-DEBUG-profile : Profile color :['#000000', '#6c007c', '#850096', '#2500a5', '#0000ca', '#0041dd', '#0086dd', '#009fca', '#00aaa1', '#00a76f', '#009c00', '#00bb00', '#00da00', '#00f900', '#88ff00', '#dbf400', '#f7db00', '#ffb500', '#ff6100', '#f60000', '#da0000', '#cc1313', '#cccccc']
    - |-- 13:06-INFO-profile : Searching coverage columns.
    - |-- 13:06-INFO-profile : Melting.
    - |-- 13:06-INFO-profile : Ceiling
    - |-- 13:07-INFO-profile : Normalizing (ranging)
    - |-- 13:07-INFO-profile : Computing column ordering.
    - |-- 13:07-INFO-profile : Preparing diagram
    - |-- 13:07-INFO-profile : Theming and ordering. Please be patient...
    - |-- 13:07-INFO-profile : Preparing x axis
    - |-- 13:07-INFO-profile : facet_col 3
    - |-- 13:07-INFO-profile : Page width set to 9
    - |-- 13:07-INFO-profile : Page height set to 2.0
    - |-- 13:07-INFO-profile : Saving diagram to file : example_06b.png
    - |-- 13:07-INFO-profile : Be patient. This may be long for large datasets.
    + |-- 11:47-DEBUG-profile : Using pandas version 0.23.4
    + |-- 11:47-DEBUG-profile : Pandas location /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/pandas/__init__.py
    + |-- 11:47-DEBUG-profile : Using numpy version 1.13.3
    + |-- 11:47-DEBUG-profile : Pandas numpy /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/numpy/__init__.py
    + |-- 11:47-DEBUG-profile : Using plotnine version 0.4.0
    + |-- 11:47-DEBUG-profile : Pandas plotnine /Users/puthier/miniconda3/envs/pygtftk_py3k/lib/python3.6/site-packages/plotnine/__init__.py
    + |-- 11:47-DEBUG-profile : Uncompressing : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_21k_ugzg
    + |-- 11:47-DEBUG-profile : Reading : /var/folders/nl/stqvvbcn4pg9v65k8kyjv5yh0000gn/T/pygtftk_matrix_21k_ugzg/mini_real_promoter
    + |-- 11:47-INFO-profile : Getting configuration info from input file.
    + |-- 11:47-DEBUG-profile : Color order :['chr20', 'chr7', 'chr19', 'chr12', 'chrX', 'chr2', 'chr10', 'chr6', 'chr21', 'chr22', 'chr11', 'chr3', 'chr9', 'chr18', 'chr16', 'chr17', 'chr14', 'chr1', 'chr15', 'chr5', 'chr8', 'chr13', 'chr4']
    + |-- 11:47-DEBUG-profile : Profile color :['#000000', '#6c007c', '#850096', '#2500a5', '#0000ca', '#0041dd', '#0086dd', '#009fca', '#00aaa1', '#00a76f', '#009c00', '#00bb00', '#00da00', '#00f900', '#88ff00', '#dbf400', '#f7db00', '#ffb500', '#ff6100', '#f60000', '#da0000', '#cc1313', '#cccccc']
    + |-- 11:47-INFO-profile : Searching coverage columns.
    + |-- 11:47-INFO-profile : Melting.
    + |-- 11:47-INFO-profile : Ceiling
    + |-- 11:47-INFO-profile : Normalizing (ranging)
    + |-- 11:48-INFO-profile : Computing column ordering.
    + |-- 11:48-INFO-profile : Preparing diagram
    + |-- 11:48-INFO-profile : Theming and ordering. Please be patient...
    + |-- 11:48-INFO-profile : Preparing x axis
    + |-- 11:48-INFO-profile : facet_col 3
    + |-- 11:48-INFO-profile : Page width set to 9
    + |-- 11:48-INFO-profile : Page height set to 2.0
    + |-- 11:48-INFO-profile : Saving diagram to file : example_06b.png
    + |-- 11:48-INFO-profile : Be patient. This may be long for large datasets.
     
    example_06b.png @@ -3454,7 +3459,7 @@

    profile
    $ gtftk join_attr -i mini_real_noov_rnd_tx.gtf  -j mini_real_counts_ENCFF630HEX.txt  -k gene_name -n counts | gtftk discretize_key -k  counts -n 6 -d count_levels -pu | gtftk tabulate -k transcript_id,count_levels -o tx_exp_classes.txt -Hun
    - |-- 13:09-INFO-discretize_key : Categories: ['(-41.703_183.167]', '(183.167_574.667]', '(574.667_1035.0]', '(1035.0_1647.333]', '(1647.333_3212.667]', '(3212.667_41703.0]']
    + |-- 11:50-INFO-discretize_key : Categories: ['(-41.703_183.167]', '(183.167_574.667]', '(574.667_1035.0]', '(1035.0_1647.333]', '(1647.333_3212.667]', '(3212.667_41703.0]']
     
    @@ -119,7 +119,7 @@

    Navigation

  • modules |
  • - + @@ -87,7 +87,7 @@

    Navigation

  • modules |
  • - +